git-commit-vandalism/count-delta.c
Junio C Hamano 355e76a4a3 [PATCH] Tweak count-delta interface
Make it return copied source and insertion separately, so that
later implementation of heuristics can use them more flexibly.

This does not change the heuristics implemented in
diffcore-rename nor diffcore-break in any way.

Signed-off-by: Junio C Hamano <junkio@cox.net>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2005-06-03 11:23:03 -07:00

98 lines
2.5 KiB
C

/*
* Copyright (C) 2005 Junio C Hamano
* The delta-parsing part is almost straight copy of patch-delta.c
* which is (C) 2005 Nicolas Pitre <nico@cam.org>.
*/
#include <stdlib.h>
#include <string.h>
#include <limits.h>
#include "count-delta.h"
/*
 * Decode one variable-length size header and advance *datap past it.
 *
 * The header starts with a mask byte.  Bit N of the mask, when set,
 * means one more byte follows and supplies bits 8N..8N+7 of the
 * result; no byte is stored for a clear bit and those bits read as 0.
 *
 * No bounds check is done here: the caller must make sure the mask
 * byte and one byte per set mask bit are readable.
 */
static unsigned long get_hdr_size(const unsigned char **datap)
{
	const unsigned char *data = *datap;
	unsigned long size = 0;
	unsigned char cmd = *data++;
	unsigned int shift;

	for (shift = 0; cmd; cmd >>= 1, shift += 8) {
		if (!(cmd & 1))
			continue;
		/*
		 * Widen before shifting.  Left alone, the byte is promoted
		 * to int, so a value >= 0x80 shifted by 24 lands in the
		 * sign bit (and sign-extends into a wider unsigned long),
		 * and shifts of 32 or more are undefined.  A byte that
		 * would fall outside unsigned long is consumed but dropped.
		 */
		if (shift < sizeof(size) * CHAR_BIT)
			size |= (unsigned long)*data << shift;
		data++;
	}
	*datap = data;
	return size;
}
/*
 * Return nonzero when the size header starting at p (a mask byte
 * followed by one byte per set mask bit) lies entirely below top.
 */
static int hdr_in_bounds(const unsigned char *p, const unsigned char *top)
{
	unsigned long need = 1;	/* the mask byte itself */
	unsigned char mask;

	if (p >= top)
		return 0;
	for (mask = *p; mask; mask >>= 1)
		need += mask & 1;
	return need <= (unsigned long)(top - p);
}

/*
 * NOTE.  We do not _interpret_ the delta fully.  As an approximation,
 * we just count the number of bytes that are copied from the source,
 * and the number of literal data bytes that are inserted.
 *
 * The number of bytes that are _not_ copied from the source is the
 * deletion, and the number of inserted literal bytes is the addition,
 * so their sum is the extent of damage.  xdelta can express an edit
 * that copies data inside of the destination which originally came
 * from the source.  We do not count that in the following routine, so
 * we are undercounting the source material that remains in the final
 * output that way.
 *
 * Returns 0 and stores the two counts through src_copied and
 * literal_added on success.  Returns -1, leaving both untouched, when
 * the delta is shorter than 6 bytes, when a header or opcode runs past
 * the end of the buffer, or when the opcodes do not produce exactly
 * the destination size announced in the header.
 */
int count_delta(void *delta_buf, unsigned long delta_size,
		unsigned long *src_copied, unsigned long *literal_added)
{
	unsigned long copied_from_source = 0, added_literal = 0, out = 0;
	const unsigned char *data, *top;
	unsigned long dst_size;

	/* the smallest delta size possible is 6 bytes */
	if (delta_size < 6)
		return -1;

	data = delta_buf;
	/* offset the typed pointer; arithmetic on void * is not standard C */
	top = data + delta_size;

	/* the source size is decoded only to step over it */
	if (!hdr_in_bounds(data, top))
		return -1;
	get_hdr_size(&data);
	if (!hdr_in_bounds(data, top))
		return -1;
	dst_size = get_hdr_size(&data);

	while (data < top) {
		unsigned char cmd = *data++;
		unsigned long room = (unsigned long)(top - data);

		if (cmd & 0x80) {
			unsigned long cp_size = 0;
			unsigned long operands = 0;
			unsigned char bits;

			/* one operand byte follows per set bit in 0x01..0x20 */
			for (bits = cmd & 0x3f; bits; bits >>= 1)
				operands += bits & 1;
			if (room < operands)
				return -1;

			/* the copy offset does not affect the counts; skip it */
			for (bits = cmd & 0x0f; bits; bits >>= 1)
				data += bits & 1;

			if (cmd & 0x10)
				cp_size = *data++;
			if (cmd & 0x20)
				cp_size |= (unsigned long)*data++ << 8;
			if (cp_size == 0)
				cp_size = 0x10000;

			/* 0x40 marks a copy from dst, which is not counted */
			if (!(cmd & 0x40))
				copied_from_source += cp_size;
			out += cp_size;
		} else {
			/* write literal into dst */
			if (room < cmd)
				return -1;
			added_literal += cmd;
			out += cmd;
			data += cmd;
		}
	}

	/*
	 * sanity check; the bounds checks above guarantee that the loop
	 * stopped exactly at top, so only the output size is left to verify.
	 */
	if (out != dst_size)
		return -1;

	/* report the two counts separately; callers combine them as needed */
	*src_copied = copied_from_source;
	*literal_added = added_literal;
	return 0;
}