355e76a4a3
Make it return copied source and insertion separately, so that later implementation of heuristics can use them more flexibly. This does not change the heuristics implemented in diffcore-rename nor diffcore-break in any way. Signed-off-by: Junio C Hamano <junkio@cox.net> Signed-off-by: Linus Torvalds <torvalds@osdl.org>
98 lines
2.5 KiB
C
98 lines
2.5 KiB
C
/*
 * Copyright (C) 2005 Junio C Hamano
 * The delta-parsing part is an almost straight copy of patch-delta.c,
 * which is (C) 2005 Nicolas Pitre <nico@cam.org>.
 */
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <limits.h>
|
|
#include "count-delta.h"
|
|
|
|
/*
 * Decode one size header and advance *datap past it.
 *
 * The header starts with a mask byte.  Going from the least significant
 * mask bit upwards, bit k being set means one more byte follows in the
 * stream, and that byte supplies bits [8k, 8k+7] of the size.  Clear bits
 * contribute zero and consume nothing.
 *
 * datap: in/out cursor into the delta; on return it points just past the
 *        last byte that belongs to this header.
 *
 * Returns the decoded size.  No bounds checking is done here: the caller
 * must make sure the whole header lies inside its buffer.
 */
static unsigned long get_hdr_size(const unsigned char **datap)
{
	const unsigned char *data = *datap;
	unsigned long size = 0;
	unsigned char cmd = *data++;
	unsigned int shift = 0;

	while (cmd) {
		if (cmd & 1) {
			/*
			 * Widen before shifting: a bare "*data << shift" is
			 * evaluated as int, which overflows for shift == 24
			 * with the top bit set and is undefined for shifts
			 * of 32 or more.
			 */
			unsigned long byte = *data++;

			/*
			 * Bytes that cannot fit in unsigned long are still
			 * consumed so the cursor stays in sync, but they
			 * are not folded into the result.
			 */
			if (shift < sizeof(size) * CHAR_BIT)
				size |= byte << shift;
		}
		shift += 8;
		cmd >>= 1;
	}

	*datap = data;
	return size;
}
|
|
|
|
/*
 * NOTE.  We do not _interpret_ the delta fully.  As an approximation, we
 * just count the number of bytes that are copied from the source, and
 * the number of literal data bytes that are inserted.
 *
 * The number of bytes that are _not_ copied from the source is the
 * deletion, and the number of inserted literal bytes is the addition,
 * so the sum of them is the extent of damage.  xdelta can express an
 * edit that copies data inside of the destination which originally came
 * from the source.  We do not count that in the following routine, so
 * we are undercounting the source material that remains in the final
 * output that way.
 */
|
|
/*
 * Return nonzero when a complete size header, as consumed by
 * get_hdr_size() (one mask byte plus one byte per set mask bit),
 * lies entirely inside [data, top).
 */
static int hdr_in_bounds(const unsigned char *data, const unsigned char *top)
{
	unsigned long need = 1;
	unsigned char mask;

	if (data >= top)
		return 0;
	for (mask = *data; mask; mask >>= 1)
		need += mask & 1;
	return need <= (unsigned long)(top - data);
}

/*
 * Walk the commands of a delta and total up the sizes of the
 * copy-from-source commands and of the literal insertions.
 *
 * delta_buf, delta_size: the delta and its length in bytes.
 * src_copied:    receives the summed size of all copy commands that do
 *                not have the 0x40 (copy from destination) bit set.
 * literal_added: receives the summed length of all literal insertions.
 *
 * Returns 0 on success.  Returns -1, without writing to either output,
 * when the delta is shorter than 6 bytes, when a header or command runs
 * past the end of the buffer, or when the total produced size does not
 * match the destination size recorded in the delta header.
 */
int count_delta(void *delta_buf, unsigned long delta_size,
		unsigned long *src_copied, unsigned long *literal_added)
{
	unsigned long copied_from_source = 0, added_literal = 0, out = 0;
	const unsigned char *data, *top;
	unsigned long dst_size;

	/* the smallest delta size possible is 6 bytes */
	if (delta_size < 6)
		return -1;

	data = delta_buf;
	/* offset the typed pointer: arithmetic on void * is a GNU extension */
	top = data + delta_size;

	/* the source size is not needed for counting; just step over it */
	if (!hdr_in_bounds(data, top))
		return -1;
	(void)get_hdr_size(&data);

	if (!hdr_in_bounds(data, top))
		return -1;
	dst_size = get_hdr_size(&data);

	while (data < top) {
		unsigned char cmd = *data++;

		if (cmd & 0x80) {
			unsigned long cp_size = 0;
			unsigned long operands = 0;
			unsigned char bits;

			/*
			 * Each of the low six bits announces one operand
			 * byte (four offset bytes, then two size bytes).
			 * Make sure they are all present before reading.
			 */
			for (bits = cmd & 0x3f; bits; bits >>= 1)
				operands += bits & 1;
			if (operands > (unsigned long)(top - data))
				return -1;

			/* the copy offset does not affect the counts; skip it */
			for (bits = cmd & 0x0f; bits; bits >>= 1)
				data += bits & 1;

			if (cmd & 0x10)
				cp_size = *data++;
			if (cmd & 0x20)
				cp_size |= (unsigned long)*data++ << 8;
			/* an encoded size of zero stands for 0x10000 */
			if (cp_size == 0)
				cp_size = 0x10000;

			/* 0x40 means copy from dst, which is not source material */
			if (!(cmd & 0x40))
				copied_from_source += cp_size;
			out += cp_size;
		} else {
			/* write literal into dst: cmd is the literal length */
			if (cmd > (unsigned long)(top - data))
				return -1;
			added_literal += cmd;
			out += cmd;
			data += cmd;
		}
	}

	/* sanity check */
	if (data != top || out != dst_size)
		return -1;

	*src_copied = copied_from_source;
	*literal_added = added_literal;
	return 0;
}
|