summaryrefslogtreecommitdiffstats
path: root/count-delta.c
blob: dd81e9296591d463a7b06570bc24dc201a836b2e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
/*
 * Copyright (C) 2005 Junio C Hamano
 * The delta-parsing part is almost straight copy of patch-delta.c
 * which is (C) 2005 Nicolas Pitre <nico@cam.org>.
 */
#include <stdlib.h>
#include <string.h>
#include <limits.h>
#include "delta.h"
#include "count-delta.h"

/*
 * Decode one variable-length size header and advance *datap past it.
 *
 * The first byte is a presence mask: bit N set means one byte follows
 * that supplies bits 8*N .. 8*N+7 of the result; absent bytes contribute
 * zero.  A mask of 0 therefore decodes to 0 and consumes a single byte.
 *
 * No bounds checking is done here: the caller must make sure that the
 * whole header (1 + number of set mask bits, at most 9 bytes) is
 * readable.
 */
static unsigned long get_hdr_size(const unsigned char **datap)
{
	const unsigned char *data = *datap;
	unsigned long size = 0;
	unsigned char cmd = *data++;
	unsigned int shift;

	for (shift = 0; cmd; shift += 8, cmd >>= 1) {
		unsigned long byte;

		if (!(cmd & 1))
			continue;
		byte = *data++;
		/*
		 * Widen before shifting: the int-promoted byte would
		 * overflow (and then sign-extend into size) once the
		 * shift reaches 24.  Bytes that would land beyond the
		 * width of unsigned long are still consumed, but are
		 * dropped instead of shifting by >= the type width.
		 */
		if (shift < sizeof(size) * CHAR_BIT)
			size |= byte << shift;
	}
	*datap = data;
	return size;
}

/*
 * Check that the size header starting at data lies entirely below top.
 * The layout mirrors get_hdr_size(): one mask byte followed by one
 * byte per set mask bit.  Returns non-zero when the header fits.
 */
static int hdr_fits(const unsigned char *data, const unsigned char *top)
{
	unsigned long need = 1;
	unsigned char mask;

	if (data >= top)
		return 0;
	for (mask = *data; mask; mask >>= 1)
		need += mask & 1;
	return need <= (unsigned long)(top - data);
}

/*
 * NOTE.  We do not _interpret_ the delta fully.  As an approximation, we
 * just count the number of bytes that are copied from the source, and
 * the number of literal data bytes that are inserted.  The number of
 * bytes that are _not_ copied from the source is the deletion, and the
 * number of inserted literal bytes is the addition, so the sum of them
 * is what we return.  xdelta can express an edit that copies data inside
 * of the destination which originally came from the source.  We do not
 * count that in the following routine, so we are undercounting the
 * source material that remains in the final output that way.
 *
 * delta_buf / delta_size describe the delta to scan; the buffer is only
 * read.  Returns (src_size - bytes copied from source) + literal bytes,
 * computed in unsigned long arithmetic, or UINT_MAX when the delta is
 * shorter than 6 bytes, is truncated in the middle of a header or a
 * command, or does not produce exactly the destination size recorded in
 * its header.
 *
 * NOTE(review): the error value is UINT_MAX, not ULONG_MAX, although the
 * return type is unsigned long; it is kept as-is because callers
 * presumably compare against UINT_MAX -- verify before changing.
 */
unsigned long count_delta(void *delta_buf, unsigned long delta_size)
{
	unsigned long copied_from_source, added_literal;
	const unsigned char *data, *top;
	unsigned char cmd;
	unsigned long src_size, dst_size, out;

	/* the smallest delta size possible is 6 bytes */
	if (delta_size < 6)
		return UINT_MAX;

	data = delta_buf;
	/* do the arithmetic on the byte pointer; void * math is not ISO C */
	top = data + delta_size;

	/* never let get_hdr_size() read beyond the end of the buffer */
	if (!hdr_fits(data, top))
		return UINT_MAX;
	src_size = get_hdr_size(&data);
	if (!hdr_fits(data, top))
		return UINT_MAX;
	dst_size = get_hdr_size(&data);

	added_literal = copied_from_source = out = 0;
	while (data < top) {
		cmd = *data++;
		if (cmd & 0x80) {
			unsigned long cp_size = 0;
			unsigned int operands = 0;
			unsigned char bits;

			/* bits 0-3 flag offset bytes, bits 4-5 size bytes */
			for (bits = cmd & 0x3f; bits; bits >>= 1)
				operands += bits & 1;
			if ((unsigned long)(top - data) < operands)
				return UINT_MAX; /* truncated copy command */

			/* the copy offset is irrelevant for counting; skip it */
			for (bits = cmd & 0x0f; bits; bits >>= 1)
				data += bits & 1;
			if (cmd & 0x10)
				cp_size = *data++;
			if (cmd & 0x20)
				cp_size |= (unsigned long)*data++ << 8;
			/* an encoded size of zero stands for 0x10000 bytes */
			if (cp_size == 0)
				cp_size = 0x10000;

			/* 0x40 marks a copy from dst, which is not counted */
			if (!(cmd & 0x40))
				copied_from_source += cp_size;
			out += cp_size;
		} else {
			/* write literal into dst */
			if ((unsigned long)(top - data) < cmd)
				return UINT_MAX; /* truncated literal run */
			added_literal += cmd;
			out += cmd;
			data += cmd;
		}
	}

	/*
	 * sanity check: the loop above can only finish with data == top,
	 * so what is left to verify is the produced size.
	 */
	if (out != dst_size)
		return UINT_MAX;

	/* delete size is what was _not_ copied from source.
	 * edit size is that and literal additions.
	 */
	return (src_size - copied_from_source) + added_literal;
}