335 lines
		
	
	
		
			7.1 KiB
		
	
	
	
		
			C
		
	
	
			
		
		
	
	
			335 lines
		
	
	
		
			7.1 KiB
		
	
	
	
		
			C
		
	
	
/*
 * diff-delta.c: generate a delta between two buffers
 *
 *  Many parts of this file have been lifted from LibXDiff version 0.10.
 *  http://www.xmailserver.org/xdiff-lib.html
 *
 *  LibXDiff was written by Davide Libenzi <davidel@xmailserver.org>
 *  Copyright (C) 2003	Davide Libenzi
 *
 *  Many mods for GIT usage by Nicolas Pitre <nico@cam.org>, (C) 2005.
 *
 *  This file is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU Lesser General Public
 *  License as published by the Free Software Foundation; either
 *  version 2.1 of the License, or (at your option) any later version.
 *
 *  Use of this within git automatically means that the LGPL
 *  licensing gets turned into GPLv2 within this project.
 */
 | |
| 
 | |
#include <limits.h>
#include <stdlib.h>
#include "delta.h"
 | |
| 
 | |
| 
 | |
/*
 * Size in bytes of the blocks the reference buffer is fingerprinted in.
 * block size: min = 16, max = 64k, power of 2
 */
#define BLK_SIZE 16

/* Smaller of two values.  Each argument may be evaluated twice. */
#define MIN(x, y) ((x) < (y) ? (x) : (y))

/*
 * Multiplicative hash: multiply the value (as unsigned int) by GR_PRIME
 * and keep the top `nbits` bits of the 32-bit product.  `nbits` must be
 * in the range 1..32, otherwise the shift count is out of range.
 */
#define GR_PRIME 0x9e370001U
#define HASH(val, nbits) (((unsigned int)(val) * GR_PRIME) >> (32 - (nbits)))
 | |
| 	
 | |
/* largest prime smaller than 65536 */
#define BASE 65521

/* NMAX is the largest n such that 255n(n+1)/2 + (n+1)(BASE-1) <= 2^32-1 */
#define NMAX 5552

/*
 * Unrolled accumulation steps for adler32().  They update the local sums
 * `s1` and `s2` of the enclosing function.  Each one is a single statement
 * (do/while(0)) with parenthesised arguments, so it is safe after an
 * unbraced `if` and with expression arguments.
 */
#define DO1(buf, i)  do { s1 += (buf)[(i)]; s2 += s1; } while (0)
#define DO2(buf, i)  do { DO1(buf, i); DO1(buf, (i) + 1); } while (0)
#define DO4(buf, i)  do { DO2(buf, i); DO2(buf, (i) + 2); } while (0)
#define DO8(buf, i)  do { DO4(buf, i); DO4(buf, (i) + 4); } while (0)
#define DO16(buf)    do { DO8(buf, 0); DO8(buf, 8); } while (0)

/*
 * Update an Adler-32 style checksum with `len` bytes from `buf`.
 *
 * adler: running checksum to continue from; the low 16 bits seed the byte
 *        sum (s1) and the bits above them seed the sum of sums (s2).
 * buf:   bytes to add.
 * len:   number of bytes; zero or negative leaves the checksum as the
 *        recombined seed halves.
 *
 * Returns (s2 << 16) | s1 with both sums reduced modulo BASE whenever at
 * least one byte was processed.
 */
static unsigned int adler32(unsigned int adler, const unsigned char *buf, int len)
{
	int k;
	unsigned int s1 = adler & 0xffff;
	unsigned int s2 = adler >> 16;

	while (len > 0) {
		/* at most NMAX bytes between reductions so the sums cannot wrap */
		k = len < NMAX ? len : NMAX;
		len -= k;
		while (k >= 16) {
			DO16(buf);
			buf += 16;
			k -= 16;
		}
		while (k > 0) {
			s1 += *buf++;
			s2 += s1;
			k--;
		}
		s1 %= BASE;
		s2 %= BASE;
	}

	return (s2 << 16) | s1;
}
 | |
| 
 | |
/*
 * Return the number of doublings of 1 needed to reach at least `size`,
 * i.e. the smallest `bits` with (1 << bits) >= size.  The result is
 * never 0 (sizes 0, 1 and 2 all yield 1) and never exceeds 32.
 */
static unsigned int hashbits(unsigned int size)
{
	unsigned int nbits = 0;
	unsigned int pow2;

	for (pow2 = 1; pow2 < size && nbits < 32; pow2 <<= 1)
		nbits++;

	return nbits != 0 ? nbits : 1;
}
 | |
| 
 | |
/*
 * Chunk allocator: fixed-size items are carved out of larger malloc'ed
 * chunks that are kept on a singly linked list and released all at once.
 */

/* Header of one chunk; the item storage follows it in the same allocation. */
typedef struct s_chanode {
	struct s_chanode *next;	/* next chunk in the store, or NULL */
	int icurr;		/* bytes of item storage already handed out */
} chanode_t;

typedef struct s_chastore {
	chanode_t *head, *tail;	/* first and last chunk of the list */
	int isize, nsize;	/* item size and item storage per chunk, in bytes */
	chanode_t *ancur;	/* chunk new items are currently carved from */
	chanode_t *sncur;	/* only initialised/reset here; not read in this file */
	int scurr;		/* only initialised/reset here; not read in this file */
} chastore_t;

/*
 * Prepare an empty store handing out items of `isize` bytes, `icount`
 * items per chunk.  No memory is allocated until the first cha_alloc().
 */
static void cha_init(chastore_t *cha, int isize, int icount)
{
	cha->head = cha->tail = NULL;
	cha->isize = isize;
	cha->nsize = icount * isize;
	cha->ancur = cha->sncur = NULL;
	cha->scurr = 0;
}

/*
 * Return storage for one item, or NULL when a new chunk is needed and
 * malloc fails.  The storage is uninitialised and stays valid until
 * cha_free() is called on the store.
 */
static void *cha_alloc(chastore_t *cha)
{
	chanode_t *ancur;
	void *data;

	ancur = cha->ancur;
	if (!ancur || ancur->icurr == cha->nsize) {
		/* no chunk yet, or the current one is full: append a new one */
		ancur = malloc(sizeof(chanode_t) + cha->nsize);
		if (!ancur)
			return NULL;
		ancur->icurr = 0;
		ancur->next = NULL;
		if (cha->tail)
			cha->tail->next = ancur;
		if (!cha->head)
			cha->head = ancur;
		cha->tail = ancur;
		cha->ancur = ancur;
	}

	/* byte arithmetic must go through char *; void * arithmetic is not ISO C */
	data = (char *)ancur + sizeof(chanode_t) + ancur->icurr;
	ancur->icurr += cha->isize;
	return data;
}

/*
 * Release every chunk of the store.  All items handed out by cha_alloc()
 * become invalid.  The store is left empty, so a repeated cha_free() is
 * harmless and cha_alloc() starts over with a fresh chunk.
 */
static void cha_free(chastore_t *cha)
{
	chanode_t *cur = cha->head;
	while (cur) {
		chanode_t *tmp = cur;
		cur = cur->next;
		free(tmp);
	}
	cha->head = cha->tail = NULL;
	cha->ancur = cha->sncur = NULL;
	cha->scurr = 0;
}
 | |
| 
 | |
/*
 * One fingerprinted block of the reference buffer, linked into the
 * bucket of the fingerprint hash table its fingerprint hashes to.
 */
typedef struct s_bdrecord {
	struct s_bdrecord *next;	/* next record in the same bucket, or NULL */
	unsigned int fp;		/* fingerprint (adler32) of the block */
	const unsigned char *ptr;	/* first byte of the block */
} bdrecord_t;
 | |
| 
 | |
| typedef struct s_bdfile {
 | |
| 	const unsigned char *data, *top;
 | |
| 	chastore_t cha;
 | |
| 	unsigned int fphbits;
 | |
| 	bdrecord_t **fphash;
 | |
| } bdfile_t;
 | |
| 
 | |
| static int delta_prepare(const unsigned char *buf, int bufsize, bdfile_t *bdf)
 | |
| {
 | |
| 	unsigned int fphbits;
 | |
| 	int i, hsize;
 | |
| 	const unsigned char *base, *data, *top;
 | |
| 	bdrecord_t *brec;
 | |
| 	bdrecord_t **fphash;
 | |
| 
 | |
| 	fphbits = hashbits(bufsize / BLK_SIZE + 1);
 | |
| 	hsize = 1 << fphbits;
 | |
| 	fphash = malloc(hsize * sizeof(bdrecord_t *));
 | |
| 	if (!fphash)
 | |
| 		return -1;
 | |
| 	for (i = 0; i < hsize; i++)
 | |
| 		fphash[i] = NULL;
 | |
| 	cha_init(&bdf->cha, sizeof(bdrecord_t), hsize / 4 + 1);
 | |
| 
 | |
| 	bdf->data = data = base = buf;
 | |
| 	bdf->top = top = buf + bufsize;
 | |
| 	data += (bufsize / BLK_SIZE) * BLK_SIZE;
 | |
| 	if (data == top)
 | |
| 		data -= BLK_SIZE;
 | |
| 
 | |
| 	for ( ; data >= base; data -= BLK_SIZE) {
 | |
| 		brec = cha_alloc(&bdf->cha);
 | |
| 		if (!brec) {
 | |
| 			cha_free(&bdf->cha);
 | |
| 			free(fphash);
 | |
| 			return -1;
 | |
| 		}
 | |
| 		brec->fp = adler32(0, data, MIN(BLK_SIZE, top - data));
 | |
| 		brec->ptr = data;
 | |
| 		i = HASH(brec->fp, fphbits);
 | |
| 		brec->next = fphash[i];
 | |
| 		fphash[i] = brec;
 | |
| 	}
 | |
| 
 | |
| 	bdf->fphbits = fphbits;
 | |
| 	bdf->fphash = fphash;
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void delta_cleanup(bdfile_t *bdf)
 | |
| {
 | |
| 	free(bdf->fphash);
 | |
| 	cha_free(&bdf->cha);
 | |
| }
 | |
| 
 | |
/*
 * Number of bytes a copy operation occupies in the delta for source
 * offset `o` and length `s`: one command byte, plus one byte for every
 * non-zero byte of the 32-bit offset and of the low 16 bits of the
 * length.  Arguments are parenthesised so expressions can be passed.
 */
#define COPYOP_SIZE(o, s) \
    (!!((o) & 0xff) + !!((o) & 0xff00) + !!((o) & 0xff0000) + \
     !!((o) & 0xff000000) + !!((s) & 0xff) + !!((s) & 0xff00) + 1)
 | |
| 
 | |
| void *diff_delta(void *from_buf, unsigned long from_size,
 | |
| 		 void *to_buf, unsigned long to_size,
 | |
| 		 unsigned long *delta_size,
 | |
| 		 unsigned long max_size)
 | |
| {
 | |
| 	int i, outpos, outsize, inscnt, csize, msize, moff;
 | |
| 	unsigned int fp;
 | |
| 	const unsigned char *data, *top, *ptr1, *ptr2;
 | |
| 	unsigned char *out, *orig;
 | |
| 	bdrecord_t *brec;
 | |
| 	bdfile_t bdf;
 | |
| 
 | |
| 	if (!from_size || !to_size || delta_prepare(from_buf, from_size, &bdf))
 | |
| 		return NULL;
 | |
| 	
 | |
| 	outpos = 0;
 | |
| 	outsize = 8192;
 | |
| 	out = malloc(outsize);
 | |
| 	if (!out) {
 | |
| 		delta_cleanup(&bdf);
 | |
| 		return NULL;
 | |
| 	}
 | |
| 
 | |
| 	data = to_buf;
 | |
| 	top = to_buf + to_size;
 | |
| 
 | |
| 	/* store reference buffer size */
 | |
| 	out[outpos++] = from_size;
 | |
| 	from_size >>= 7;
 | |
| 	while (from_size) {
 | |
| 		out[outpos - 1] |= 0x80;
 | |
| 		out[outpos++] = from_size;
 | |
| 		from_size >>= 7;
 | |
| 	}
 | |
| 
 | |
| 	/* store target buffer size */
 | |
| 	out[outpos++] = to_size;
 | |
| 	to_size >>= 7;
 | |
| 	while (to_size) {
 | |
| 		out[outpos - 1] |= 0x80;
 | |
| 		out[outpos++] = to_size;
 | |
| 		to_size >>= 7;
 | |
| 	}
 | |
| 
 | |
| 	inscnt = 0;
 | |
| 	moff = 0;
 | |
| 	while (data < top) {
 | |
| 		msize = 0;
 | |
| 		fp = adler32(0, data, MIN(top - data, BLK_SIZE));
 | |
| 		i = HASH(fp, bdf.fphbits);
 | |
| 		for (brec = bdf.fphash[i]; brec; brec = brec->next) {
 | |
| 			if (brec->fp == fp) {
 | |
| 				csize = bdf.top - brec->ptr;
 | |
| 				if (csize > top - data)
 | |
| 					csize = top - data;
 | |
| 				for (ptr1 = brec->ptr, ptr2 = data; 
 | |
| 				     csize && *ptr1 == *ptr2;
 | |
| 				     csize--, ptr1++, ptr2++);
 | |
| 
 | |
| 				csize = ptr1 - brec->ptr;
 | |
| 				if (csize > msize) {
 | |
| 					moff = brec->ptr - bdf.data;
 | |
| 					msize = csize;
 | |
| 					if (msize >= 0x10000) {
 | |
| 						msize = 0x10000;
 | |
| 						break;
 | |
| 					}
 | |
| 				}
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		if (!msize || msize < COPYOP_SIZE(moff, msize)) {
 | |
| 			if (!inscnt)
 | |
| 				outpos++;
 | |
| 			out[outpos++] = *data++;
 | |
| 			inscnt++;
 | |
| 			if (inscnt == 0x7f) {
 | |
| 				out[outpos - inscnt - 1] = inscnt;
 | |
| 				inscnt = 0;
 | |
| 			}
 | |
| 		} else {
 | |
| 			if (inscnt) {
 | |
| 				out[outpos - inscnt - 1] = inscnt;
 | |
| 				inscnt = 0;
 | |
| 			}
 | |
| 
 | |
| 			data += msize;
 | |
| 			orig = out + outpos++;
 | |
| 			i = 0x80;
 | |
| 
 | |
| 			if (moff & 0xff) { out[outpos++] = moff; i |= 0x01; }
 | |
| 			moff >>= 8;
 | |
| 			if (moff & 0xff) { out[outpos++] = moff; i |= 0x02; }
 | |
| 			moff >>= 8;
 | |
| 			if (moff & 0xff) { out[outpos++] = moff; i |= 0x04; }
 | |
| 			moff >>= 8;
 | |
| 			if (moff & 0xff) { out[outpos++] = moff; i |= 0x08; }
 | |
| 
 | |
| 			if (msize & 0xff) { out[outpos++] = msize; i |= 0x10; }
 | |
| 			msize >>= 8;
 | |
| 			if (msize & 0xff) { out[outpos++] = msize; i |= 0x20; }
 | |
| 
 | |
| 			*orig = i;
 | |
| 		}
 | |
| 
 | |
| 		if (max_size && outpos > max_size) {
 | |
| 			free(out);
 | |
| 			delta_cleanup(&bdf);
 | |
| 			return NULL;
 | |
| 		}
 | |
| 
 | |
| 		/* next time around the largest possible output is 1 + 4 + 3 */
 | |
| 		if (outpos > outsize - 8) {
 | |
| 			void *tmp = out;
 | |
| 			outsize = outsize * 3 / 2;
 | |
| 			out = realloc(out, outsize);
 | |
| 			if (!out) {
 | |
| 				free(tmp);
 | |
| 				delta_cleanup(&bdf);
 | |
| 				return NULL;
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (inscnt)
 | |
| 		out[outpos - inscnt - 1] = inscnt;
 | |
| 
 | |
| 	delta_cleanup(&bdf);
 | |
| 	*delta_size = outpos;
 | |
| 	return out;
 | |
| }
 |