git-zlib: handle data streams larger than 4GB
On Windows, zlib's `uLong` type is 32-bit even on 64-bit systems. When processing data streams larger than 4GB, the `total_in` and `total_out` fields in zlib's `z_stream` structure wrap around, which caused the sanity checks in `zlib_post_call()` to trigger `BUG()` assertions. The git_zstream wrapper now tracks its own 64-bit totals rather than copying them from zlib. The sanity checks compare only the low bits, using `maximum_unsigned_value_of_type(uLong)` to mask appropriately for the platform's `uLong` size. This is based on work by LordKiRon in git-for-windows#6076. Signed-off-by: Johannes Schindelin <johannes.schindelin@gmx.de> Signed-off-by: Junio C Hamano <gitster@pobox.com>main
parent
f2063855fb
commit
d05d666977
25
git-zlib.c
25
git-zlib.c
|
|
@ -30,6 +30,9 @@ static const char *zerr_to_string(int status)
|
|||
*/
|
||||
/* #define ZLIB_BUF_MAX ((uInt)-1) */
|
||||
#define ZLIB_BUF_MAX ((uInt) 1024 * 1024 * 1024) /* 1GB */
|
||||
|
||||
/* uLong is 32-bit on Windows, even on 64-bit systems */
|
||||
#define ULONG_MAX_VALUE maximum_unsigned_value_of_type(uLong)
|
||||
static inline uInt zlib_buf_cap(unsigned long len)
|
||||
{
|
||||
return (ZLIB_BUF_MAX < len) ? ZLIB_BUF_MAX : len;
|
||||
|
|
@ -39,31 +42,37 @@ static void zlib_pre_call(git_zstream *s)
|
|||
{
|
||||
s->z.next_in = s->next_in;
|
||||
s->z.next_out = s->next_out;
|
||||
s->z.total_in = s->total_in;
|
||||
s->z.total_out = s->total_out;
|
||||
s->z.total_in = (uLong)(s->total_in & ULONG_MAX_VALUE);
|
||||
s->z.total_out = (uLong)(s->total_out & ULONG_MAX_VALUE);
|
||||
s->z.avail_in = zlib_buf_cap(s->avail_in);
|
||||
s->z.avail_out = zlib_buf_cap(s->avail_out);
|
||||
}
|
||||
|
||||
static void zlib_post_call(git_zstream *s, int status)
|
||||
{
|
||||
unsigned long bytes_consumed;
|
||||
unsigned long bytes_produced;
|
||||
size_t bytes_consumed;
|
||||
size_t bytes_produced;
|
||||
|
||||
bytes_consumed = s->z.next_in - s->next_in;
|
||||
bytes_produced = s->z.next_out - s->next_out;
|
||||
if (s->z.total_out != s->total_out + bytes_produced)
|
||||
/*
|
||||
* zlib's total_out/total_in are uLong which may wrap for >4GB.
|
||||
* We track our own totals and verify only the low bits match.
|
||||
*/
|
||||
if ((s->z.total_out & ULONG_MAX_VALUE) !=
|
||||
((s->total_out + bytes_produced) & ULONG_MAX_VALUE))
|
||||
BUG("total_out mismatch");
|
||||
/*
|
||||
* zlib does not update total_in when it returns Z_NEED_DICT,
|
||||
* causing a mismatch here. Skip the sanity check in that case.
|
||||
*/
|
||||
if (status != Z_NEED_DICT &&
|
||||
s->z.total_in != s->total_in + bytes_consumed)
|
||||
(s->z.total_in & ULONG_MAX_VALUE) !=
|
||||
((s->total_in + bytes_consumed) & ULONG_MAX_VALUE))
|
||||
BUG("total_in mismatch");
|
||||
|
||||
s->total_out = s->z.total_out;
|
||||
s->total_in = s->z.total_in;
|
||||
s->total_out += bytes_produced;
|
||||
s->total_in += bytes_consumed;
|
||||
/* zlib-ng marks `next_in` as `const`, so we have to cast it away. */
|
||||
s->next_in = (unsigned char *) s->z.next_in;
|
||||
s->next_out = s->z.next_out;
|
||||
|
|
|
|||
|
|
@ -7,8 +7,8 @@ typedef struct git_zstream {
|
|||
struct z_stream_s z;
|
||||
unsigned long avail_in;
|
||||
unsigned long avail_out;
|
||||
unsigned long total_in;
|
||||
unsigned long total_out;
|
||||
size_t total_in;
|
||||
size_t total_out;
|
||||
unsigned char *next_in;
|
||||
unsigned char *next_out;
|
||||
} git_zstream;
|
||||
|
|
|
|||
|
|
@ -1118,7 +1118,7 @@ int odb_source_loose_write_stream(struct odb_source *source,
|
|||
} while (ret == Z_OK || ret == Z_BUF_ERROR);
|
||||
|
||||
if (stream.total_in != len + hdrlen)
|
||||
die(_("write stream object %ld != %"PRIuMAX), stream.total_in,
|
||||
die(_("write stream object %"PRIuMAX" != %"PRIuMAX), (uintmax_t)stream.total_in,
|
||||
(uintmax_t)len + hdrlen);
|
||||
|
||||
/*
|
||||
|
|
|
|||
Loading…
Reference in New Issue