Skip to content

Commit e1152b2

Browse files
dscho authored and mjcheetham committed
Merge pull request #3533 from PhilipOakley/hashliteral_t
Begin `unsigned long`->`size_t` conversion to support large files on Windows
2 parents a548c62 + 2db4ab3 commit e1152b2

File tree

5 files changed

+59
-20
lines changed

5 files changed

+59
-20
lines changed

object-file.c

Lines changed: 15 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1779,9 +1779,9 @@ void *read_object_with_reference(struct repository *r,
17791779
}
17801780

17811781
static void hash_object_body(const struct git_hash_algo *algo, git_hash_ctx *c,
1782-
const void *buf, unsigned long len,
1782+
const void *buf, size_t len,
17831783
struct object_id *oid,
1784-
char *hdr, int *hdrlen)
1784+
char *hdr, size_t *hdrlen)
17851785
{
17861786
algo->init_fn(c);
17871787
algo->update_fn(c, hdr, *hdrlen);
@@ -1790,23 +1790,23 @@ static void hash_object_body(const struct git_hash_algo *algo, git_hash_ctx *c,
17901790
}
17911791

17921792
static void write_object_file_prepare(const struct git_hash_algo *algo,
1793-
const void *buf, unsigned long len,
1793+
const void *buf, size_t len,
17941794
enum object_type type, struct object_id *oid,
1795-
char *hdr, int *hdrlen)
1795+
char *hdr, size_t *hdrlen)
17961796
{
17971797
git_hash_ctx c;
17981798

17991799
/* Generate the header */
18001800
*hdrlen = format_object_header(hdr, *hdrlen, type, len);
18011801

1802-
/* Sha1.. */
1802+
/* Hash (function pointers) computation */
18031803
hash_object_body(algo, &c, buf, len, oid, hdr, hdrlen);
18041804
}
18051805

18061806
static void write_object_file_prepare_literally(const struct git_hash_algo *algo,
1807-
const void *buf, unsigned long len,
1807+
const void *buf, size_t len,
18081808
const char *type, struct object_id *oid,
1809-
char *hdr, int *hdrlen)
1809+
char *hdr, size_t *hdrlen)
18101810
{
18111811
git_hash_ctx c;
18121812

@@ -1858,17 +1858,17 @@ int finalize_object_file(const char *tmpfile, const char *filename)
18581858
}
18591859

18601860
static void hash_object_file_literally(const struct git_hash_algo *algo,
1861-
const void *buf, unsigned long len,
1861+
const void *buf, size_t len,
18621862
const char *type, struct object_id *oid)
18631863
{
18641864
char hdr[MAX_HEADER_LEN];
1865-
int hdrlen = sizeof(hdr);
1865+
size_t hdrlen = sizeof(hdr);
18661866

18671867
write_object_file_prepare_literally(algo, buf, len, type, oid, hdr, &hdrlen);
18681868
}
18691869

18701870
void hash_object_file(const struct git_hash_algo *algo, const void *buf,
1871-
unsigned long len, enum object_type type,
1871+
size_t len, enum object_type type,
18721872
struct object_id *oid)
18731873
{
18741874
hash_object_file_literally(algo, buf, len, type_name(type), oid);
@@ -2210,12 +2210,12 @@ int stream_loose_object(struct input_stream *in_stream, size_t len,
22102210
return err;
22112211
}
22122212

2213-
int write_object_file_flags(const void *buf, unsigned long len,
2213+
int write_object_file_flags(const void *buf, size_t len,
22142214
enum object_type type, struct object_id *oid,
22152215
unsigned flags)
22162216
{
22172217
char hdr[MAX_HEADER_LEN];
2218-
int hdrlen = sizeof(hdr);
2218+
size_t hdrlen = sizeof(hdr);
22192219

22202220
/* Normally if we have it in the pack then we do not bother writing
22212221
* it out into .git/objects/??/?{38} file.
@@ -2227,12 +2227,13 @@ int write_object_file_flags(const void *buf, unsigned long len,
22272227
return write_loose_object(oid, hdr, hdrlen, buf, len, 0, flags);
22282228
}
22292229

2230-
int write_object_file_literally(const void *buf, unsigned long len,
2230+
int write_object_file_literally(const void *buf, size_t len,
22312231
const char *type, struct object_id *oid,
22322232
unsigned flags)
22332233
{
22342234
char *header;
2235-
int hdrlen, status = 0;
2235+
size_t hdrlen;
2236+
int status = 0;
22362237

22372238
/* type string, SP, %lu of the length plus NUL must fit this */
22382239
hdrlen = strlen(type) + MAX_HEADER_LEN;

object-store.h

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -251,10 +251,10 @@ void *repo_read_object_file(struct repository *r,
251251
int oid_object_info(struct repository *r, const struct object_id *, unsigned long *);
252252

253253
void hash_object_file(const struct git_hash_algo *algo, const void *buf,
254-
unsigned long len, enum object_type type,
254+
size_t len, enum object_type type,
255255
struct object_id *oid);
256256

257-
int write_object_file_flags(const void *buf, unsigned long len,
257+
int write_object_file_flags(const void *buf, size_t len,
258258
enum object_type type, struct object_id *oid,
259259
unsigned flags);
260260
static inline int write_object_file(const void *buf, unsigned long len,
@@ -263,7 +263,7 @@ static inline int write_object_file(const void *buf, unsigned long len,
263263
return write_object_file_flags(buf, len, type, oid, 0);
264264
}
265265

266-
int write_object_file_literally(const void *buf, unsigned long len,
266+
int write_object_file_literally(const void *buf, size_t len,
267267
const char *type, struct object_id *oid,
268268
unsigned flags);
269269
int stream_loose_object(struct input_stream *in_stream, size_t len,

sha1dc_git.c

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,10 +27,9 @@ void git_SHA1DCFinal(unsigned char hash[20], SHA1_CTX *ctx)
2727
/*
2828
* Same as SHA1DCUpdate, but adjust types to match git's usual interface.
2929
*/
30-
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *vdata, unsigned long len)
30+
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *vdata, size_t len)
3131
{
3232
const char *data = vdata;
33-
/* We expect an unsigned long, but sha1dc only takes an int */
3433
while (len > INT_MAX) {
3534
SHA1DCUpdate(ctx, data, INT_MAX);
3635
data += INT_MAX;

sha1dc_git.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ void git_SHA1DCInit(SHA1_CTX *);
1515
#endif
1616

1717
void git_SHA1DCFinal(unsigned char [20], SHA1_CTX *);
18-
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *data, unsigned long len);
18+
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *data, size_t len);
1919

2020
#define platform_SHA_IS_SHA1DC /* used by "test-tool sha1-is-sha1dc" */
2121
#define platform_SHA_CTX SHA1_CTX

t/t1007-hash-object.sh

Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,9 @@ test_expect_success 'setup' '
5050
5151
example sha1:ddd3f836d3e3fbb7ae289aa9ae83536f76956399
5252
example sha256:b44fe1fe65589848253737db859bd490453510719d7424daab03daf0767b85ae
53+
54+
large5GB sha1:0be2be10a4c8764f32c4bf372a98edc731a4b204
55+
large5GB sha256:dc18ca621300c8d3cfa505a275641ebab00de189859e022a975056882d313e64
5356
EOF
5457
'
5558

@@ -260,4 +263,40 @@ test_expect_success '--literally with extra-long type' '
260263
echo example | git hash-object -t $t --literally --stdin
261264
'
262265

266+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
267+
'files over 4GB hash literally' '
268+
test-tool genzeros $((5*1024*1024*1024)) >big &&
269+
test_oid large5GB >expect &&
270+
git hash-object --stdin --literally <big >actual &&
271+
test_cmp expect actual
272+
'
273+
274+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
275+
'files over 4GB hash correctly via --stdin' '
276+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
277+
test_oid large5GB >expect &&
278+
git hash-object --stdin <big >actual &&
279+
test_cmp expect actual
280+
'
281+
282+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
283+
'files over 4GB hash correctly' '
284+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
285+
test_oid large5GB >expect &&
286+
git hash-object -- big >actual &&
287+
test_cmp expect actual
288+
'
289+
290+
# This clean filter does nothing, other than exercising the interface.
291+
# We ensure that cleaning doesn't mangle large files on 64-bit Windows.
292+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
293+
'hash filtered files over 4GB correctly' '
294+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
295+
test_oid large5GB >expect &&
296+
test_config filter.null-filter.clean "cat" &&
297+
echo "big filter=null-filter" >.gitattributes &&
298+
git hash-object -- big >actual &&
299+
test_cmp expect actual
300+
'
301+
263302
test_done

0 commit comments

Comments
 (0)