Skip to content

Commit 090b4da

Browse files
committed
Merge pull request #3533 from PhilipOakley/hashliteral_t
Begin `unsigned long`->`size_t` conversion to support large files on Windows
2 parents c402d01 + a37ca0e commit 090b4da

File tree

5 files changed

+59
-21
lines changed

5 files changed

+59
-21
lines changed

object-file.c

Lines changed: 15 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -1934,9 +1934,9 @@ void *read_object_with_reference(struct repository *r,
19341934
}
19351935

19361936
static void hash_object_body(const struct git_hash_algo *algo, git_hash_ctx *c,
1937-
const void *buf, unsigned long len,
1937+
const void *buf, size_t len,
19381938
struct object_id *oid,
1939-
char *hdr, int *hdrlen)
1939+
char *hdr, size_t *hdrlen)
19401940
{
19411941
algo->init_fn(c);
19421942
algo->update_fn(c, hdr, *hdrlen);
@@ -1945,23 +1945,23 @@ static void hash_object_body(const struct git_hash_algo *algo, git_hash_ctx *c,
19451945
}
19461946

19471947
static void write_object_file_prepare(const struct git_hash_algo *algo,
1948-
const void *buf, unsigned long len,
1948+
const void *buf, size_t len,
19491949
enum object_type type, struct object_id *oid,
1950-
char *hdr, int *hdrlen)
1950+
char *hdr, size_t *hdrlen)
19511951
{
19521952
git_hash_ctx c;
19531953

19541954
/* Generate the header */
19551955
*hdrlen = format_object_header(hdr, *hdrlen, type, len);
19561956

1957-
/* Sha1.. */
1957+
/* Hash (function pointers) computation */
19581958
hash_object_body(algo, &c, buf, len, oid, hdr, hdrlen);
19591959
}
19601960

19611961
static void write_object_file_prepare_literally(const struct git_hash_algo *algo,
1962-
const void *buf, unsigned long len,
1962+
const void *buf, size_t len,
19631963
const char *type, struct object_id *oid,
1964-
char *hdr, int *hdrlen)
1964+
char *hdr, size_t *hdrlen)
19651965
{
19661966
git_hash_ctx c;
19671967

@@ -2081,17 +2081,17 @@ int finalize_object_file_flags(const char *tmpfile, const char *filename,
20812081
}
20822082

20832083
static void hash_object_file_literally(const struct git_hash_algo *algo,
2084-
const void *buf, unsigned long len,
2084+
const void *buf, size_t len,
20852085
const char *type, struct object_id *oid)
20862086
{
20872087
char hdr[MAX_HEADER_LEN];
2088-
int hdrlen = sizeof(hdr);
2088+
size_t hdrlen = sizeof(hdr);
20892089

20902090
write_object_file_prepare_literally(algo, buf, len, type, oid, hdr, &hdrlen);
20912091
}
20922092

20932093
void hash_object_file(const struct git_hash_algo *algo, const void *buf,
2094-
unsigned long len, enum object_type type,
2094+
size_t len, enum object_type type,
20952095
struct object_id *oid)
20962096
{
20972097
hash_object_file_literally(algo, buf, len, type_name(type), oid);
@@ -2457,7 +2457,7 @@ int stream_loose_object(struct input_stream *in_stream, size_t len,
24572457
return err;
24582458
}
24592459

2460-
int write_object_file_flags(const void *buf, unsigned long len,
2460+
int write_object_file_flags(const void *buf, size_t len,
24612461
enum object_type type, struct object_id *oid,
24622462
struct object_id *compat_oid_in, unsigned flags)
24632463
{
@@ -2466,7 +2466,7 @@ int write_object_file_flags(const void *buf, unsigned long len,
24662466
const struct git_hash_algo *compat = repo->compat_hash_algo;
24672467
struct object_id compat_oid;
24682468
char hdr[MAX_HEADER_LEN];
2469-
int hdrlen = sizeof(hdr);
2469+
size_t hdrlen = sizeof(hdr);
24702470

24712471
/* Generate compat_oid */
24722472
if (compat) {
@@ -2497,7 +2497,7 @@ int write_object_file_flags(const void *buf, unsigned long len,
24972497
return 0;
24982498
}
24992499

2500-
int write_object_file_literally(const void *buf, unsigned long len,
2500+
int write_object_file_literally(const void *buf, size_t len,
25012501
const char *type, struct object_id *oid,
25022502
unsigned flags)
25032503
{
@@ -2506,8 +2506,8 @@ int write_object_file_literally(const void *buf, unsigned long len,
25062506
const struct git_hash_algo *algo = repo->hash_algo;
25072507
const struct git_hash_algo *compat = repo->compat_hash_algo;
25082508
struct object_id compat_oid;
2509-
int hdrlen, status = 0;
2510-
int compat_type = -1;
2509+
size_t hdrlen;
2510+
int status = 0, compat_type = -1;
25112511

25122512
if (compat) {
25132513
compat_type = type_from_string_gently(type, -1, 1);

object-store-ll.h

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -270,10 +270,10 @@ void *repo_read_object_file(struct repository *r,
270270
int oid_object_info(struct repository *r, const struct object_id *, unsigned long *);
271271

272272
void hash_object_file(const struct git_hash_algo *algo, const void *buf,
273-
unsigned long len, enum object_type type,
273+
size_t len, enum object_type type,
274274
struct object_id *oid);
275275

276-
int write_object_file_flags(const void *buf, unsigned long len,
276+
int write_object_file_flags(const void *buf, size_t len,
277277
enum object_type type, struct object_id *oid,
278278
struct object_id *comapt_oid_in, unsigned flags);
279279
static inline int write_object_file(const void *buf, unsigned long len,
@@ -282,7 +282,7 @@ static inline int write_object_file(const void *buf, unsigned long len,
282282
return write_object_file_flags(buf, len, type, oid, NULL, 0);
283283
}
284284

285-
int write_object_file_literally(const void *buf, unsigned long len,
285+
int write_object_file_literally(const void *buf, size_t len,
286286
const char *type, struct object_id *oid,
287287
unsigned flags);
288288
int stream_loose_object(struct input_stream *in_stream, size_t len,

sha1dc_git.c

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,10 +27,9 @@ void git_SHA1DCFinal(unsigned char hash[20], SHA1_CTX *ctx)
2727
/*
2828
* Same as SHA1DCUpdate, but adjust types to match git's usual interface.
2929
*/
30-
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *vdata, unsigned long len)
30+
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *vdata, size_t len)
3131
{
3232
const char *data = vdata;
33-
/* We expect an unsigned long, but sha1dc only takes an int */
3433
while (len > INT_MAX) {
3534
SHA1DCUpdate(ctx, data, INT_MAX);
3635
data += INT_MAX;

sha1dc_git.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ void git_SHA1DCInit(SHA1_CTX *);
1515
#endif
1616

1717
void git_SHA1DCFinal(unsigned char [20], SHA1_CTX *);
18-
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *data, unsigned long len);
18+
void git_SHA1DCUpdate(SHA1_CTX *ctx, const void *data, size_t len);
1919

2020
#define platform_SHA_IS_SHA1DC /* used by "test-tool sha1-is-sha1dc" */
2121

t/t1007-hash-object.sh

Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -49,6 +49,9 @@ test_expect_success 'setup' '
4949
5050
example sha1:ddd3f836d3e3fbb7ae289aa9ae83536f76956399
5151
example sha256:b44fe1fe65589848253737db859bd490453510719d7424daab03daf0767b85ae
52+
53+
large5GB sha1:0be2be10a4c8764f32c4bf372a98edc731a4b204
54+
large5GB sha256:dc18ca621300c8d3cfa505a275641ebab00de189859e022a975056882d313e64
5255
EOF
5356
'
5457

@@ -265,4 +268,40 @@ test_expect_success '--stdin outside of repository (uses SHA-1)' '
265268
test_cmp expect actual
266269
'
267270

271+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
272+
'files over 4GB hash literally' '
273+
test-tool genzeros $((5*1024*1024*1024)) >big &&
274+
test_oid large5GB >expect &&
275+
git hash-object --stdin --literally <big >actual &&
276+
test_cmp expect actual
277+
'
278+
279+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
280+
'files over 4GB hash correctly via --stdin' '
281+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
282+
test_oid large5GB >expect &&
283+
git hash-object --stdin <big >actual &&
284+
test_cmp expect actual
285+
'
286+
287+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
288+
'files over 4GB hash correctly' '
289+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
290+
test_oid large5GB >expect &&
291+
git hash-object -- big >actual &&
292+
test_cmp expect actual
293+
'
294+
295+
# This clean filter does nothing, other than exercising the interface.
296+
# We ensure that cleaning doesn't mangle large files on 64-bit Windows.
297+
test_expect_success EXPENSIVE,SIZE_T_IS_64BIT,!LONG_IS_64BIT \
298+
'hash filtered files over 4GB correctly' '
299+
{ test -f big || test-tool genzeros $((5*1024*1024*1024)) >big; } &&
300+
test_oid large5GB >expect &&
301+
test_config filter.null-filter.clean "cat" &&
302+
echo "big filter=null-filter" >.gitattributes &&
303+
git hash-object -- big >actual &&
304+
test_cmp expect actual
305+
'
306+
268307
test_done

0 commit comments

Comments
 (0)