#!/bin/sh

test_description='git pack-objects using object filtering'

GIT_TEST_DEFAULT_INITIAL_BRANCH_NAME=main
export GIT_TEST_DEFAULT_INITIAL_BRANCH_NAME

. ./test-lib.sh

# Test blob:none filter.

# Create repository r1 with five commits, each adding one small file
# (file.1 .. file.5).
test_expect_success 'setup r1' '
	git init r1 &&
	for n in 1 2 3 4 5
	do
		echo "This is file: $n" >r1/file.$n &&
		git -C r1 add file.$n &&
		git -C r1 commit -m "$n" || return 1
	done
'

# Print the first whitespace-separated field of every line read from
# stdin.  The callers feed it lines selected from "verify-pack -v"
# output and treat that field as the object ID.
parse_verify_pack_blob_oid () {
	awk '{print $1}' -
}

# An unfiltered pack must contain exactly the blobs recorded in the index.
test_expect_success 'verify blob count in normal packfile' '
	git -C r1 ls-files -s file.1 file.2 file.3 file.4 file.5 \
		>ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r1 pack-objects --revs --stdout >all.pack <<-EOF &&
	HEAD
	EOF
	git -C r1 index-pack ../all.pack &&

	git -C r1 verify-pack -v ../all.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify blob:none packfile has no blobs' '
	git -C r1 pack-objects --revs --stdout --filter=blob:none >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r1 index-pack ../filter.pack &&

	git -C r1 verify-pack -v ../filter.pack >verify_result &&
	! grep blob verify_result
'

# Same as above, but let pack-objects write "mypackname-<hash>.pack"
# itself; the hash it prints on stdout is captured in packhash.
test_expect_success 'verify blob:none packfile without --stdout' '
	git -C r1 pack-objects --revs --filter=blob:none mypackname >packhash <<-EOF &&
	HEAD
	EOF
	git -C r1 verify-pack -v "mypackname-$(cat packhash).pack" >verify_result &&
	! grep blob verify_result
'

# Relies on all.pack and filter.pack left behind by the tests above.
test_expect_success 'verify normal and blob:none packfiles have same commits/trees' '
	git -C r1 verify-pack -v ../all.pack >verify_result &&
	grep -E "commit|tree" verify_result |
	parse_verify_pack_blob_oid |
	sort >expected &&

	git -C r1 verify-pack -v ../filter.pack >verify_result &&
	grep -E "commit|tree" verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'get an error for missing tree object' '
	git init r5 &&
	echo foo >r5/foo &&
	git -C r5 add foo &&
	git -C r5 commit -m "foo" &&
	git -C r5 rev-parse HEAD^{tree} >tree &&
	# Turn the OID into its loose-object path (xx/yyyy...) and remove it.
	del=$(sed "s|..|&/|" tree) &&
	rm r5/.git/objects/$del &&
	test_must_fail git -C r5 pack-objects --revs --stdout 2>bad_tree <<-EOF &&
	HEAD
	EOF
	grep "bad tree object" bad_tree
'

test_expect_success 'setup for tests of tree:0' '
	mkdir r1/subtree &&
	echo "This is a file in a subtree" >r1/subtree/file &&
	git -C r1 add subtree/file &&
	git -C r1 commit -m subtree
'

test_expect_success 'verify tree:0 packfile has no blobs or trees' '
	git -C r1 pack-objects --revs --stdout --filter=tree:0 >commitsonly.pack <<-EOF &&
	HEAD
	EOF
	git -C r1 index-pack ../commitsonly.pack &&
	git -C r1 verify-pack -v ../commitsonly.pack >objs &&
	! grep -E "tree|blob" objs
'

test_expect_success 'grab tree directly when using tree:0' '
	# We should get the tree specified directly but not its blobs or subtrees.
	git -C r1 pack-objects --revs --stdout --filter=tree:0 >commitsonly.pack <<-EOF &&
	HEAD:
	EOF
	git -C r1 index-pack ../commitsonly.pack &&
	git -C r1 verify-pack -v ../commitsonly.pack >objs &&
	awk "/tree|blob/{print \$1}" objs >trees_and_blobs &&
	git -C r1 rev-parse HEAD: >expected &&
	test_cmp expected trees_and_blobs
'

# Test blob:limit=<n>[kmg] filter.
# We boundary test around the size parameter.  Only blobs strictly smaller
# than the limit are kept, so limits of 500 and 1000 should both omit the
# 1000-byte blob, while a limit of 1001 should let it through.
# Create repository r2 with two commits, adding a 1000-byte and a
# 10000-byte file (large.1000, large.10000).
test_expect_success 'setup r2' '
	git init r2 &&
	for n in 1000 10000
	do
		printf "%"$n"s" X >r2/large.$n &&
		git -C r2 add large.$n &&
		git -C r2 commit -m "$n" || return 1
	done
'

test_expect_success 'verify blob count in normal packfile' '
	git -C r2 ls-files -s large.1000 large.10000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout >all.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../all.pack &&

	git -C r2 verify-pack -v ../all.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify blob:limit=500 omits all blobs' '
	git -C r2 pack-objects --revs --stdout --filter=blob:limit=500 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	! grep blob verify_result
'

# A blob whose size equals the limit is still omitted.
test_expect_success 'verify blob:limit=1000' '
	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1000 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	! grep blob verify_result
'

test_expect_success 'verify blob:limit=1001' '
	git -C r2 ls-files -s large.1000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1001 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify blob:limit=10001' '
	git -C r2 ls-files -s large.1000 large.10000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=10001 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify blob:limit=1k' '
	git -C r2 ls-files -s large.1000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1k >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# A blob named explicitly on stdin is expected in the pack even though
# it is larger than the limit.
test_expect_success 'verify explicitly specifying oversized blob in input' '
	git -C r2 ls-files -s large.1000 large.10000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	echo HEAD >objects &&
	git -C r2 rev-parse HEAD:large.10000 >>objects &&
	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1k <objects >filter.pack &&
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify blob:limit=1m' '
	git -C r2 ls-files -s large.1000 large.10000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1m >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# Relies on all.pack and on the filter.pack left by the previous test.
test_expect_success 'verify normal and blob:limit packfiles have same commits/trees' '
	git -C r2 verify-pack -v ../all.pack >verify_result &&
	grep -E "commit|tree" verify_result |
	parse_verify_pack_blob_oid |
	sort >expected &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep -E "commit|tree" verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# When --filter is given twice, the result must match the smaller limit
# regardless of the order of the two options.
test_expect_success 'verify small limit and big limit results in small limit' '
	git -C r2 ls-files -s large.1000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=1001 \
		--filter=blob:limit=10001 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify big limit and small limit results in small limit' '
	git -C r2 ls-files -s large.1000 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r2 pack-objects --revs --stdout --filter=blob:limit=10001 \
		--filter=blob:limit=1001 >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r2 index-pack ../filter.pack &&

	git -C r2 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# Test sparse:path=<path> filter.
# !!!!
# NOTE: sparse:path filter support has been dropped for security reasons,
# so the tests have been changed to make sure that using it fails.
# !!!!
# Use a local file containing a sparse-checkout specification to filter
# out blobs not required for the corresponding sparse-checkout.  We do not
# require sparse-checkout to actually be enabled.

# Create repository r3 with sparse1/sparse2 at the top level and under
# dir1/, plus two pattern files (pattern1, pattern2) outside the repository.
test_expect_success 'setup r3' '
	git init r3 &&
	mkdir r3/dir1 &&
	for n in sparse1 sparse2
	do
		echo "This is file: $n" >r3/$n &&
		git -C r3 add $n &&
		echo "This is file: dir1/$n" >r3/dir1/$n &&
		git -C r3 add dir1/$n || return 1
	done &&
	git -C r3 commit -m "sparse" &&
	echo dir1/ >pattern1 &&
	echo sparse1 >pattern2
'

test_expect_success 'verify blob count in normal packfile' '
	git -C r3 ls-files -s sparse1 sparse2 dir1/sparse1 dir1/sparse2 \
		>ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r3 pack-objects --revs --stdout >all.pack <<-EOF &&
	HEAD
	EOF
	git -C r3 index-pack ../all.pack &&

	git -C r3 verify-pack -v ../all.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

test_expect_success 'verify sparse:path=pattern1 fails' '
	test_must_fail git -C r3 pack-objects --revs --stdout \
		--filter=sparse:path=../pattern1 <<-EOF
	HEAD
	EOF
'

test_expect_success 'verify sparse:path=pattern2 fails' '
	test_must_fail git -C r3 pack-objects --revs --stdout \
		--filter=sparse:path=../pattern2 <<-EOF
	HEAD
	EOF
'

# Test sparse:oid=<oid-ish> filter.
# Use a blob containing a sparse-checkout specification to filter
# out blobs not required for the corresponding sparse-checkout.  We do not
# require sparse-checkout to actually be enabled.
# Create repository r4 like r3, but with the sparse specification
# ("dir1/") committed as the file "pattern" inside the repository.
test_expect_success 'setup r4' '
	git init r4 &&
	mkdir r4/dir1 &&
	for n in sparse1 sparse2
	do
		echo "This is file: $n" >r4/$n &&
		git -C r4 add $n &&
		echo "This is file: dir1/$n" >r4/dir1/$n &&
		git -C r4 add dir1/$n || return 1
	done &&
	echo dir1/ >r4/pattern &&
	git -C r4 add pattern &&
	git -C r4 commit -m "pattern"
'

test_expect_success 'verify blob count in normal packfile' '
	git -C r4 ls-files -s pattern sparse1 sparse2 dir1/sparse1 dir1/sparse2 \
		>ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r4 pack-objects --revs --stdout >all.pack <<-EOF &&
	HEAD
	EOF
	git -C r4 index-pack ../all.pack &&

	git -C r4 verify-pack -v ../all.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# Name the sparse specification by the raw object ID of the "pattern" blob.
test_expect_success 'verify sparse:oid=OID' '
	git -C r4 ls-files -s dir1/sparse1 dir1/sparse2 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r4 ls-files -s pattern >staged &&
	oid=$(test_parse_ls_files_stage_oids <staged) &&
	git -C r4 pack-objects --revs --stdout --filter=sparse:oid=$oid >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r4 index-pack ../filter.pack &&

	git -C r4 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# Name the sparse specification by a revision expression instead.
test_expect_success 'verify sparse:oid=oid-ish' '
	git -C r4 ls-files -s dir1/sparse1 dir1/sparse2 >ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	git -C r4 pack-objects --revs --stdout --filter=sparse:oid=main:pattern >filter.pack <<-EOF &&
	HEAD
	EOF
	git -C r4 index-pack ../filter.pack &&

	git -C r4 verify-pack -v ../filter.pack >verify_result &&
	grep blob verify_result |
	parse_verify_pack_blob_oid |
	sort >observed &&

	test_cmp expected observed
'

# Delete some loose objects and use pack-objects, but WITHOUT any filtering.
# This models previously omitted objects that we did not receive.
test_expect_success 'setup r1 - delete loose blobs' '
	git -C r1 ls-files -s file.1 file.2 file.3 file.4 file.5 \
		>ls_files_result &&
	test_parse_ls_files_stage_oids <ls_files_result |
	sort >expected &&

	# Map each OID to its loose-object path (xx/yyyy...) and remove it.
	for id in $(sed "s|..|&/|" expected)
	do
		rm r1/.git/objects/$id || return 1
	done
'

test_expect_success 'verify pack-objects fails w/ missing objects' '
	test_must_fail git -C r1 pack-objects --revs --stdout >miss.pack <<-EOF
	HEAD
	EOF
'

test_expect_success 'verify pack-objects fails w/ --missing=error' '
	test_must_fail git -C r1 pack-objects --revs --stdout --missing=error >miss.pack <<-EOF
	HEAD
	EOF
'

test_expect_success 'verify pack-objects w/ --missing=allow-any' '
	git -C r1 pack-objects --revs --stdout --missing=allow-any >miss.pack <<-EOF
	HEAD
	EOF
'

# Test that --path-walk produces the same object set as standard traversal
# when using sparse:oid filters with cone-mode patterns.
#
# The sparse:oid filter restricts only blobs, not trees.  Both standard
# and path-walk should produce identical sets of blobs, commits, and trees.

test_expect_success 'setup pw_sparse for path-walk comparison' '
	git init pw_sparse &&
	mkdir -p pw_sparse/inc/sub pw_sparse/exc/sub &&

	for n in 1 2
	do
		echo "inc $n" >pw_sparse/inc/file$n &&
		echo "inc sub $n" >pw_sparse/inc/sub/file$n &&
		echo "exc $n" >pw_sparse/exc/file$n &&
		echo "exc sub $n" >pw_sparse/exc/sub/file$n &&
		echo "root $n" >pw_sparse/root$n || return 1
	done &&
	git -C pw_sparse add . &&
	git -C pw_sparse commit -m "first" &&

	echo "inc 1 modified" >pw_sparse/inc/file1 &&
	echo "exc 1 modified" >pw_sparse/exc/file1 &&
	echo "root 1 modified" >pw_sparse/root1 &&
	git -C pw_sparse add . &&
	git -C pw_sparse commit -m "second" &&

	# Cone-mode sparse pattern: include root + inc/
	printf "/*\n!/*/\n/inc/\n" |
	git -C pw_sparse hash-object -w --stdin >sparse_oid
'

# The object-ID patterns below use "+" rather than a fixed length so that
# they still match when the suite runs with a hash whose hex form is not
# 40 characters long; otherwise both sides would be empty and compare equal.
test_expect_success 'sparse:oid with --path-walk produces same blobs' '
	oid=$(cat sparse_oid) &&

	git -C pw_sparse pack-objects --revs --stdout \
		--filter=sparse:oid=$oid >standard.pack <<-EOF &&
	HEAD
	EOF
	git -C pw_sparse index-pack ../standard.pack &&
	git -C pw_sparse verify-pack -v ../standard.pack >standard_verify &&

	git -C pw_sparse pack-objects --revs --stdout \
		--path-walk --filter=sparse:oid=$oid >pathwalk.pack <<-EOF &&
	HEAD
	EOF
	git -C pw_sparse index-pack ../pathwalk.pack &&
	git -C pw_sparse verify-pack -v ../pathwalk.pack >pathwalk_verify &&

	# Blobs must match exactly
	grep -E "^[0-9a-f]+ blob" standard_verify |
	awk "{print \$1}" |
	sort >standard_blobs &&
	grep -E "^[0-9a-f]+ blob" pathwalk_verify |
	awk "{print \$1}" |
	sort >pathwalk_blobs &&
	test_cmp standard_blobs pathwalk_blobs &&

	# Commits must match exactly
	grep -E "^[0-9a-f]+ commit" standard_verify |
	awk "{print \$1}" |
	sort >standard_commits &&
	grep -E "^[0-9a-f]+ commit" pathwalk_verify |
	awk "{print \$1}" |
	sort >pathwalk_commits &&
	test_cmp standard_commits pathwalk_commits
'

# Relies on standard_verify and pathwalk_verify from the previous test.
test_expect_success 'sparse:oid with --path-walk includes all trees' '
	# The sparse:oid filter restricts only blobs, not trees.
	# Both standard and path-walk should include the same trees.
	grep -E "^[0-9a-f]+ tree" standard_verify |
	awk "{print \$1}" |
	sort >standard_trees &&
	grep -E "^[0-9a-f]+ tree" pathwalk_verify |
	awk "{print \$1}" |
	sort >pathwalk_trees &&
	test_cmp standard_trees pathwalk_trees
'

# Test the edge case where the same tree/blob OID appears at both an
# in-cone and out-of-cone path.  When sibling directories have identical
# contents, they share a tree OID.  The path-walk defers marking objects
# SEEN until after checking sparse patterns, so an object at an out-of-cone
# path can still be discovered at an in-cone path.
# Create repository pw_shared in which aaa/ and zzz/ hold identical
# content, and store a cone pattern that selects only the root and zzz/.
test_expect_success 'setup pw_shared for shared OID across cone boundary' '
	git init pw_shared &&
	mkdir pw_shared/aaa pw_shared/zzz &&
	echo "shared content" >pw_shared/aaa/file &&
	echo "shared content" >pw_shared/zzz/file &&
	echo "root file" >pw_shared/rootfile &&
	git -C pw_shared add . &&
	git -C pw_shared commit -m "aaa and zzz share tree OID" &&

	# Verify they share a tree OID
	aaa_tree=$(git -C pw_shared rev-parse HEAD:aaa) &&
	zzz_tree=$(git -C pw_shared rev-parse HEAD:zzz) &&
	test "$aaa_tree" = "$zzz_tree" &&

	# Cone pattern: include root + zzz/ (not aaa/)
	printf "/*\n!/*/\n/zzz/\n" |
	git -C pw_shared hash-object -w --stdin >shared_sparse_oid
'

# The object-ID pattern uses "+" rather than a fixed length so that it
# still matches when the suite runs with a hash whose hex form is not
# 40 characters long; otherwise both sides would be empty and compare equal.
test_expect_success 'shared tree OID: --path-walk blobs match standard' '
	oid=$(cat shared_sparse_oid) &&

	git -C pw_shared pack-objects --revs --stdout \
		--filter=sparse:oid=$oid >shared_std.pack <<-EOF &&
	HEAD
	EOF
	git -C pw_shared index-pack ../shared_std.pack &&
	git -C pw_shared verify-pack -v ../shared_std.pack >shared_std_verify &&

	git -C pw_shared pack-objects --revs --stdout \
		--path-walk --filter=sparse:oid=$oid >shared_pw.pack <<-EOF &&
	HEAD
	EOF
	git -C pw_shared index-pack ../shared_pw.pack &&
	git -C pw_shared verify-pack -v ../shared_pw.pack >shared_pw_verify &&

	grep -E "^[0-9a-f]+ blob" shared_std_verify |
	awk "{print \$1}" |
	sort >shared_std_blobs &&
	grep -E "^[0-9a-f]+ blob" shared_pw_verify |
	awk "{print \$1}" |
	sort >shared_pw_blobs &&
	test_cmp shared_std_blobs shared_pw_blobs
'

test_done