Merge branch 'jt/fetch-tips-in-partial-clone'
[git/git.git] / t / t5616-partial-clone.sh
1 #!/bin/sh
2
3 test_description='git partial clone'
4
5 . ./test-lib.sh
6
# Create a normal "src" repo in which later tests can make new commits.
# Each of the four commits adds one file; expect_1.oids ends up holding the
# sorted OIDs of all four blobs. The two awk scripts written here are reused
# by later tests to pick a column out of command output.
test_expect_success 'setup normal src repo' '
	echo "{print \$1}" >print_1.awk &&
	echo "{print \$2}" >print_2.awk &&

	git init src &&
	for n in 1 2 3 4
	do
		# The &&-chain does not propagate out of a loop body by
		# itself, so bail out explicitly on the first failure.
		echo "This is file: $n" >src/file.$n.txt &&
		git -C src add file.$n.txt &&
		git -C src commit -m "file $n" &&
		git -C src ls-files -s file.$n.txt >>temp ||
		return 1
	done &&
	awk -f print_2.awk <temp | sort >expect_1.oids &&
	test_line_count = 4 expect_1.oids
'
24
# Make a bare clone of "src" called "srv.bare"; the rest of the script uses
# it as the server. uploadpack.allowfilter and uploadpack.allowanysha1inwant
# are switched on in its local config.
test_expect_success 'setup bare clone for server' '
	git clone --bare "file://$(pwd)/src" srv.bare &&
	(
		cd srv.bare &&
		git config --local uploadpack.allowfilter 1 &&
		git config --local uploadpack.allowanysha1inwant 1
	)
'
31
# Make a basic partial clone ("pc1") of "srv.bare" with all blobs filtered
# out, then check that:
#  - every blob recorded in expect_1.oids is reported as missing, and
#  - the partial clone settings were written to the local config.
test_expect_success 'do partial clone 1' '
	git clone --no-checkout --filter=blob:none "file://$(pwd)/srv.bare" pc1 &&

	git -C pc1 rev-list --quiet --objects --missing=print HEAD >revs &&
	awk -f print_1.awk revs | sed "s/?//" | sort >observed.oids &&
	test_cmp expect_1.oids observed.oids &&

	(
		cd pc1 &&
		test "$(git config --local core.repositoryformatversion)" = "1" &&
		test "$(git config --local extensions.partialclone)" = "origin" &&
		test "$(git config --local core.partialclonefilter)" = "blob:none"
	)
'
48
# Checking out master forces the blobs at HEAD to be fetched on demand:
# four objects are reported missing before the checkout, none afterwards.
test_expect_success 'verify checkout with dynamic object fetch' '
	git -C pc1 rev-list --objects --quiet --missing=print HEAD >observed &&
	test_line_count = 4 observed &&

	git -C pc1 checkout master &&

	git -C pc1 rev-list --objects --quiet --missing=print HEAD >observed &&
	test_line_count = 0 observed
'
57
# Add five commits to "src" that each append a line to file.1.txt, giving
# the file a blame history. Record the expected blame output, then push the
# new commits to "srv.bare" through a remote named "srv".
test_expect_success 'push new commits to server' '
	git -C src remote add srv "file://$(pwd)/srv.bare" &&
	for x in a b c d e
	do
		# The &&-chain does not propagate out of a loop body by
		# itself, so bail out explicitly on the first failure.
		echo "Mod file.1.txt $x" >>src/file.1.txt &&
		git -C src add file.1.txt &&
		git -C src commit -m "mod $x" ||
		return 1
	done &&
	git -C src blame master -- file.1.txt >expect.blame &&
	git -C src push -u srv master
'
71
# Fetch from the promisor remote inside the partial clone without passing
# any filter on the command line. The filter-spec must be picked up from the
# config, so the blobs of the five new commits must still be missing.
test_expect_success 'partial fetch inherits filter settings' '
	git -C pc1 fetch origin &&
	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >observed &&
	test_line_count = 5 observed
'
81
# Running diff triggers a dynamic object fetch. Only one new blob should
# arrive (the version of the file in origin/master), which leaves four of
# the five previously missing objects still missing.
test_expect_success 'verify diff causes dynamic object fetch' '
	git -C pc1 diff master..origin/master -- file.1.txt &&
	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >observed &&
	test_line_count = 4 observed
'
90
# Running blame walks the whole history of the file, so the intermediate
# blobs have to be fetched dynamically as well. The blame output must match
# what "src" produced, and nothing in the range may remain missing.
test_expect_success 'verify blame causes dynamic object fetch' '
	git -C pc1 blame origin/master -- file.1.txt >observed.blame &&
	test_cmp expect.blame observed.blame &&

	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >observed &&
	test_line_count = 0 observed
'
100
# Add six commits to "src" that each append a line to file.2.txt, giving
# the file a history, and push them to "srv.bare".
test_expect_success 'push new commits to server for file.2.txt' '
	for x in a b c d e f
	do
		# The &&-chain does not propagate out of a loop body by
		# itself, so bail out explicitly on the first failure.
		echo "Mod file.2.txt $x" >>src/file.2.txt &&
		git -C src add file.2.txt &&
		git -C src commit -m "mod $x" ||
		return 1
	done &&
	git -C src push -u srv master
'
112
# Passing --no-filter disables the filter-spec inherited from the config, so
# this is a FULL fetch: none of the new blobs may be missing afterwards.
test_expect_success 'override inherited filter-spec using --no-filter' '
	git -C pc1 fetch --no-filter origin &&
	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >observed &&
	test_line_count = 0 observed
'
121
# Add six commits to "src" that each append a line to file.3.txt, giving
# the file a history, and push them to "srv.bare".
test_expect_success 'push new commits to server for file.3.txt' '
	for x in a b c d e f
	do
		# The &&-chain does not propagate out of a loop body by
		# itself, so bail out explicitly on the first failure.
		echo "Mod file.3.txt $x" >>src/file.3.txt &&
		git -C src add file.3.txt &&
		git -C src commit -m "mod $x" ||
		return 1
	done &&
	git -C src push -u srv master
'
133
# Do a partial fetch, then fetch the missing objects by hand: list them with
# rev-list, feed the OIDs to fetch-pack, and check that nothing is missing
# afterwards. This could serve as the basis of a pre-command hook that bulk
# fetches objects, perhaps combined with a command in dry-run mode.
test_expect_success 'manual prefetch of missing objects' '
	git -C pc1 fetch --filter=blob:none origin &&

	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >revs &&
	awk -f print_1.awk revs | sed "s/?//" | sort >observed.oids &&
	test_line_count = 6 observed.oids &&

	git -C pc1 fetch-pack --stdin "file://$(pwd)/srv.bare" <observed.oids &&

	git -C pc1 rev-list --objects --quiet --missing=print \
		origin/master ^master >revs &&
	awk -f print_1.awk revs | sed "s/?//" | sort >observed.oids &&
	test_line_count = 0 observed.oids
'
157
# With transfer.fsckobjects=1 set on the command line, the trace of a
# partial clone must show index-pack being run with --fsck-objects.
test_expect_success 'partial clone with transfer.fsckobjects=1 uses index-pack --fsck-objects' '
	git init src &&
	test_commit -C src x &&
	test_config -C src uploadpack.allowfilter 1 &&
	test_config -C src uploadpack.allowanysha1inwant 1 &&

	GIT_TRACE="$(pwd)/trace" \
	git -c transfer.fsckobjects=1 clone --filter=blob:none \
		"file://$(pwd)/src" dst &&

	grep "git index-pack.*--fsck-objects" trace
'
168
# A blob that a ref (here: a lightweight tag) points to directly must be
# present after a blob:none partial clone; the clone must not complain about
# the ref and the result must pass fsck.
test_expect_success 'partial clone fetches blobs pointed to by refs even if normally filtered out' '
	rm -rf src dst &&
	git init src &&
	test_commit -C src x &&
	test_config -C src uploadpack.allowfilter 1 &&
	test_config -C src uploadpack.allowanysha1inwant 1 &&

	# Write a loose blob into "src" and tag it.
	BLOB=$(echo blob-contents | git -C src hash-object -w --stdin) &&
	git -C src tag myblob "$BLOB" &&

	git clone --filter=blob:none "file://$(pwd)/src" dst 2>err &&
	! grep "does not point to a valid object" err &&
	git -C dst fsck
'
184
# An object named explicitly on the fetch command line must be fetched even
# though the partial clone already treats it as promised: the blob of foo.t
# is missing before the fetch and no longer missing after it.
test_expect_success 'fetch what is specified on CLI even if already promised' '
	rm -rf src dst.git &&
	git init src &&
	test_commit -C src foo &&
	test_config -C src uploadpack.allowfilter 1 &&
	test_config -C src uploadpack.allowanysha1inwant 1 &&

	# Record the OID of the blob that the clone will leave out.
	git hash-object --stdin <src/foo.t >blob &&

	git clone --bare --filter=blob:none "file://$(pwd)/src" dst.git &&

	git -C dst.git rev-list --quiet --objects --missing=print HEAD \
		>missing_before &&
	grep "?$(cat blob)" missing_before &&

	git -C dst.git fetch origin $(cat blob) &&

	git -C dst.git rev-list --quiet --objects --missing=print HEAD \
		>missing_after &&
	! grep "?$(cat blob)" missing_after
'
201
# The remaining tests clone over HTTP (they use $HTTPD_URL), so load the
# httpd helper library and start the web server before them.
. "$TEST_DIRECTORY/lib-httpd.sh"
start_httpd
204
205 # Converts bytes into a form suitable for inclusion in a sed command. For
206 # example, "printf 'ab\r\n' | hex_unpack" results in '\x61\x62\x0d\x0a'.
207 sed_escape () {
208 perl -e '$/ = undef; $input = <>; print unpack("H2" x length($input), $input)' |
209 sed 's/\(..\)/\\x\1/g'
210 }
211
# A clone must fail when the server advertises a ref (here: a tag pointing
# at a blob) but the packfile it sends does not contain the object the ref
# points to. The incomplete response is produced by a one-time sed script
# that swaps the real packfile for a crafted one.
test_expect_success 'upon cloning, check that all refs point to objects' '
	SERVER="$HTTPD_DOCUMENT_ROOT_PATH/server" &&
	rm -rf "$SERVER" repo &&
	test_create_repo "$SERVER" &&
	test_commit -C "$SERVER" foo &&
	test_config -C "$SERVER" uploadpack.allowfilter 1 &&
	test_config -C "$SERVER" uploadpack.allowanysha1inwant 1 &&

	# Create a tag pointing to a blob.
	BLOB=$(echo blob-contents | git -C "$SERVER" hash-object --stdin -w) &&
	git -C "$SERVER" tag myblob "$BLOB" &&

	# Craft a packfile not including that blob.
	git -C "$SERVER" rev-parse HEAD |
	git -C "$SERVER" pack-objects --stdout >incomplete.pack &&

	# Replace the existing packfile with the crafted one. The protocol
	# requires that the packfile be sent in sideband 1, hence the extra
	# \x01 byte at the beginning. The length written in front of the
	# data is the pack size plus 5.
	printf "1,/packfile/!c %04x\\\\x01%s0000" \
		"$(($(wc -c <incomplete.pack) + 5))" \
		"$(sed_escape <incomplete.pack)" \
		>"$HTTPD_ROOT_PATH/one-time-sed" &&

	# Use protocol v2 because the sed command looks for the "packfile"
	# section header.
	test_config -C "$SERVER" protocol.version 2 &&
	test_must_fail git -c protocol.version=2 clone \
		--filter=blob:none "$HTTPD_URL/one_time_sed/server" repo 2>err &&

	grep "did not send all necessary objects" err &&

	# Ensure that the one-time-sed script was used: it must no longer
	# exist. test_path_is_missing reports the offending path on failure.
	test_path_is_missing "$HTTPD_ROOT_PATH/one-time-sed"
'
247
# A partial clone must succeed when the server sends an annotated tag but
# not the blob the tag points to. The incomplete response is produced by a
# one-time sed script that swaps the real packfile for a crafted one.
test_expect_success 'when partial cloning, tolerate server not sending target of tag' '
	SERVER="$HTTPD_DOCUMENT_ROOT_PATH/server" &&
	rm -rf "$SERVER" repo &&
	test_create_repo "$SERVER" &&
	test_commit -C "$SERVER" foo &&
	test_config -C "$SERVER" uploadpack.allowfilter 1 &&
	test_config -C "$SERVER" uploadpack.allowanysha1inwant 1 &&

	# Create an annotated tag pointing to a blob.
	BLOB=$(echo blob-contents | git -C "$SERVER" hash-object --stdin -w) &&
	git -C "$SERVER" tag -m message -a myblob "$BLOB" &&

	# Craft a packfile including the tag, but not the blob it points to.
	# Also, omit objects referenced from HEAD in order to force a second
	# fetch (to fetch missing objects) upon the automatic checkout that
	# happens after a clone.
	printf "%s\n%s\n--not\n%s\n%s\n" \
		$(git -C "$SERVER" rev-parse HEAD) \
		$(git -C "$SERVER" rev-parse myblob) \
		$(git -C "$SERVER" rev-parse "HEAD^{tree}") \
		$(git -C "$SERVER" rev-parse "myblob^{blob}") |
	git -C "$SERVER" pack-objects --thin --stdout >incomplete.pack &&

	# Replace the existing packfile with the crafted one. The protocol
	# requires that the packfile be sent in sideband 1, hence the extra
	# \x01 byte at the beginning. The length written in front of the
	# data is the pack size plus 5.
	printf "1,/packfile/!c %04x\\\\x01%s0000" \
		"$(($(wc -c <incomplete.pack) + 5))" \
		"$(sed_escape <incomplete.pack)" \
		>"$HTTPD_ROOT_PATH/one-time-sed" &&

	# Use protocol v2 because the sed command looks for the "packfile"
	# section header.
	test_config -C "$SERVER" protocol.version 2 &&

	# Exercise to make sure it works.
	git -c protocol.version=2 clone \
		--filter=blob:none "$HTTPD_URL/one_time_sed/server" repo 2>err &&
	! grep "missing object referenced by" err &&

	# Ensure that the one-time-sed script was used: it must no longer
	# exist. test_path_is_missing reports the offending path on failure.
	test_path_is_missing "$HTTPD_ROOT_PATH/one-time-sed"
'
291
292 stop_httpd
293
294 test_done