2 * Copyright (c) 2020 Ori Bernstein
3 * Copyright (c) 2021 Stefan Sperling <stsp@openbsd.org>
5 * Permission to use, copy, modify, and distribute this software for any
6 * purpose with or without fee is hereby granted, provided that the above
7 * copyright notice and this permission notice appear in all copies.
9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18 #include "got_compat.h"
20 #include <sys/types.h>
21 #include <sys/queue.h>
39 #include "got_error.h"
40 #include "got_cancel.h"
41 #include "got_object.h"
43 #include "got_reference.h"
44 #include "got_repository.h"
45 #include "got_repository_admin.h"
47 #include "got_lib_deltify.h"
48 #include "got_lib_delta.h"
49 #include "got_lib_hash.h"
50 #include "got_lib_object.h"
51 #include "got_lib_object_idset.h"
52 #include "got_lib_object_cache.h"
53 #include "got_lib_deflate.h"
54 #include "got_lib_ratelimit.h"
55 #include "got_lib_pack.h"
56 #include "got_lib_pack_create.h"
57 #include "got_lib_repository.h"
58 #include "got_lib_inflate.h"
59 #include "got_lib_poll.h"
61 #include "murmurhash2.h"
64 #define MIN(_a,_b) ((_a) < (_b) ? (_a) : (_b))
68 #define MAX(_a,_b) ((_a) > (_b) ? (_a) : (_b))
72 #define nitems(_a) (sizeof((_a)) / sizeof((_a)[0]))
75 static const struct got_error
*
76 alloc_meta(struct got_pack_meta
**new, struct got_object_id
*id
,
77 const char *path
, int obj_type
, time_t mtime
, uint32_t seed
)
79 struct got_pack_meta
*m
;
83 m
= calloc(1, sizeof(*m
));
85 return got_error_from_errno("calloc");
87 memcpy(&m
->id
, id
, sizeof(m
->id
));
89 m
->path_hash
= murmurhash2(path
, strlen(path
), seed
);
90 m
->obj_type
= obj_type
;
97 clear_meta(struct got_pack_meta
*meta
)
102 free(meta
->delta_buf
);
103 meta
->delta_buf
= NULL
;
104 free(meta
->base_obj_id
);
105 meta
->base_obj_id
= NULL
;
106 meta
->reused_delta_offset
= 0;
107 got_deltify_free(meta
->dtab
);
112 free_nmeta(struct got_pack_meta
**meta
, int nmeta
)
116 for (i
= 0; i
< nmeta
; i
++)
123 delta_order_cmp(const void *pa
, const void *pb
)
125 struct got_pack_meta
*a
, *b
;
127 a
= *(struct got_pack_meta
**)pa
;
128 b
= *(struct got_pack_meta
**)pb
;
130 if (a
->obj_type
!= b
->obj_type
)
131 return a
->obj_type
- b
->obj_type
;
132 if (a
->path_hash
< b
->path_hash
)
134 if (a
->path_hash
> b
->path_hash
)
136 if (a
->mtime
< b
->mtime
)
138 if (a
->mtime
> b
->mtime
)
140 return got_object_id_cmp(&a
->id
, &b
->id
);
144 delta_size(struct got_delta_instruction
*deltas
, int ndeltas
)
148 for (i
= 0; i
< ndeltas
; i
++) {
150 size
+= GOT_DELTA_SIZE_SHIFT
;
152 size
+= deltas
[i
].len
+ 1;
157 static const struct got_error
*
158 append(unsigned char **p
, size_t *len
, off_t
*sz
, void *seg
, int nseg
)
162 if (*len
+ nseg
>= *sz
) {
163 while (*len
+ nseg
>= *sz
)
165 n
= realloc(*p
, *sz
);
167 return got_error_from_errno("realloc");
170 memcpy(*p
+ *len
, seg
, nseg
);
175 static const struct got_error
*
176 encode_delta_in_mem(struct got_pack_meta
*m
, struct got_raw_object
*o
,
177 struct got_delta_instruction
*deltas
, int ndeltas
,
178 off_t delta_size
, off_t base_size
)
180 const struct got_error
*err
;
181 unsigned char buf
[16], *bp
;
183 size_t len
= 0, compressed_len
;
184 off_t bufsize
= delta_size
;
186 struct got_delta_instruction
*d
;
189 delta_buf
= malloc(bufsize
);
190 if (delta_buf
== NULL
)
191 return got_error_from_errno("malloc");
193 /* base object size */
194 buf
[0] = base_size
& GOT_DELTA_SIZE_VAL_MASK
;
195 n
= base_size
>> GOT_DELTA_SIZE_SHIFT
;
196 for (i
= 1; n
> 0; i
++) {
197 buf
[i
- 1] |= GOT_DELTA_SIZE_MORE
;
198 buf
[i
] = n
& GOT_DELTA_SIZE_VAL_MASK
;
199 n
>>= GOT_DELTA_SIZE_SHIFT
;
201 err
= append(&delta_buf
, &len
, &bufsize
, buf
, i
);
205 /* target object size */
206 buf
[0] = o
->size
& GOT_DELTA_SIZE_VAL_MASK
;
207 n
= o
->size
>> GOT_DELTA_SIZE_SHIFT
;
208 for (i
= 1; n
> 0; i
++) {
209 buf
[i
- 1] |= GOT_DELTA_SIZE_MORE
;
210 buf
[i
] = n
& GOT_DELTA_SIZE_VAL_MASK
;
211 n
>>= GOT_DELTA_SIZE_SHIFT
;
213 err
= append(&delta_buf
, &len
, &bufsize
, buf
, i
);
217 for (j
= 0; j
< ndeltas
; j
++) {
222 buf
[0] = GOT_DELTA_BASE_COPY
;
223 for (i
= 0; i
< 4; i
++) {
224 /* DELTA_COPY_OFF1 ... DELTA_COPY_OFF4 */
233 if (n
!= GOT_DELTA_COPY_DEFAULT_LEN
) {
234 /* DELTA_COPY_LEN1 ... DELTA_COPY_LEN3 */
235 for (i
= 0; i
< 3 && n
> 0; i
++) {
236 buf
[0] |= 1 << (i
+ 4);
241 err
= append(&delta_buf
, &len
, &bufsize
,
245 } else if (o
->f
== NULL
) {
247 while (n
!= d
->len
) {
248 buf
[0] = (d
->len
- n
< 127) ? d
->len
- n
: 127;
249 err
= append(&delta_buf
, &len
, &bufsize
,
253 err
= append(&delta_buf
, &len
, &bufsize
,
254 o
->data
+ o
->hdrlen
+ d
->offset
+ n
,
263 if (fseeko(o
->f
, o
->hdrlen
+ d
->offset
, SEEK_SET
) == -1) {
264 err
= got_error_from_errno("fseeko");
268 while (n
!= d
->len
) {
269 buf
[0] = (d
->len
- n
< 127) ? d
->len
- n
: 127;
270 err
= append(&delta_buf
, &len
, &bufsize
,
274 r
= fread(content
, 1, buf
[0], o
->f
);
276 err
= got_ferror(o
->f
, GOT_ERR_IO
);
279 err
= append(&delta_buf
, &len
, &bufsize
,
288 err
= got_deflate_to_mem_mmap(&m
->delta_buf
, &compressed_len
,
289 NULL
, NULL
, delta_buf
, 0, len
);
294 m
->delta_compressed_len
= compressed_len
;
300 static const struct got_error
*
301 encode_delta(struct got_pack_meta
*m
, struct got_raw_object
*o
,
302 struct got_delta_instruction
*deltas
, int ndeltas
,
303 off_t base_size
, FILE *f
)
305 const struct got_error
*err
;
306 unsigned char buf
[16], *bp
;
309 struct got_deflate_buf zb
;
310 struct got_delta_instruction
*d
;
311 off_t delta_len
= 0, compressed_len
= 0;
313 err
= got_deflate_init(&zb
, NULL
, GOT_DEFLATE_BUFSIZE
);
317 /* base object size */
318 buf
[0] = base_size
& GOT_DELTA_SIZE_VAL_MASK
;
319 n
= base_size
>> GOT_DELTA_SIZE_SHIFT
;
320 for (i
= 1; n
> 0; i
++) {
321 buf
[i
- 1] |= GOT_DELTA_SIZE_MORE
;
322 buf
[i
] = n
& GOT_DELTA_SIZE_VAL_MASK
;
323 n
>>= GOT_DELTA_SIZE_SHIFT
;
326 err
= got_deflate_append_to_file_mmap(&zb
, &compressed_len
,
332 /* target object size */
333 buf
[0] = o
->size
& GOT_DELTA_SIZE_VAL_MASK
;
334 n
= o
->size
>> GOT_DELTA_SIZE_SHIFT
;
335 for (i
= 1; n
> 0; i
++) {
336 buf
[i
- 1] |= GOT_DELTA_SIZE_MORE
;
337 buf
[i
] = n
& GOT_DELTA_SIZE_VAL_MASK
;
338 n
>>= GOT_DELTA_SIZE_SHIFT
;
341 err
= got_deflate_append_to_file_mmap(&zb
, &compressed_len
,
347 for (j
= 0; j
< ndeltas
; j
++) {
352 buf
[0] = GOT_DELTA_BASE_COPY
;
353 for (i
= 0; i
< 4; i
++) {
354 /* DELTA_COPY_OFF1 ... DELTA_COPY_OFF4 */
362 if (n
!= GOT_DELTA_COPY_DEFAULT_LEN
) {
363 /* DELTA_COPY_LEN1 ... DELTA_COPY_LEN3 */
364 for (i
= 0; i
< 3 && n
> 0; i
++) {
365 buf
[0] |= 1 << (i
+ 4);
370 err
= got_deflate_append_to_file_mmap(&zb
,
371 &compressed_len
, buf
, 0, bp
- buf
, f
, NULL
);
374 delta_len
+= (bp
- buf
);
375 } else if (o
->f
== NULL
) {
377 while (n
!= d
->len
) {
378 buf
[0] = (d
->len
- n
< 127) ? d
->len
- n
: 127;
379 err
= got_deflate_append_to_file_mmap(&zb
,
380 &compressed_len
, buf
, 0, 1, f
, NULL
);
384 err
= got_deflate_append_to_file_mmap(&zb
,
386 o
->data
+ o
->hdrlen
+ d
->offset
+ n
, 0,
396 if (fseeko(o
->f
, o
->hdrlen
+ d
->offset
, SEEK_SET
) == -1) {
397 err
= got_error_from_errno("fseeko");
401 while (n
!= d
->len
) {
402 buf
[0] = (d
->len
- n
< 127) ? d
->len
- n
: 127;
403 err
= got_deflate_append_to_file_mmap(&zb
,
404 &compressed_len
, buf
, 0, 1, f
, NULL
);
408 r
= fread(content
, 1, buf
[0], o
->f
);
410 err
= got_ferror(o
->f
, GOT_ERR_IO
);
413 err
= got_deflate_append_to_file_mmap(&zb
,
414 &compressed_len
, content
, 0, buf
[0], f
,
424 err
= got_deflate_flush(&zb
, f
, NULL
, &compressed_len
);
429 if (compressed_len
!= ftello(f
) - m
->delta_offset
) {
430 err
= got_error(GOT_ERR_COMPRESSION
);
434 m
->delta_len
= delta_len
;
435 m
->delta_compressed_len
= compressed_len
;
437 got_deflate_end(&zb
);
441 const struct got_error
*
442 got_pack_report_progress(got_pack_progress_cb progress_cb
, void *progress_arg
,
443 struct got_ratelimit
*rl
, int ncolored
, int nfound
, int ntrees
,
444 off_t packfile_size
, int ncommits
, int nobj_total
, int obj_deltify
,
445 int nobj_written
, int pack_done
)
447 const struct got_error
*err
;
450 if (progress_cb
== NULL
)
453 err
= got_ratelimit_check(&elapsed
, rl
);
457 return progress_cb(progress_arg
, ncolored
, nfound
, ntrees
,
458 packfile_size
, ncommits
, nobj_total
, obj_deltify
, nobj_written
,
462 const struct got_error
*
463 got_pack_add_meta(struct got_pack_meta
*m
, struct got_pack_metavec
*v
)
465 if (v
->nmeta
== v
->metasz
){
466 size_t newsize
= 2 * v
->metasz
;
467 struct got_pack_meta
**new;
468 new = reallocarray(v
->meta
, newsize
, sizeof(*new));
470 return got_error_from_errno("reallocarray");
475 v
->meta
[v
->nmeta
++] = m
;
479 const struct got_error
*
480 got_pack_find_pack_for_reuse(struct got_packidx
**best_packidx
,
481 struct got_repository
*repo
)
483 const struct got_error
*err
= NULL
;
484 struct got_pathlist_entry
*pe
;
485 const char *best_packidx_path
= NULL
;
488 *best_packidx
= NULL
;
490 RB_FOREACH(pe
, got_pathlist_head
, &repo
->packidx_paths
) {
491 const char *path_packidx
= pe
->path
;
492 struct got_packidx
*packidx
;
495 err
= got_repo_get_packidx(&packidx
, path_packidx
, repo
);
499 nobj
= be32toh(packidx
->hdr
.fanout_table
[0xff]);
500 if (nobj
> nobj_max
) {
501 best_packidx_path
= path_packidx
;
506 if (best_packidx_path
) {
507 err
= got_repo_get_packidx(best_packidx
, best_packidx_path
,
514 const struct got_error
*
515 got_pack_cache_pack_for_packidx(struct got_pack
**pack
,
516 struct got_packidx
*packidx
, struct got_repository
*repo
)
518 const struct got_error
*err
;
519 char *path_packfile
= NULL
;
521 err
= got_packidx_get_packfile_path(&path_packfile
,
522 packidx
->path_packidx
);
526 *pack
= got_repo_get_cached_pack(repo
, path_packfile
);
528 err
= got_repo_cache_pack(pack
, repo
, path_packfile
, packidx
);
537 static const struct got_error
*
538 pick_deltas(struct got_pack_meta
**meta
, int nmeta
, int ncolored
,
539 int nfound
, int ntrees
, int ncommits
, int nreused
, FILE *delta_cache
,
540 struct got_repository
*repo
,
541 got_pack_progress_cb progress_cb
, void *progress_arg
,
542 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
544 const struct got_error
*err
= NULL
;
545 struct got_pack_meta
*m
= NULL
, *base
= NULL
;
546 struct got_raw_object
*raw
= NULL
, *base_raw
= NULL
;
547 struct got_delta_instruction
*deltas
= NULL
, *best_deltas
= NULL
;
548 int i
, j
, ndeltas
, best_ndeltas
;
549 off_t size
, best_size
;
550 const int max_base_candidates
= 3;
551 size_t delta_memsize
= 0;
552 const size_t max_delta_memsize
= 4 * GOT_DELTA_RESULT_SIZE_CACHED_MAX
;
556 delta_seed
= arc4random();
558 qsort(meta
, nmeta
, sizeof(struct got_pack_meta
*), delta_order_cmp
);
559 for (i
= 0; i
< nmeta
; i
++) {
561 err
= (*cancel_cb
)(cancel_arg
);
565 err
= got_pack_report_progress(progress_cb
, progress_arg
, rl
,
566 ncolored
, nfound
, ntrees
, 0L, ncommits
, nreused
+ nmeta
,
572 if (m
->obj_type
== GOT_OBJ_TYPE_COMMIT
||
573 m
->obj_type
== GOT_OBJ_TYPE_TAG
)
576 err
= got_object_raw_open(&raw
, &outfd
, repo
, &m
->id
);
581 if (raw
->f
== NULL
) {
582 err
= got_deltify_init_mem(&m
->dtab
, raw
->data
,
583 raw
->hdrlen
, raw
->size
+ raw
->hdrlen
, delta_seed
);
585 err
= got_deltify_init(&m
->dtab
, raw
->f
, raw
->hdrlen
,
586 raw
->size
+ raw
->hdrlen
, delta_seed
);
591 if (i
> max_base_candidates
) {
592 struct got_pack_meta
*n
= NULL
;
593 n
= meta
[i
- (max_base_candidates
+ 1)];
594 got_deltify_free(n
->dtab
);
598 best_size
= raw
->size
;
600 for (j
= MAX(0, i
- max_base_candidates
); j
< i
; j
++) {
602 err
= (*cancel_cb
)(cancel_arg
);
607 /* long chains make unpacking slow, avoid such bases */
608 if (base
->nchain
>= 128 ||
609 base
->obj_type
!= m
->obj_type
)
612 err
= got_object_raw_open(&base_raw
, &outfd
, repo
,
617 if (raw
->f
== NULL
&& base_raw
->f
== NULL
) {
618 err
= got_deltify_mem_mem(&deltas
, &ndeltas
,
619 raw
->data
, raw
->hdrlen
,
620 raw
->size
+ raw
->hdrlen
, delta_seed
,
621 base
->dtab
, base_raw
->data
,
623 base_raw
->size
+ base_raw
->hdrlen
);
624 } else if (raw
->f
== NULL
) {
625 err
= got_deltify_mem_file(&deltas
, &ndeltas
,
626 raw
->data
, raw
->hdrlen
,
627 raw
->size
+ raw
->hdrlen
, delta_seed
,
628 base
->dtab
, base_raw
->f
,
630 base_raw
->size
+ base_raw
->hdrlen
);
631 } else if (base_raw
->f
== NULL
) {
632 err
= got_deltify_file_mem(&deltas
, &ndeltas
,
634 raw
->size
+ raw
->hdrlen
, delta_seed
,
635 base
->dtab
, base_raw
->data
,
637 base_raw
->size
+ base_raw
->hdrlen
);
639 err
= got_deltify(&deltas
, &ndeltas
,
641 raw
->size
+ raw
->hdrlen
, delta_seed
,
642 base
->dtab
, base_raw
->f
, base_raw
->hdrlen
,
643 base_raw
->size
+ base_raw
->hdrlen
);
645 got_object_raw_close(base_raw
);
650 size
= delta_size(deltas
, ndeltas
);
651 if (size
+ 32 < best_size
){
653 * if we already picked a best delta,
658 best_deltas
= deltas
;
659 best_ndeltas
= ndeltas
;
661 m
->nchain
= base
->nchain
+ 1;
663 m
->head
= base
->head
;
673 if (best_ndeltas
> 0) {
674 if (best_size
<= GOT_DELTA_RESULT_SIZE_CACHED_MAX
&&
675 delta_memsize
+ best_size
<= max_delta_memsize
) {
676 delta_memsize
+= best_size
;
677 err
= encode_delta_in_mem(m
, raw
, best_deltas
,
678 best_ndeltas
, best_size
, m
->prev
->size
);
680 m
->delta_offset
= ftello(delta_cache
);
681 err
= encode_delta(m
, raw
, best_deltas
,
682 best_ndeltas
, m
->prev
->size
, delta_cache
);
691 got_object_raw_close(raw
);
696 got_object_raw_close(raw
);
698 got_object_raw_close(base_raw
);
699 if (outfd
!= -1 && close(outfd
) == -1 && err
== NULL
)
700 err
= got_error_from_errno("close");
706 static const struct got_error
*
707 search_packidx(int *found
, struct got_object_id
*id
,
708 struct got_repository
*repo
)
710 const struct got_error
*err
= NULL
;
711 struct got_packidx
*packidx
= NULL
;
716 err
= got_repo_search_packidx(&packidx
, &idx
, repo
, id
);
718 *found
= 1; /* object is already packed */
719 else if (err
->code
== GOT_ERR_NO_OBJ
)
724 const struct got_error
*
725 got_pack_add_object(int want_meta
, struct got_object_idset
*idset
,
726 struct got_object_id
*id
, const char *path
, int obj_type
,
727 time_t mtime
, uint32_t seed
, int loose_obj_only
,
728 struct got_repository
*repo
, int *ncolored
, int *nfound
, int *ntrees
,
729 got_pack_progress_cb progress_cb
, void *progress_arg
,
730 struct got_ratelimit
*rl
)
732 const struct got_error
*err
;
733 struct got_pack_meta
*m
= NULL
;
735 if (loose_obj_only
) {
737 err
= search_packidx(&is_packed
, id
, repo
);
740 if (is_packed
&& want_meta
)
745 err
= alloc_meta(&m
, id
, path
, obj_type
, mtime
, seed
);
750 err
= got_pack_report_progress(progress_cb
, progress_arg
, rl
,
751 *ncolored
, *nfound
, *ntrees
, 0L, 0, 0, 0, 0, 0);
759 err
= got_object_idset_add(idset
, id
, m
);
767 const struct got_error
*
768 got_pack_load_tree_entries(struct got_object_id_queue
*ids
, int want_meta
,
769 struct got_object_idset
*idset
, struct got_object_idset
*idset_exclude
,
770 struct got_tree_object
*tree
,
771 const char *dpath
, time_t mtime
, uint32_t seed
, struct got_repository
*repo
,
772 int loose_obj_only
, int *ncolored
, int *nfound
, int *ntrees
,
773 got_pack_progress_cb progress_cb
, void *progress_arg
,
774 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
776 const struct got_error
*err
;
781 err
= got_pack_report_progress(progress_cb
, progress_arg
, rl
,
782 *ncolored
, *nfound
, *ntrees
, 0L, 0, 0, 0, 0, 0);
786 for (i
= 0; i
< got_object_tree_get_nentries(tree
); i
++) {
787 struct got_tree_entry
*e
= got_object_tree_get_entry(tree
, i
);
788 struct got_object_id
*id
= got_tree_entry_get_id(e
);
789 mode_t mode
= got_tree_entry_get_mode(e
);
792 err
= (*cancel_cb
)(cancel_arg
);
797 if (got_object_tree_entry_is_submodule(e
) ||
798 got_object_idset_contains(idset
, id
) ||
799 got_object_idset_contains(idset_exclude
, id
))
803 * If got-read-pack is crawling trees for us then
804 * we are only here to collect blob IDs.
806 if (ids
== NULL
&& S_ISDIR(mode
))
809 if (asprintf(&p
, "%s%s%s", dpath
,
810 got_path_is_root_dir(dpath
) ? "" : "/",
811 got_tree_entry_get_name(e
)) == -1) {
812 err
= got_error_from_errno("asprintf");
817 struct got_object_qid
*qid
;
818 err
= got_object_qid_alloc(&qid
, id
);
823 STAILQ_INSERT_TAIL(ids
, qid
, entry
);
824 } else if (S_ISREG(mode
) || S_ISLNK(mode
)) {
825 err
= got_pack_add_object(want_meta
,
826 want_meta
? idset
: idset_exclude
, id
, p
,
827 GOT_OBJ_TYPE_BLOB
, mtime
, seed
, loose_obj_only
,
828 repo
, ncolored
, nfound
, ntrees
,
829 progress_cb
, progress_arg
, rl
);
844 const struct got_error
*
845 got_pack_load_tree(int want_meta
, struct got_object_idset
*idset
,
846 struct got_object_idset
*idset_exclude
,
847 struct got_object_id
*tree_id
, const char *dpath
, time_t mtime
,
848 uint32_t seed
, struct got_repository
*repo
, int loose_obj_only
,
849 int *ncolored
, int *nfound
, int *ntrees
,
850 got_pack_progress_cb progress_cb
, void *progress_arg
,
851 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
853 const struct got_error
*err
= NULL
;
854 struct got_object_id_queue tree_ids
;
855 struct got_object_qid
*qid
;
856 struct got_tree_object
*tree
= NULL
;
858 if (got_object_idset_contains(idset
, tree_id
) ||
859 got_object_idset_contains(idset_exclude
, tree_id
))
862 err
= got_object_qid_alloc(&qid
, tree_id
);
865 qid
->data
= strdup(dpath
);
866 if (qid
->data
== NULL
) {
867 err
= got_error_from_errno("strdup");
868 got_object_qid_free(qid
);
872 STAILQ_INIT(&tree_ids
);
873 STAILQ_INSERT_TAIL(&tree_ids
, qid
, entry
);
875 while (!STAILQ_EMPTY(&tree_ids
)) {
878 err
= (*cancel_cb
)(cancel_arg
);
883 qid
= STAILQ_FIRST(&tree_ids
);
884 STAILQ_REMOVE_HEAD(&tree_ids
, entry
);
887 if (got_object_idset_contains(idset
, &qid
->id
) ||
888 got_object_idset_contains(idset_exclude
, &qid
->id
)) {
890 got_object_qid_free(qid
);
894 err
= got_pack_add_object(want_meta
,
895 want_meta
? idset
: idset_exclude
,
896 &qid
->id
, path
, GOT_OBJ_TYPE_TREE
,
897 mtime
, seed
, loose_obj_only
, repo
,
898 ncolored
, nfound
, ntrees
, progress_cb
, progress_arg
, rl
);
901 got_object_qid_free(qid
);
905 err
= got_object_open_as_tree(&tree
, repo
, &qid
->id
);
908 got_object_qid_free(qid
);
912 err
= got_pack_load_tree_entries(&tree_ids
, want_meta
, idset
,
913 idset_exclude
, tree
, path
, mtime
, seed
, repo
,
914 loose_obj_only
, ncolored
, nfound
, ntrees
,
915 progress_cb
, progress_arg
, rl
,
916 cancel_cb
, cancel_arg
);
918 got_object_qid_free(qid
);
922 got_object_tree_close(tree
);
926 STAILQ_FOREACH(qid
, &tree_ids
, entry
)
928 got_object_id_queue_free(&tree_ids
);
930 got_object_tree_close(tree
);
934 static const struct got_error
*
935 load_commit(int want_meta
, struct got_object_idset
*idset
,
936 struct got_object_idset
*idset_exclude
,
937 struct got_object_id
*id
, struct got_repository
*repo
, uint32_t seed
,
938 int loose_obj_only
, int *ncolored
, int *nfound
, int *ntrees
,
939 got_pack_progress_cb progress_cb
, void *progress_arg
,
940 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
942 const struct got_error
*err
;
943 struct got_commit_object
*commit
;
945 if (got_object_idset_contains(idset
, id
) ||
946 got_object_idset_contains(idset_exclude
, id
))
949 if (loose_obj_only
) {
951 err
= search_packidx(&is_packed
, id
, repo
);
954 if (is_packed
&& want_meta
)
958 err
= got_object_open_as_commit(&commit
, repo
, id
);
962 err
= got_pack_add_object(want_meta
,
963 want_meta
? idset
: idset_exclude
, id
, "", GOT_OBJ_TYPE_COMMIT
,
964 got_object_commit_get_committer_time(commit
), seed
,
965 loose_obj_only
, repo
,
966 ncolored
, nfound
, ntrees
, progress_cb
, progress_arg
, rl
);
970 err
= got_pack_load_tree(want_meta
, idset
, idset_exclude
,
971 got_object_commit_get_tree_id(commit
),
972 "", got_object_commit_get_committer_time(commit
), seed
,
973 repo
, loose_obj_only
, ncolored
, nfound
, ntrees
,
974 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
976 got_object_commit_close(commit
);
980 static const struct got_error
*
981 load_tag(int want_meta
, struct got_object_idset
*idset
,
982 struct got_object_idset
*idset_exclude
,
983 struct got_object_id
*id
, struct got_repository
*repo
, uint32_t seed
,
984 int loose_obj_only
, int *ncolored
, int *nfound
, int *ntrees
,
985 got_pack_progress_cb progress_cb
, void *progress_arg
,
986 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
988 const struct got_error
*err
;
989 struct got_tag_object
*tag
= NULL
;
991 if (got_object_idset_contains(idset
, id
) ||
992 got_object_idset_contains(idset_exclude
, id
))
995 if (loose_obj_only
) {
997 err
= search_packidx(&is_packed
, id
, repo
);
1000 if (is_packed
&& want_meta
)
1004 err
= got_object_open_as_tag(&tag
, repo
, id
);
1008 err
= got_pack_add_object(want_meta
,
1009 want_meta
? idset
: idset_exclude
, id
, "", GOT_OBJ_TYPE_TAG
,
1010 got_object_tag_get_tagger_time(tag
), seed
, loose_obj_only
, repo
,
1011 ncolored
, nfound
, ntrees
, progress_cb
, progress_arg
, rl
);
1015 switch (got_object_tag_get_object_type(tag
)) {
1016 case GOT_OBJ_TYPE_COMMIT
:
1017 err
= load_commit(want_meta
, idset
, idset_exclude
,
1018 got_object_tag_get_object_id(tag
), repo
, seed
,
1019 loose_obj_only
, ncolored
, nfound
, ntrees
,
1020 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1022 case GOT_OBJ_TYPE_TREE
:
1023 err
= got_pack_load_tree(want_meta
, idset
, idset_exclude
,
1024 got_object_tag_get_object_id(tag
), "",
1025 got_object_tag_get_tagger_time(tag
), seed
, repo
,
1026 loose_obj_only
, ncolored
, nfound
, ntrees
,
1027 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1034 got_object_tag_close(tag
);
1038 const struct got_error
*
1039 got_pack_paint_commit(struct got_object_qid
*qid
, intptr_t color
)
1041 if (color
< 0 || color
>= COLOR_MAX
)
1042 return got_error(GOT_ERR_RANGE
);
1044 qid
->data
= (void *)color
;
1048 const struct got_error
*
1049 got_pack_queue_commit_id(struct got_object_id_queue
*ids
,
1050 struct got_object_id
*id
, intptr_t color
, struct got_repository
*repo
)
1052 const struct got_error
*err
;
1053 struct got_object_qid
*qid
;
1055 err
= got_object_qid_alloc(&qid
, id
);
1059 STAILQ_INSERT_TAIL(ids
, qid
, entry
);
1060 return got_pack_paint_commit(qid
, color
);
1063 struct append_id_arg
{
1064 struct got_object_id
**array
;
1066 struct got_object_idset
*drop
;
1067 struct got_object_idset
*skip
;
1070 static const struct got_error
*
1071 append_id(struct got_object_id
*id
, void *data
, void *arg
)
1073 struct append_id_arg
*a
= arg
;
1075 if (got_object_idset_contains(a
->skip
, id
) ||
1076 got_object_idset_contains(a
->drop
, id
))
1079 a
->array
[++a
->idx
] = got_object_id_dup(id
);
1080 if (a
->array
[a
->idx
] == NULL
)
1081 return got_error_from_errno("got_object_id_dup");
1086 static const struct got_error
*
1087 free_meta(struct got_object_id
*id
, void *data
, void *arg
)
1089 struct got_pack_meta
*meta
= data
;
1096 static const struct got_error
*
1097 queue_commit_or_tag_id(struct got_object_id
*id
, intptr_t color
,
1098 struct got_object_id_queue
*ids
, struct got_repository
*repo
)
1100 const struct got_error
*err
;
1101 struct got_tag_object
*tag
= NULL
;
1104 err
= got_object_get_type(&obj_type
, repo
, id
);
1108 if (obj_type
== GOT_OBJ_TYPE_TAG
) {
1109 err
= got_object_open_as_tag(&tag
, repo
, id
);
1112 obj_type
= got_object_tag_get_object_type(tag
);
1113 id
= got_object_tag_get_object_id(tag
);
1116 if (obj_type
== GOT_OBJ_TYPE_COMMIT
) {
1117 err
= got_pack_queue_commit_id(ids
, id
, color
, repo
);
1123 got_object_tag_close(tag
);
1127 const struct got_error
*
1128 got_pack_find_pack_for_commit_painting(struct got_packidx
**best_packidx
,
1129 struct got_object_id_queue
*ids
, int nids
, struct got_repository
*repo
)
1131 const struct got_error
*err
= NULL
;
1132 struct got_pathlist_entry
*pe
;
1133 const char *best_packidx_path
= NULL
;
1135 int ncommits_max
= 0;
1137 *best_packidx
= NULL
;
1140 * Find the largest pack which contains at least some of the
1141 * commits we are interested in.
1143 RB_FOREACH(pe
, got_pathlist_head
, &repo
->packidx_paths
) {
1144 const char *path_packidx
= pe
->path
;
1145 struct got_packidx
*packidx
;
1146 int nobj
, idx
, ncommits
= 0;
1147 struct got_object_qid
*qid
;
1149 err
= got_repo_get_packidx(&packidx
, path_packidx
, repo
);
1153 nobj
= be32toh(packidx
->hdr
.fanout_table
[0xff]);
1154 if (nobj
<= nobj_max
)
1157 STAILQ_FOREACH(qid
, ids
, entry
) {
1158 idx
= got_packidx_get_object_idx(packidx
, &qid
->id
);
1162 if (ncommits
> ncommits_max
) {
1163 best_packidx_path
= path_packidx
;
1165 ncommits_max
= ncommits
;
1169 if (best_packidx_path
&& err
== NULL
) {
1170 err
= got_repo_get_packidx(best_packidx
, best_packidx_path
,
1177 static const struct got_error
*
1178 findtwixt(struct got_object_id
***res
, int *nres
, int *ncolored
,
1179 struct got_object_id
**head
, int nhead
,
1180 struct got_object_id
**tail
, int ntail
,
1181 struct got_repository
*repo
,
1182 got_pack_progress_cb progress_cb
, void *progress_arg
,
1183 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
1185 const struct got_error
*err
= NULL
;
1186 struct got_object_id_queue ids
;
1187 struct got_object_idset
*keep
, *drop
, *skip
= NULL
;
1195 keep
= got_object_idset_alloc();
1197 return got_error_from_errno("got_object_idset_alloc");
1199 drop
= got_object_idset_alloc();
1201 err
= got_error_from_errno("got_object_idset_alloc");
1205 skip
= got_object_idset_alloc();
1207 err
= got_error_from_errno("got_object_idset_alloc");
1211 for (i
= 0; i
< nhead
; i
++) {
1212 struct got_object_id
*id
= head
[i
];
1215 err
= queue_commit_or_tag_id(id
, COLOR_KEEP
, &ids
, repo
);
1220 for (i
= 0; i
< ntail
; i
++) {
1221 struct got_object_id
*id
= tail
[i
];
1224 err
= queue_commit_or_tag_id(id
, COLOR_DROP
, &ids
, repo
);
1229 err
= got_pack_paint_commits(ncolored
, &ids
, nhead
+ ntail
,
1230 keep
, drop
, skip
, repo
, progress_cb
, progress_arg
, rl
,
1231 cancel_cb
, cancel_arg
);
1235 nkeep
= got_object_idset_num_elements(keep
);
1237 struct append_id_arg arg
;
1238 arg
.array
= calloc(nkeep
, sizeof(struct got_object_id
*));
1239 if (arg
.array
== NULL
) {
1240 err
= got_error_from_errno("calloc");
1246 err
= got_object_idset_for_each(keep
, append_id
, &arg
);
1252 *nres
= arg
.idx
+ 1;
1255 got_object_idset_free(keep
);
1256 got_object_idset_free(drop
);
1258 got_object_idset_free(skip
);
1259 got_object_id_queue_free(&ids
);
1263 static const struct got_error
*
1264 find_pack_for_enumeration(struct got_packidx
**best_packidx
,
1265 struct got_object_id
**ids
, int nids
, struct got_repository
*repo
)
1267 const struct got_error
*err
= NULL
;
1268 struct got_pathlist_entry
*pe
;
1269 const char *best_packidx_path
= NULL
;
1271 int ncommits_max
= 0;
1273 *best_packidx
= NULL
;
1276 * Find the largest pack which contains at least some of the
1277 * commits and tags we are interested in.
1279 RB_FOREACH(pe
, got_pathlist_head
, &repo
->packidx_paths
) {
1280 const char *path_packidx
= pe
->path
;
1281 struct got_packidx
*packidx
;
1282 int nobj
, i
, idx
, ncommits
= 0;
1284 err
= got_repo_get_packidx(&packidx
, path_packidx
, repo
);
1288 nobj
= be32toh(packidx
->hdr
.fanout_table
[0xff]);
1289 if (nobj
<= nobj_max
)
1292 for (i
= 0; i
< nids
; i
++) {
1293 idx
= got_packidx_get_object_idx(packidx
, ids
[i
]);
1297 if (ncommits
> ncommits_max
) {
1298 best_packidx_path
= path_packidx
;
1300 ncommits_max
= ncommits
;
1304 if (best_packidx_path
&& err
== NULL
) {
1305 err
= got_repo_get_packidx(best_packidx
, best_packidx_path
,
1312 static const struct got_error
*
1313 load_object_ids(int *ncolored
, int *nfound
, int *ntrees
,
1314 struct got_object_idset
*idset
, struct got_object_id
**theirs
, int ntheirs
,
1315 struct got_object_id
**ours
, int nours
, struct got_repository
*repo
,
1316 uint32_t seed
, int loose_obj_only
, got_pack_progress_cb progress_cb
,
1317 void *progress_arg
, struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
,
1320 const struct got_error
*err
= NULL
;
1321 struct got_object_id
**ids
= NULL
;
1322 struct got_packidx
*packidx
= NULL
;
1323 int i
, nobj
= 0, obj_type
, found_all_objects
= 0;
1324 struct got_object_idset
*idset_exclude
;
1326 idset_exclude
= got_object_idset_alloc();
1327 if (idset_exclude
== NULL
)
1328 return got_error_from_errno("got_object_idset_alloc");
1334 err
= findtwixt(&ids
, &nobj
, ncolored
, ours
, nours
, theirs
, ntheirs
,
1335 repo
, progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1339 err
= find_pack_for_enumeration(&packidx
, theirs
, ntheirs
, repo
);
1343 err
= got_pack_load_packed_object_ids(&found_all_objects
,
1344 theirs
, ntheirs
, NULL
, 0, 0, seed
, idset
, idset_exclude
,
1345 loose_obj_only
, repo
, packidx
, ncolored
, nfound
, ntrees
,
1346 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1351 for (i
= 0; i
< ntheirs
; i
++) {
1352 struct got_object_id
*id
= theirs
[i
];
1355 err
= got_object_get_type(&obj_type
, repo
, id
);
1358 if (obj_type
== GOT_OBJ_TYPE_COMMIT
) {
1359 if (!found_all_objects
) {
1360 err
= load_commit(0, idset
, idset_exclude
,
1361 id
, repo
, seed
, loose_obj_only
,
1362 ncolored
, nfound
, ntrees
,
1363 progress_cb
, progress_arg
, rl
,
1364 cancel_cb
, cancel_arg
);
1368 } else if (obj_type
== GOT_OBJ_TYPE_TAG
) {
1369 err
= load_tag(0, idset
, idset_exclude
, id
, repo
,
1370 seed
, loose_obj_only
, ncolored
, nfound
, ntrees
,
1371 progress_cb
, progress_arg
, rl
,
1372 cancel_cb
, cancel_arg
);
1378 found_all_objects
= 0;
1379 err
= find_pack_for_enumeration(&packidx
, ids
, nobj
, repo
);
1383 err
= got_pack_load_packed_object_ids(&found_all_objects
, ids
,
1384 nobj
, theirs
, ntheirs
, 1, seed
, idset
, idset_exclude
,
1385 loose_obj_only
, repo
, packidx
, ncolored
, nfound
, ntrees
,
1386 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1391 if (!found_all_objects
) {
1392 for (i
= 0; i
< nobj
; i
++) {
1393 err
= load_commit(1, idset
, idset_exclude
, ids
[i
],
1394 repo
, seed
, loose_obj_only
, ncolored
, nfound
,
1395 ntrees
, progress_cb
, progress_arg
, rl
,
1396 cancel_cb
, cancel_arg
);
1402 for (i
= 0; i
< nours
; i
++) {
1403 struct got_object_id
*id
= ours
[i
];
1404 struct got_pack_meta
*m
;
1407 m
= got_object_idset_get(idset
, id
);
1409 err
= got_object_get_type(&obj_type
, repo
, id
);
1413 obj_type
= m
->obj_type
;
1414 if (obj_type
!= GOT_OBJ_TYPE_TAG
)
1416 err
= load_tag(1, idset
, idset_exclude
, id
, repo
,
1417 seed
, loose_obj_only
, ncolored
, nfound
, ntrees
,
1418 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1423 for (i
= 0; i
< nobj
; i
++) {
1427 got_object_idset_free(idset_exclude
);
/*
 * Write len bytes from buf to fd while folding the same bytes into the
 * running hash in ctx.
 *
 * The hash is updated before the write is attempted, so ctx has already
 * absorbed the data even when the write reports an error.  The result of
 * got_poll_write_full() is returned unchanged.
 */
static const struct got_error *
hwrite(int fd, const void *buf, off_t len, struct got_hash *ctx)
{
	const struct got_error *err;

	got_hash_update(ctx, buf, len);
	err = got_poll_write_full(fd, buf, len);
	return err;
}
1438 static const struct got_error
*
1439 hcopy(FILE *fsrc
, int fd_dst
, off_t len
, struct got_hash
*ctx
)
1441 const struct got_error
*err
;
1442 unsigned char buf
[65536];
1446 while (remain
> 0) {
1447 size_t copylen
= MIN(sizeof(buf
), remain
);
1448 n
= fread(buf
, 1, copylen
, fsrc
);
1450 return got_ferror(fsrc
, GOT_ERR_IO
);
1451 got_hash_update(ctx
, buf
, copylen
);
1452 err
= got_poll_write_full(fd_dst
, buf
, copylen
);
1461 static const struct got_error
*
1462 hcopy_mmap(uint8_t *src
, off_t src_offset
, size_t src_size
,
1463 int fd
, off_t len
, struct got_hash
*ctx
)
1465 if (src_offset
+ len
> src_size
)
1466 return got_error(GOT_ERR_RANGE
);
1468 got_hash_update(ctx
, src
+ src_offset
, len
);
1469 return got_poll_write_full(fd
, src
+ src_offset
, len
);
/*
 * putbe32: takes an output buffer b and a 32-bit value n.
 * genpack() calls it to fill a buffer of which 4 bytes are then written
 * with hwrite().
 * NOTE(review): the name suggests n is stored at b in big-endian byte
 * order; the body is not visible in this view -- confirm.
 */
1473 putbe32(char *b
, uint32_t n
)
/*
 * Comparison callback over two pointers to 'struct got_pack_meta *'.
 * The visible comparisons are, in order:
 *  - mtime of each entry's head (the entry itself when ->head is NULL),
 *  - nchain, where the difference a->nchain - b->nchain is returned,
 *  - the entries' own mtime,
 *  - object ID, via got_object_id_cmp().
 * NOTE(review): the values returned by the mtime comparisons, and any
 * comparison between the head-mtime and nchain steps, are not visible in
 * this view -- confirm the resulting sort direction in the full file.
 */
1482 write_order_cmp(const void *pa
, const void *pb
)
1484 struct got_pack_meta
*a
, *b
, *ahd
, *bhd
;
1486 a
= *(struct got_pack_meta
**)pa
;
1487 b
= *(struct got_pack_meta
**)pb
;
/* Use the entry's head for ordering, or the entry itself if it has none. */
1488 ahd
= (a
->head
== NULL
) ? a
: a
->head
;
1489 bhd
= (b
->head
== NULL
) ? b
: b
->head
;
1490 if (bhd
->mtime
< ahd
->mtime
)
1492 if (bhd
->mtime
> ahd
->mtime
)
1498 if (a
->nchain
!= b
->nchain
)
1499 return a
->nchain
- b
->nchain
;
1500 if (a
->mtime
< b
->mtime
)
1502 if (a
->mtime
> b
->mtime
)
/* Final tie-break on object ID. */
1504 return got_object_id_cmp(&a
->id
, &b
->id
);
/*
 * Comparison callback over two pointers to 'struct got_pack_meta *' which
 * compares the entries' reused_delta_offset fields. genpack() passes it
 * to qsort() to order the 'reuse' array before writing it.
 * NOTE(review): the values returned for the less-than and greater-than
 * cases are not visible in this view -- confirm.
 */
1508 reuse_write_order_cmp(const void *pa
, const void *pb
)
1510 struct got_pack_meta
*a
, *b
;
1512 a
= *(struct got_pack_meta
**)pa
;
1513 b
= *(struct got_pack_meta
**)pb
;
1515 if (a
->reused_delta_offset
< b
->reused_delta_offset
)
1517 if (a
->reused_delta_offset
> b
->reused_delta_offset
)
/*
 * Encode an object header for obj_type and len into hdr.
 * The first byte holds obj_type shifted left by 4, OR-ed with the low
 * 4 bits of len. While len is non-zero, each loop round sets
 * GOT_DELTA_SIZE_MORE on the previous byte, stores
 * len & GOT_DELTA_SIZE_VAL_MASK in the next byte and shifts len right by
 * GOT_DELTA_SIZE_SHIFT.
 * A GOT_ERR_NO_SPACE error can be returned from inside the loop.
 * NOTE(review): the condition guarding GOT_ERR_NO_SPACE (presumably a
 * check of i against bufsize) and the assignment to *hdrlen are not
 * visible in this view -- confirm.
 */
1522 static const struct got_error
*
1523 packhdr(int *hdrlen
, char *hdr
, size_t bufsize
, int obj_type
, size_t len
)
1529 hdr
[0] = obj_type
<< 4;
1530 hdr
[0] |= len
& 0xf;
1532 for (i
= 1; len
!= 0; i
++){
1534 return got_error(GOT_ERR_NO_SPACE
);
/* Mark the previous byte as continued, then emit the next group. */
1535 hdr
[i
- 1] |= GOT_DELTA_SIZE_MORE
;
1536 hdr
[i
] = len
& GOT_DELTA_SIZE_VAL_MASK
;
1537 len
>>= GOT_DELTA_SIZE_SHIFT
;
/*
 * Encode the offset off into hdr as a variable-length byte sequence.
 * Groups are first collected into rbuf, least significant first: rbuf[0]
 * is off & GOT_DELTA_SIZE_VAL_MASK. After each shift by
 * GOT_DELTA_SIZE_SHIFT the remaining value is decremented before it is
 * masked, and the resulting byte is tagged with GOT_DELTA_SIZE_MORE.
 * rbuf is then copied into hdr in reverse order.
 * deltahdr() adds this function's return value to its header length.
 * NOTE(review): the return value is presumably the number of bytes
 * stored in hdr; the return statement and the size of rbuf are not
 * visible in this view -- confirm.
 */
1545 packoff(char *hdr
, off_t off
)
1550 rbuf
[0] = off
& GOT_DELTA_SIZE_VAL_MASK
;
1551 for (i
= 1; (off
>>= GOT_DELTA_SIZE_SHIFT
) != 0; i
++) {
1552 rbuf
[i
] = (--off
& GOT_DELTA_SIZE_VAL_MASK
) |
1553 GOT_DELTA_SIZE_MORE
;
/* Emit the collected bytes most-significant group first. */
1558 hdr
[j
++] = rbuf
[--i
];
/*
 * Write the pack entry header for the deltified object m to packfd,
 * hashing the bytes via ctx and adding the number of bytes written to
 * *packfile_size.
 *
 * If the delta base m->prev has a non-zero pack offset and force_refdelta
 * is not set, a GOT_OBJ_TYPE_OFFSET_DELTA header is written, followed by
 * the distance m->off - m->prev->off as encoded by packoff().
 * The other visible path writes a GOT_OBJ_TYPE_REF_DELTA header followed
 * by digest_len bytes of the base object's ID hash.
 * NOTE(review): the 'else' joining the two paths and the error checks
 * after each call are not visible in this view -- confirm.
 */
1562 static const struct got_error
*
1563 deltahdr(off_t
*packfile_size
, struct got_hash
*ctx
, int packfd
,
1564 int force_refdelta
, struct got_pack_meta
*m
)
1566 const struct got_error
*err
;
1569 size_t digest_len
= got_hash_digest_length(m
->prev
->id
.algo
);
1571 if (m
->prev
->off
!= 0 && !force_refdelta
) {
1572 err
= packhdr(&nh
, buf
, sizeof(buf
),
1573 GOT_OBJ_TYPE_OFFSET_DELTA
, m
->delta_len
);
/* Append the encoded distance back to the base object. */
1576 nh
+= packoff(buf
+ nh
, m
->off
- m
->prev
->off
);
1577 err
= hwrite(packfd
, buf
, nh
, ctx
);
1580 *packfile_size
+= nh
;
1582 err
= packhdr(&nh
, buf
, sizeof(buf
),
1583 GOT_OBJ_TYPE_REF_DELTA
, m
->delta_len
);
1586 err
= hwrite(packfd
, buf
, nh
, ctx
);
1589 *packfile_size
+= nh
;
/* A ref-delta names its base by object ID hash. */
1590 err
= hwrite(packfd
, m
->prev
->id
.hash
, digest_len
, ctx
);
1593 *packfile_size
+= digest_len
;
/*
 * Write the object described by m to packfd and advance *packfile_size
 * by the number of bytes written. m->off is set to the value of
 * *packfile_size on entry.
 *
 * Visible cases:
 *  - m->delta_len == 0: the object is opened with got_object_raw_open(),
 *    a header for m->obj_type and raw->size is produced by packhdr(), and
 *    the contents are deflated either from memory (raw->f == NULL, via
 *    got_deflate_to_fd_mmap()) or from raw->f after seeking to
 *    raw->hdrlen (via got_deflate_to_fd()).
 *  - m->delta_buf set: deltahdr() followed by
 *    m->delta_compressed_len bytes from m->delta_buf; the pointer is set
 *    to NULL afterwards.
 *  - delta_cache_map set: deltahdr() followed by hcopy_mmap() from the
 *    mapping at delta_offset.
 *  - otherwise: delta_cache is positioned at delta_offset with fseeko(),
 *    then deltahdr() and hcopy() are used.
 *
 * delta_offset is m->reused_delta_offset when that is non-zero; the
 * other visible assignment uses m->delta_offset.
 * NOTE(review): error checks, the 'else' keywords and the cleanup label
 * are not visible in this view -- confirm control flow in the full file.
 */
1599 static const struct got_error
*
1600 write_packed_object(off_t
*packfile_size
, int packfd
,
1601 FILE *delta_cache
, uint8_t *delta_cache_map
, size_t delta_cache_size
,
1602 struct got_pack_meta
*m
, int *outfd
, struct got_hash
*ctx
,
1603 struct got_repository
*repo
, int force_refdelta
)
1605 const struct got_error
*err
= NULL
;
1606 struct got_deflate_checksum csum
;
1609 struct got_raw_object
*raw
= NULL
;
1610 off_t outlen
, delta_offset
;
/* Deflated output is checksummed into the pack's hash context. */
1612 memset(&csum
, 0, sizeof(csum
));
1613 csum
.output_ctx
= ctx
;
1615 if (m
->reused_delta_offset
)
1616 delta_offset
= m
->reused_delta_offset
;
1618 delta_offset
= m
->delta_offset
;
/* Record where this object starts within the pack being written. */
1620 m
->off
= *packfile_size
;
1621 if (m
->delta_len
== 0) {
1622 err
= got_object_raw_open(&raw
, outfd
, repo
, &m
->id
);
1625 err
= packhdr(&nh
, buf
, sizeof(buf
),
1626 m
->obj_type
, raw
->size
);
1629 err
= hwrite(packfd
, buf
, nh
, ctx
);
1632 *packfile_size
+= nh
;
1633 if (raw
->f
== NULL
) {
1634 err
= got_deflate_to_fd_mmap(&outlen
,
1635 raw
->data
+ raw
->hdrlen
, 0, raw
->size
,
1640 if (fseeko(raw
->f
, raw
->hdrlen
, SEEK_SET
)
1642 err
= got_error_from_errno("fseeko");
1645 err
= got_deflate_to_fd(&outlen
, raw
->f
,
1646 raw
->size
, packfd
, &csum
);
1650 *packfile_size
+= outlen
;
1651 got_object_raw_close(raw
);
1653 } else if (m
->delta_buf
) {
1654 err
= deltahdr(packfile_size
, ctx
, packfd
, force_refdelta
, m
);
1657 err
= hwrite(packfd
, m
->delta_buf
,
1658 m
->delta_compressed_len
, ctx
);
1661 *packfile_size
+= m
->delta_compressed_len
;
1663 m
->delta_buf
= NULL
;
1664 } else if (delta_cache_map
) {
1665 err
= deltahdr(packfile_size
, ctx
, packfd
, force_refdelta
, m
);
1668 err
= hcopy_mmap(delta_cache_map
, delta_offset
,
1669 delta_cache_size
, packfd
, m
->delta_compressed_len
,
1673 *packfile_size
+= m
->delta_compressed_len
;
1675 if (fseeko(delta_cache
, delta_offset
, SEEK_SET
) == -1) {
1676 err
= got_error_from_errno("fseeko");
1679 err
= deltahdr(packfile_size
, ctx
, packfd
, force_refdelta
, m
);
1682 err
= hcopy(delta_cache
, packfd
,
1683 m
->delta_compressed_len
, ctx
);
1686 *packfile_size
+= m
->delta_compressed_len
;
1690 got_object_raw_close(raw
);
/*
 * Write a pack file to packfd containing the ndeltify objects in
 * 'deltify' followed by the nreuse objects in 'reuse', and store the
 * resulting pack hash in *pack_hash.
 *
 * Visible steps:
 *  - Initialise the hash context with the repository's object format and
 *    zero *pack_hash.
 *  - Unless GOT_PACK_NO_MMAP is defined, dup() the delta cache's file
 *    descriptor and try to map the file read-only. An mmap() failure
 *    with ENOMEM falls back on stdio; other mmap() errors are reported.
 *  - Write "PACK", GOT_PACKFILE_VERSION and the object count
 *    (ndeltify + nreuse) through hwrite().
 *  - Sort 'deltify' and write each entry with write_packed_object(),
 *    reporting progress before each one.
 *  - Sort 'reuse' with reuse_write_order_cmp. If there are entries to
 *    reuse and reuse_pack has no mapping, dup() its fd and fdopen() it.
 *    Each entry is then written with write_packed_object(), reading from
 *    reuse_pack->map or the stdio stream.
 *  - Finalise the hash into *pack_hash and append digest_len bytes of it
 *    with got_poll_write_full() (not via hwrite(), so the trailer itself
 *    is not hashed).
 *  - Report final progress and release outfd, the mapping, the dup'ed
 *    descriptor and the stdio stream.
 *
 * NOTE(review): in the cleanup section the munmap() failure assignment
 * is not guarded by 'err == NULL', unlike the neighbouring close() and
 * fclose() checks, so it can overwrite an earlier error.
 * NOTE(review): error checks, cancellation checks and the assignment of
 * 'm' inside the loops are not visible in this view.
 */
1694 static const struct got_error
*
1695 genpack(struct got_object_id
*pack_hash
, int packfd
,
1696 struct got_pack
*reuse_pack
, FILE *delta_cache
,
1697 struct got_pack_meta
**deltify
, int ndeltify
,
1698 struct got_pack_meta
**reuse
, int nreuse
,
1699 int ncolored
, int nfound
, int ntrees
, int nours
,
1700 struct got_repository
*repo
, int force_refdelta
,
1701 got_pack_progress_cb progress_cb
, void *progress_arg
,
1702 struct got_ratelimit
*rl
,
1703 got_cancel_cb cancel_cb
, void *cancel_arg
)
1705 const struct got_error
*err
= NULL
;
1707 struct got_hash ctx
;
1708 struct got_pack_meta
*m
;
1710 off_t packfile_size
= 0;
1712 int delta_cache_fd
= -1;
1713 uint8_t *delta_cache_map
= NULL
;
1714 size_t delta_cache_size
= 0;
1715 FILE *packfile
= NULL
;
1716 enum got_hash_algorithm algo
;
1719 algo
= got_repo_get_object_format(repo
);
1720 digest_len
= got_hash_digest_length(algo
);
1721 got_hash_init(&ctx
, algo
);
1723 memset(pack_hash
, 0, sizeof(*pack_hash
));
1724 pack_hash
->algo
= algo
;
1726 #ifndef GOT_PACK_NO_MMAP
1727 delta_cache_fd
= dup(fileno(delta_cache
));
1728 if (delta_cache_fd
!= -1) {
1730 if (fstat(delta_cache_fd
, &sb
) == -1) {
1731 err
= got_error_from_errno("fstat");
/* Only map non-empty files whose size fits in a size_t. */
1734 if (sb
.st_size
> 0 && sb
.st_size
<= SIZE_MAX
) {
1735 delta_cache_map
= mmap(NULL
, sb
.st_size
,
1736 PROT_READ
, MAP_PRIVATE
, delta_cache_fd
, 0);
1737 if (delta_cache_map
== MAP_FAILED
) {
1738 if (errno
!= ENOMEM
) {
1739 err
= got_error_from_errno("mmap");
1742 delta_cache_map
= NULL
; /* fallback on stdio */
1744 delta_cache_size
= (size_t)sb
.st_size
;
/* Pack header: signature, version, number of objects. */
1748 err
= hwrite(packfd
, "PACK", 4, &ctx
);
1751 putbe32(buf
, GOT_PACKFILE_VERSION
);
1752 err
= hwrite(packfd
, buf
, 4, &ctx
);
1755 putbe32(buf
, ndeltify
+ nreuse
);
1756 err
= hwrite(packfd
, buf
, 4, &ctx
);
1760 qsort(deltify
, ndeltify
, sizeof(struct got_pack_meta
*),
1762 for (i
= 0; i
< ndeltify
; i
++) {
1763 err
= got_pack_report_progress(progress_cb
, progress_arg
, rl
,
1764 ncolored
, nfound
, ntrees
, packfile_size
, nours
,
1765 ndeltify
+ nreuse
, ndeltify
+ nreuse
, i
, 0);
1769 err
= write_packed_object(&packfile_size
, packfd
,
1770 delta_cache
, delta_cache_map
, delta_cache_size
,
1771 m
, &outfd
, &ctx
, repo
, force_refdelta
);
1776 qsort(reuse
, nreuse
, sizeof(struct got_pack_meta
*),
1777 reuse_write_order_cmp
);
/* Without a mapping of the reused pack, read it through stdio instead. */
1778 if (nreuse
> 0 && reuse_pack
->map
== NULL
) {
1779 int fd
= dup(reuse_pack
->fd
);
1781 err
= got_error_from_errno("dup");
1784 packfile
= fdopen(fd
, "r");
1785 if (packfile
== NULL
) {
1786 err
= got_error_from_errno("fdopen");
1791 for (i
= 0; i
< nreuse
; i
++) {
1792 err
= got_pack_report_progress(progress_cb
, progress_arg
, rl
,
1793 ncolored
, nfound
, ntrees
, packfile_size
, nours
,
1794 ndeltify
+ nreuse
, ndeltify
+ nreuse
, ndeltify
+ i
, 0);
1798 err
= write_packed_object(&packfile_size
, packfd
,
1799 packfile
, reuse_pack
->map
, reuse_pack
->filesize
,
1800 m
, &outfd
, &ctx
, repo
, force_refdelta
);
/* Trailer: the hash of everything written so far. */
1805 got_hash_final_object_id(&ctx
, pack_hash
);
1806 err
= got_poll_write_full(packfd
, pack_hash
->hash
, digest_len
);
1809 packfile_size
+= digest_len
;
1810 packfile_size
+= sizeof(struct got_packfile_hdr
);
1812 err
= progress_cb(progress_arg
, ncolored
, nfound
, ntrees
,
1813 packfile_size
, nours
, ndeltify
+ nreuse
,
1814 ndeltify
+ nreuse
, ndeltify
+ nreuse
, 1);
1819 if (outfd
!= -1 && close(outfd
) == -1 && err
== NULL
)
1820 err
= got_error_from_errno("close");
/* NOTE(review): no 'err == NULL' guard here; may clobber an earlier error. */
1821 if (delta_cache_map
&& munmap(delta_cache_map
, delta_cache_size
) == -1)
1822 err
= got_error_from_errno("munmap");
1823 if (delta_cache_fd
!= -1 && close(delta_cache_fd
) == -1 && err
== NULL
)
1824 err
= got_error_from_errno("close");
1825 if (packfile
&& fclose(packfile
) == EOF
&& err
== NULL
)
1826 err
= got_error_from_errno("fclose");
/*
 * Callback passed to got_object_idset_for_each() by got_pack_create().
 * 'data' is the struct got_pack_meta stored for the ID and 'arg' is a
 * struct got_pack_metavec. Entries whose reused_delta_offset is zero are
 * appended to the vector with got_pack_add_meta().
 * NOTE(review): the statement taken when reused_delta_offset is non-zero
 * is not visible in this view; presumably such entries are skipped
 * without error -- confirm.
 */
1830 static const struct got_error
*
1831 add_meta_idset_cb(struct got_object_id
*id
, void *data
, void *arg
)
1833 struct got_pack_meta
*m
= data
;
1834 struct got_pack_metavec
*v
= arg
;
1836 if (m
->reused_delta_offset
!= 0)
1839 return got_pack_add_meta(m
, v
);
/*
 * Create a pack file on packfd and store its hash in *packhash.
 * delta_cache is a stdio stream used as scratch storage for deltas.
 *
 * Visible steps:
 *  - Pick a random seed with arc4random() and allocate an object ID set.
 *  - load_object_ids() fills the set from the 'theirs' and 'ours' ID
 *    arrays and updates the ncolored/nfound/ntrees counters.
 *  - If the set is empty and allow_empty is not set, fail with
 *    GOT_ERR_CANNOT_PACK.
 *  - Allocate reuse.meta and call got_pack_search_deltas(); when it
 *    yields both a pack index and a pack, pin that pack in the
 *    repository with got_repo_pin_pack().
 *  - Seek delta_cache to its end.
 *  - Size deltify.meta to (number of IDs in the set - reuse.nmeta) and
 *    populate it via add_meta_idset_cb.
 *  - If there is anything to deltify, run pick_deltas(); delta_cache is
 *    flushed with fflush().
 *  - Report a 1-byte packfile write through progress_cb, re-fetch the
 *    pinned pack, and call genpack() to emit the pack.
 *  - Release the meta arrays, the per-ID metadata, the ID set, and unpin
 *    the pack.
 *
 * NOTE(review): error checks, guards around progress_cb, and the
 * conditions surrounding the reuse search are not visible in this view
 * -- confirm control flow in the full file.
 */
1842 const struct got_error
*
1843 got_pack_create(struct got_object_id
*packhash
, int packfd
, FILE *delta_cache
,
1844 struct got_object_id
**theirs
, int ntheirs
,
1845 struct got_object_id
**ours
, int nours
,
1846 struct got_repository
*repo
, int loose_obj_only
, int allow_empty
,
1847 int force_refdelta
, got_pack_progress_cb progress_cb
, void *progress_arg
,
1848 struct got_ratelimit
*rl
, got_cancel_cb cancel_cb
, void *cancel_arg
)
1850 const struct got_error
*err
;
1851 struct got_object_idset
*idset
;
1852 struct got_packidx
*reuse_packidx
= NULL
;
1853 struct got_pack
*reuse_pack
= NULL
;
1854 struct got_pack_metavec deltify
, reuse
;
1855 int ncolored
= 0, nfound
= 0, ntrees
= 0;
1859 seed
= arc4random();
1861 memset(&deltify
, 0, sizeof(deltify
));
1862 memset(&reuse
, 0, sizeof(reuse
));
1864 idset
= got_object_idset_alloc();
1866 return got_error_from_errno("got_object_idset_alloc");
1868 err
= load_object_ids(&ncolored
, &nfound
, &ntrees
, idset
, theirs
,
1869 ntheirs
, ours
, nours
, repo
, seed
, loose_obj_only
,
1870 progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1875 err
= progress_cb(progress_arg
, ncolored
, nfound
, ntrees
,
1876 0L, nours
, got_object_idset_num_elements(idset
), 0, 0, 0);
1881 if (got_object_idset_num_elements(idset
) == 0 && !allow_empty
) {
1882 err
= got_error(GOT_ERR_CANNOT_PACK
);
1887 reuse
.meta
= calloc(reuse
.metasz
,
1888 sizeof(struct got_pack_meta
*));
1889 if (reuse
.meta
== NULL
) {
1890 err
= got_error_from_errno("calloc");
1894 err
= got_pack_search_deltas(&reuse_packidx
, &reuse_pack
,
1895 &reuse
, idset
, ncolored
, nfound
, ntrees
, nours
,
1896 repo
, progress_cb
, progress_arg
, rl
, cancel_cb
, cancel_arg
);
1900 if (reuse_packidx
&& reuse_pack
) {
1901 err
= got_repo_pin_pack(repo
, reuse_packidx
, reuse_pack
);
1906 if (fseeko(delta_cache
, 0L, SEEK_END
) == -1) {
1907 err
= got_error_from_errno("fseeko");
/* Everything in the set that is not a reused delta gets deltified. */
1911 ndeltify
= got_object_idset_num_elements(idset
) - reuse
.nmeta
;
1913 deltify
.meta
= calloc(ndeltify
, sizeof(struct got_pack_meta
*));
1914 if (deltify
.meta
== NULL
) {
1915 err
= got_error_from_errno("calloc");
1918 deltify
.metasz
= ndeltify
;
1920 err
= got_object_idset_for_each(idset
, add_meta_idset_cb
,
1924 if (deltify
.nmeta
> 0) {
1925 err
= pick_deltas(deltify
.meta
, deltify
.nmeta
,
1926 ncolored
, nfound
, ntrees
, nours
, reuse
.nmeta
,
1927 delta_cache
, repo
, progress_cb
, progress_arg
, rl
,
1928 cancel_cb
, cancel_arg
);
1934 if (fflush(delta_cache
) == EOF
) {
1935 err
= got_error_from_errno("fflush");
1941 * Report a 1-byte packfile write to indicate we are about
1942 * to start sending packfile data. gotd(8) needs this.
1944 err
= progress_cb(progress_arg
, ncolored
, nfound
, ntrees
,
1945 1 /* packfile_size */, nours
,
1946 got_object_idset_num_elements(idset
),
1947 deltify
.nmeta
+ reuse
.nmeta
, 0, 0);
1952 /* Pinned pack may have moved to different cache slot. */
1953 reuse_pack
= got_repo_get_pinned_pack(repo
);
1955 err
= genpack(packhash
, packfd
, reuse_pack
, delta_cache
, deltify
.meta
,
1956 deltify
.nmeta
, reuse
.meta
, reuse
.nmeta
, ncolored
, nfound
, ntrees
,
1957 nours
, repo
, force_refdelta
, progress_cb
, progress_arg
, rl
,
1958 cancel_cb
, cancel_arg
);
1962 free_nmeta(deltify
.meta
, deltify
.nmeta
);
1963 free_nmeta(reuse
.meta
, reuse
.nmeta
);
1964 got_object_idset_for_each(idset
, free_meta
, NULL
);
1965 got_object_idset_free(idset
);
1966 got_repo_unpin_pack(repo
);