1 #define USE_THE_REPOSITORY_VARIABLE
4 #include "environment.h"
17 #include "csum-file.h"
20 #include "run-command.h"
22 #include "object-file.h"
23 #include "object-name.h"
24 #include "object-store-ll.h"
26 #include "commit-reach.h"
30 #define PACK_ID_BITS 16
31 #define MAX_PACK_ID ((1<<PACK_ID_BITS)-1)
33 #define MAX_DEPTH ((1<<DEPTH_BITS)-1)
36 * We abuse the setuid bit on directories to mean "do not delta".
38 #define NO_DELTA S_ISUID
41 * The amount of additional space required in order to write an object into the
42 * current pack. This is the hash lengths at the end of the pack, plus the
43 * length of one object ID.
45 #define PACK_SIZE_THRESHOLD (the_hash_algo->rawsz * 3)
48 struct pack_idx_entry idx
;
49 struct hashmap_entry ent
;
50 uint32_t type
: TYPE_BITS
,
51 pack_id
: PACK_ID_BITS
,
55 static int object_entry_hashcmp(const void *map_data UNUSED
,
56 const struct hashmap_entry
*eptr
,
57 const struct hashmap_entry
*entry_or_key
,
60 const struct object_id
*oid
= keydata
;
61 const struct object_entry
*e1
, *e2
;
63 e1
= container_of(eptr
, const struct object_entry
, ent
);
65 return oidcmp(&e1
->idx
.oid
, oid
);
67 e2
= container_of(entry_or_key
, const struct object_entry
, ent
);
68 return oidcmp(&e1
->idx
.oid
, &e2
->idx
.oid
);
71 struct object_entry_pool
{
72 struct object_entry_pool
*next_pool
;
73 struct object_entry
*next_free
;
74 struct object_entry
*end
;
75 struct object_entry entries
[FLEX_ARRAY
]; /* more */
80 struct object_id
*oids
[1024];
81 struct object_entry
*marked
[1024];
82 struct mark_set
*sets
[1024];
95 struct atom_str
*next_atom
;
96 unsigned short str_len
;
97 char str_dat
[FLEX_ARRAY
]; /* more */
102 struct tree_content
*tree
;
103 struct atom_str
*name
;
104 struct tree_entry_ms
{
106 struct object_id oid
;
110 struct tree_content
{
111 unsigned int entry_capacity
; /* must match avail_tree_content */
112 unsigned int entry_count
;
113 unsigned int delta_depth
;
114 struct tree_entry
*entries
[FLEX_ARRAY
]; /* more */
117 struct avail_tree_content
{
118 unsigned int entry_capacity
; /* must match tree_content */
119 struct avail_tree_content
*next_avail
;
123 struct branch
*table_next_branch
;
124 struct branch
*active_next_branch
;
126 struct tree_entry branch_tree
;
127 uintmax_t last_commit
;
131 unsigned pack_id
: PACK_ID_BITS
;
132 struct object_id oid
;
136 struct tag
*next_tag
;
138 unsigned int pack_id
;
139 struct object_id oid
;
143 struct hash_list
*next
;
144 struct object_id oid
;
149 WHENSPEC_RAW_PERMISSIVE
,
154 struct recent_command
{
155 struct recent_command
*prev
;
156 struct recent_command
*next
;
160 typedef void (*mark_set_inserter_t
)(struct mark_set
**s
, struct object_id
*oid
, uintmax_t mark
);
161 typedef void (*each_mark_fn_t
)(uintmax_t mark
, void *obj
, void *cbp
);
163 /* Configured limits on output */
164 static unsigned long max_depth
= 50;
165 static off_t max_packsize
;
166 static int unpack_limit
= 100;
167 static int force_update
;
169 /* Stats and misc. counters */
170 static uintmax_t alloc_count
;
171 static uintmax_t marks_set_count
;
172 static uintmax_t object_count_by_type
[1 << TYPE_BITS
];
173 static uintmax_t duplicate_count_by_type
[1 << TYPE_BITS
];
174 static uintmax_t delta_count_by_type
[1 << TYPE_BITS
];
175 static uintmax_t delta_count_attempts_by_type
[1 << TYPE_BITS
];
176 static unsigned long object_count
;
177 static unsigned long branch_count
;
178 static unsigned long branch_load_count
;
180 static FILE *pack_edges
;
181 static unsigned int show_stats
= 1;
182 static int global_argc
;
183 static const char **global_argv
;
184 static const char *global_prefix
;
187 static struct mem_pool fi_mem_pool
= {
188 .block_alloc
= 2*1024*1024 - sizeof(struct mp_block
),
191 /* Atom management */
192 static unsigned int atom_table_sz
= 4451;
193 static unsigned int atom_cnt
;
194 static struct atom_str
**atom_table
;
196 /* The .pack file being generated */
197 static struct pack_idx_option pack_idx_opts
;
198 static unsigned int pack_id
;
199 static struct hashfile
*pack_file
;
200 static struct packed_git
*pack_data
;
201 static struct packed_git
**all_packs
;
202 static off_t pack_size
;
204 /* Table of objects we've written. */
205 static unsigned int object_entry_alloc
= 5000;
206 static struct object_entry_pool
*blocks
;
207 static struct hashmap object_table
;
208 static struct mark_set
*marks
;
209 static char *export_marks_file
;
210 static char *import_marks_file
;
211 static int import_marks_file_from_stream
;
212 static int import_marks_file_ignore_missing
;
213 static int import_marks_file_done
;
214 static int relative_marks_paths
;
217 static struct last_object last_blob
= {
221 /* Tree management */
222 static unsigned int tree_entry_alloc
= 1000;
223 static void *avail_tree_entry
;
224 static unsigned int avail_tree_table_sz
= 100;
225 static struct avail_tree_content
**avail_tree_table
;
226 static size_t tree_entry_allocd
;
227 static struct strbuf old_tree
= STRBUF_INIT
;
228 static struct strbuf new_tree
= STRBUF_INIT
;
231 static unsigned long max_active_branches
= 5;
232 static unsigned long cur_active_branches
;
233 static unsigned long branch_table_sz
= 1039;
234 static struct branch
**branch_table
;
235 static struct branch
*active_branches
;
238 static struct tag
*first_tag
;
239 static struct tag
*last_tag
;
241 /* Input stream parsing */
242 static whenspec_type whenspec
= WHENSPEC_RAW
;
243 static struct strbuf command_buf
= STRBUF_INIT
;
244 static int unread_command_buf
;
245 static struct recent_command cmd_hist
= {
249 static struct recent_command
*cmd_tail
= &cmd_hist
;
250 static struct recent_command
*rc_free
;
251 static unsigned int cmd_save
= 100;
252 static uintmax_t next_mark
;
253 static struct strbuf new_data
= STRBUF_INIT
;
254 static int seen_data_command
;
255 static int require_explicit_termination
;
256 static int allow_unsafe_features
;
258 /* Signal handling */
259 static volatile sig_atomic_t checkpoint_requested
;
261 /* Submodule marks */
262 static struct string_list sub_marks_from
= STRING_LIST_INIT_DUP
;
263 static struct string_list sub_marks_to
= STRING_LIST_INIT_DUP
;
264 static kh_oid_map_t
*sub_oid_map
;
266 /* Where to write output of cat-blob commands */
267 static int cat_blob_fd
= STDOUT_FILENO
;
269 static void parse_argv(void);
270 static void parse_get_mark(const char *p
);
271 static void parse_cat_blob(const char *p
);
272 static void parse_ls(const char *p
, struct branch
*b
);
274 static void for_each_mark(struct mark_set
*m
, uintmax_t base
, each_mark_fn_t callback
, void *p
)
278 for (k
= 0; k
< 1024; k
++) {
280 for_each_mark(m
->data
.sets
[k
], base
+ (k
<< m
->shift
), callback
, p
);
283 for (k
= 0; k
< 1024; k
++) {
284 if (m
->data
.marked
[k
])
285 callback(base
+ k
, m
->data
.marked
[k
], p
);
290 static void dump_marks_fn(uintmax_t mark
, void *object
, void *cbp
) {
291 struct object_entry
*e
= object
;
294 fprintf(f
, ":%" PRIuMAX
" %s\n", mark
, oid_to_hex(&e
->idx
.oid
));
297 static void write_branch_report(FILE *rpt
, struct branch
*b
)
299 fprintf(rpt
, "%s:\n", b
->name
);
301 fprintf(rpt
, " status :");
303 fputs(" active", rpt
);
304 if (b
->branch_tree
.tree
)
305 fputs(" loaded", rpt
);
306 if (is_null_oid(&b
->branch_tree
.versions
[1].oid
))
307 fputs(" dirty", rpt
);
310 fprintf(rpt
, " tip commit : %s\n", oid_to_hex(&b
->oid
));
311 fprintf(rpt
, " old tree : %s\n",
312 oid_to_hex(&b
->branch_tree
.versions
[0].oid
));
313 fprintf(rpt
, " cur tree : %s\n",
314 oid_to_hex(&b
->branch_tree
.versions
[1].oid
));
315 fprintf(rpt
, " commit clock: %" PRIuMAX
"\n", b
->last_commit
);
317 fputs(" last pack : ", rpt
);
318 if (b
->pack_id
< MAX_PACK_ID
)
319 fprintf(rpt
, "%u", b
->pack_id
);
325 static void write_crash_report(const char *err
)
327 char *loc
= git_pathdup("fast_import_crash_%"PRIuMAX
, (uintmax_t) getpid());
328 FILE *rpt
= fopen(loc
, "w");
331 struct recent_command
*rc
;
334 error_errno("can't write crash report %s", loc
);
339 fprintf(stderr
, "fast-import: dumping crash report to %s\n", loc
);
341 fprintf(rpt
, "fast-import crash report:\n");
342 fprintf(rpt
, " fast-import process: %"PRIuMAX
"\n", (uintmax_t) getpid());
343 fprintf(rpt
, " parent process : %"PRIuMAX
"\n", (uintmax_t) getppid());
344 fprintf(rpt
, " at %s\n", show_date(time(NULL
), 0, DATE_MODE(ISO8601
)));
347 fputs("fatal: ", rpt
);
352 fputs("Most Recent Commands Before Crash\n", rpt
);
353 fputs("---------------------------------\n", rpt
);
354 for (rc
= cmd_hist
.next
; rc
!= &cmd_hist
; rc
= rc
->next
) {
355 if (rc
->next
== &cmd_hist
)
364 fputs("Active Branch LRU\n", rpt
);
365 fputs("-----------------\n", rpt
);
366 fprintf(rpt
, " active_branches = %lu cur, %lu max\n",
368 max_active_branches
);
370 fputs(" pos clock name\n", rpt
);
371 fputs(" ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~\n", rpt
);
372 for (b
= active_branches
, lu
= 0; b
; b
= b
->active_next_branch
)
373 fprintf(rpt
, " %2lu) %6" PRIuMAX
" %s\n",
374 ++lu
, b
->last_commit
, b
->name
);
377 fputs("Inactive Branches\n", rpt
);
378 fputs("-----------------\n", rpt
);
379 for (lu
= 0; lu
< branch_table_sz
; lu
++) {
380 for (b
= branch_table
[lu
]; b
; b
= b
->table_next_branch
)
381 write_branch_report(rpt
, b
);
387 fputs("Annotated Tags\n", rpt
);
388 fputs("--------------\n", rpt
);
389 for (tg
= first_tag
; tg
; tg
= tg
->next_tag
) {
390 fputs(oid_to_hex(&tg
->oid
), rpt
);
392 fputs(tg
->name
, rpt
);
398 fputs("Marks\n", rpt
);
399 fputs("-----\n", rpt
);
400 if (export_marks_file
)
401 fprintf(rpt
, " exported to %s\n", export_marks_file
);
403 for_each_mark(marks
, 0, dump_marks_fn
, rpt
);
406 fputs("-------------------\n", rpt
);
407 fputs("END OF CRASH REPORT\n", rpt
);
412 static void end_packfile(void);
413 static void unkeep_all_packs(void);
414 static void dump_marks(void);
416 static NORETURN
void die_nicely(const char *err
, va_list params
)
420 report_fn die_message_fn
= get_die_message_routine();
423 die_message_fn(err
, params
);
426 char message
[2 * PATH_MAX
];
429 vsnprintf(message
, sizeof(message
), err
, cp
);
430 write_crash_report(message
);
438 #ifndef SIGUSR1 /* Windows, for example */
440 static void set_checkpoint_signal(void)
/*
 * Handler that set_checkpoint_signal() installs for SIGUSR1.  It does
 * nothing except record the request by setting checkpoint_requested;
 * the signal number argument is not used.
 */
446 static void checkpoint_signal(int signo UNUSED
)
448 checkpoint_requested
= 1;
451 static void set_checkpoint_signal(void)
455 memset(&sa
, 0, sizeof(sa
));
456 sa
.sa_handler
= checkpoint_signal
;
457 sigemptyset(&sa
.sa_mask
);
458 sa
.sa_flags
= SA_RESTART
;
459 sigaction(SIGUSR1
, &sa
, NULL
);
464 static void alloc_objects(unsigned int cnt
)
466 struct object_entry_pool
*b
;
468 b
= xmalloc(sizeof(struct object_entry_pool
)
469 + cnt
* sizeof(struct object_entry
));
470 b
->next_pool
= blocks
;
471 b
->next_free
= b
->entries
;
472 b
->end
= b
->entries
+ cnt
;
477 static struct object_entry
*new_object(struct object_id
*oid
)
479 struct object_entry
*e
;
481 if (blocks
->next_free
== blocks
->end
)
482 alloc_objects(object_entry_alloc
);
484 e
= blocks
->next_free
++;
485 oidcpy(&e
->idx
.oid
, oid
);
489 static struct object_entry
*find_object(struct object_id
*oid
)
491 return hashmap_get_entry_from_hash(&object_table
, oidhash(oid
), oid
,
492 struct object_entry
, ent
);
495 static struct object_entry
*insert_object(struct object_id
*oid
)
497 struct object_entry
*e
;
498 unsigned int hash
= oidhash(oid
);
500 e
= hashmap_get_entry_from_hash(&object_table
, hash
, oid
,
501 struct object_entry
, ent
);
505 hashmap_entry_init(&e
->ent
, hash
);
506 hashmap_add(&object_table
, &e
->ent
);
512 static void invalidate_pack_id(unsigned int id
)
516 struct hashmap_iter iter
;
517 struct object_entry
*e
;
519 hashmap_for_each_entry(&object_table
, &iter
, e
, ent
) {
520 if (e
->pack_id
== id
)
521 e
->pack_id
= MAX_PACK_ID
;
524 for (lu
= 0; lu
< branch_table_sz
; lu
++) {
527 for (b
= branch_table
[lu
]; b
; b
= b
->table_next_branch
)
528 if (b
->pack_id
== id
)
529 b
->pack_id
= MAX_PACK_ID
;
532 for (t
= first_tag
; t
; t
= t
->next_tag
)
533 if (t
->pack_id
== id
)
534 t
->pack_id
= MAX_PACK_ID
;
537 static unsigned int hc_str(const char *s
, size_t len
)
545 static void insert_mark(struct mark_set
**top
, uintmax_t idnum
, struct object_entry
*oe
)
547 struct mark_set
*s
= *top
;
549 while ((idnum
>> s
->shift
) >= 1024) {
550 s
= mem_pool_calloc(&fi_mem_pool
, 1, sizeof(struct mark_set
));
551 s
->shift
= (*top
)->shift
+ 10;
552 s
->data
.sets
[0] = *top
;
556 uintmax_t i
= idnum
>> s
->shift
;
557 idnum
-= i
<< s
->shift
;
558 if (!s
->data
.sets
[i
]) {
559 s
->data
.sets
[i
] = mem_pool_calloc(&fi_mem_pool
, 1, sizeof(struct mark_set
));
560 s
->data
.sets
[i
]->shift
= s
->shift
- 10;
564 if (!s
->data
.marked
[idnum
])
566 s
->data
.marked
[idnum
] = oe
;
569 static void *find_mark(struct mark_set
*s
, uintmax_t idnum
)
571 uintmax_t orig_idnum
= idnum
;
572 struct object_entry
*oe
= NULL
;
573 if ((idnum
>> s
->shift
) < 1024) {
574 while (s
&& s
->shift
) {
575 uintmax_t i
= idnum
>> s
->shift
;
576 idnum
-= i
<< s
->shift
;
580 oe
= s
->data
.marked
[idnum
];
583 die("mark :%" PRIuMAX
" not declared", orig_idnum
);
587 static struct atom_str
*to_atom(const char *s
, unsigned short len
)
589 unsigned int hc
= hc_str(s
, len
) % atom_table_sz
;
592 for (c
= atom_table
[hc
]; c
; c
= c
->next_atom
)
593 if (c
->str_len
== len
&& !strncmp(s
, c
->str_dat
, len
))
596 c
= mem_pool_alloc(&fi_mem_pool
, sizeof(struct atom_str
) + len
+ 1);
598 memcpy(c
->str_dat
, s
, len
);
600 c
->next_atom
= atom_table
[hc
];
606 static struct branch
*lookup_branch(const char *name
)
608 unsigned int hc
= hc_str(name
, strlen(name
)) % branch_table_sz
;
611 for (b
= branch_table
[hc
]; b
; b
= b
->table_next_branch
)
612 if (!strcmp(name
, b
->name
))
617 static struct branch
*new_branch(const char *name
)
619 unsigned int hc
= hc_str(name
, strlen(name
)) % branch_table_sz
;
620 struct branch
*b
= lookup_branch(name
);
623 die("Invalid attempt to create duplicate branch: %s", name
);
624 if (check_refname_format(name
, REFNAME_ALLOW_ONELEVEL
))
625 die("Branch name doesn't conform to GIT standards: %s", name
);
627 b
= mem_pool_calloc(&fi_mem_pool
, 1, sizeof(struct branch
));
628 b
->name
= mem_pool_strdup(&fi_mem_pool
, name
);
629 b
->table_next_branch
= branch_table
[hc
];
630 b
->branch_tree
.versions
[0].mode
= S_IFDIR
;
631 b
->branch_tree
.versions
[1].mode
= S_IFDIR
;
634 b
->pack_id
= MAX_PACK_ID
;
635 branch_table
[hc
] = b
;
640 static unsigned int hc_entries(unsigned int cnt
)
642 cnt
= cnt
& 7 ? (cnt
/ 8) + 1 : cnt
/ 8;
643 return cnt
< avail_tree_table_sz
? cnt
: avail_tree_table_sz
- 1;
646 static struct tree_content
*new_tree_content(unsigned int cnt
)
648 struct avail_tree_content
*f
, *l
= NULL
;
649 struct tree_content
*t
;
650 unsigned int hc
= hc_entries(cnt
);
652 for (f
= avail_tree_table
[hc
]; f
; l
= f
, f
= f
->next_avail
)
653 if (f
->entry_capacity
>= cnt
)
658 l
->next_avail
= f
->next_avail
;
660 avail_tree_table
[hc
] = f
->next_avail
;
662 cnt
= cnt
& 7 ? ((cnt
/ 8) + 1) * 8 : cnt
;
663 f
= mem_pool_alloc(&fi_mem_pool
, sizeof(*t
) + sizeof(t
->entries
[0]) * cnt
);
664 f
->entry_capacity
= cnt
;
667 t
= (struct tree_content
*)f
;
673 static void release_tree_entry(struct tree_entry
*e
);
674 static void release_tree_content(struct tree_content
*t
)
676 struct avail_tree_content
*f
= (struct avail_tree_content
*)t
;
677 unsigned int hc
= hc_entries(f
->entry_capacity
);
678 f
->next_avail
= avail_tree_table
[hc
];
679 avail_tree_table
[hc
] = f
;
682 static void release_tree_content_recursive(struct tree_content
*t
)
685 for (i
= 0; i
< t
->entry_count
; i
++)
686 release_tree_entry(t
->entries
[i
]);
687 release_tree_content(t
);
690 static struct tree_content
*grow_tree_content(
691 struct tree_content
*t
,
694 struct tree_content
*r
= new_tree_content(t
->entry_count
+ amt
);
695 r
->entry_count
= t
->entry_count
;
696 r
->delta_depth
= t
->delta_depth
;
697 COPY_ARRAY(r
->entries
, t
->entries
, t
->entry_count
);
698 release_tree_content(t
);
702 static struct tree_entry
*new_tree_entry(void)
704 struct tree_entry
*e
;
706 if (!avail_tree_entry
) {
707 unsigned int n
= tree_entry_alloc
;
708 tree_entry_allocd
+= n
* sizeof(struct tree_entry
);
710 avail_tree_entry
= e
;
712 *((void**)e
) = e
+ 1;
718 e
= avail_tree_entry
;
719 avail_tree_entry
= *((void**)e
);
723 static void release_tree_entry(struct tree_entry
*e
)
726 release_tree_content_recursive(e
->tree
);
727 *((void**)e
) = avail_tree_entry
;
728 avail_tree_entry
= e
;
731 static struct tree_content
*dup_tree_content(struct tree_content
*s
)
733 struct tree_content
*d
;
734 struct tree_entry
*a
, *b
;
739 d
= new_tree_content(s
->entry_count
);
740 for (i
= 0; i
< s
->entry_count
; i
++) {
742 b
= new_tree_entry();
743 memcpy(b
, a
, sizeof(*a
));
744 if (a
->tree
&& is_null_oid(&b
->versions
[1].oid
))
745 b
->tree
= dup_tree_content(a
->tree
);
750 d
->entry_count
= s
->entry_count
;
751 d
->delta_depth
= s
->delta_depth
;
756 static void start_packfile(void)
758 struct strbuf tmp_file
= STRBUF_INIT
;
759 struct packed_git
*p
;
762 pack_fd
= odb_mkstemp(&tmp_file
, "pack/tmp_pack_XXXXXX");
763 FLEX_ALLOC_STR(p
, pack_name
, tmp_file
.buf
);
764 strbuf_release(&tmp_file
);
766 p
->pack_fd
= pack_fd
;
768 pack_file
= hashfd(pack_fd
, p
->pack_name
);
771 pack_size
= write_pack_header(pack_file
, 0);
774 REALLOC_ARRAY(all_packs
, pack_id
+ 1);
775 all_packs
[pack_id
] = p
;
778 static const char *create_index(void)
781 struct pack_idx_entry
**idx
, **c
, **last
;
782 struct object_entry
*e
;
783 struct object_entry_pool
*o
;
785 /* Build the table of object IDs. */
786 ALLOC_ARRAY(idx
, object_count
);
788 for (o
= blocks
; o
; o
= o
->next_pool
)
789 for (e
= o
->next_free
; e
-- != o
->entries
;)
790 if (pack_id
== e
->pack_id
)
792 last
= idx
+ object_count
;
794 die("internal consistency error creating the index");
796 tmpfile
= write_idx_file(NULL
, idx
, object_count
, &pack_idx_opts
,
802 static char *keep_pack(const char *curr_index_name
)
804 static const char *keep_msg
= "fast-import";
805 struct strbuf name
= STRBUF_INIT
;
808 odb_pack_name(&name
, pack_data
->hash
, "keep");
809 keep_fd
= odb_pack_keep(name
.buf
);
811 die_errno("cannot create keep file");
812 write_or_die(keep_fd
, keep_msg
, strlen(keep_msg
));
814 die_errno("failed to write keep file");
816 odb_pack_name(&name
, pack_data
->hash
, "pack");
817 if (finalize_object_file(pack_data
->pack_name
, name
.buf
))
818 die("cannot store pack file");
820 odb_pack_name(&name
, pack_data
->hash
, "idx");
821 if (finalize_object_file(curr_index_name
, name
.buf
))
822 die("cannot store index file");
823 free((void *)curr_index_name
);
824 return strbuf_detach(&name
, NULL
);
827 static void unkeep_all_packs(void)
829 struct strbuf name
= STRBUF_INIT
;
832 for (k
= 0; k
< pack_id
; k
++) {
833 struct packed_git
*p
= all_packs
[k
];
834 odb_pack_name(&name
, p
->hash
, "keep");
835 unlink_or_warn(name
.buf
);
837 strbuf_release(&name
);
840 static int loosen_small_pack(const struct packed_git
*p
)
842 struct child_process unpack
= CHILD_PROCESS_INIT
;
844 if (lseek(p
->pack_fd
, 0, SEEK_SET
) < 0)
845 die_errno("Failed seeking to start of '%s'", p
->pack_name
);
847 unpack
.in
= p
->pack_fd
;
849 unpack
.stdout_to_stderr
= 1;
850 strvec_push(&unpack
.args
, "unpack-objects");
852 strvec_push(&unpack
.args
, "-q");
854 return run_command(&unpack
);
857 static void end_packfile(void)
861 if (running
|| !pack_data
)
865 clear_delta_base_cache();
867 struct packed_git
*new_p
;
868 struct object_id cur_pack_oid
;
874 close_pack_windows(pack_data
);
875 finalize_hashfile(pack_file
, cur_pack_oid
.hash
, FSYNC_COMPONENT_PACK
, 0);
876 fixup_pack_header_footer(pack_data
->pack_fd
, pack_data
->hash
,
877 pack_data
->pack_name
, object_count
,
878 cur_pack_oid
.hash
, pack_size
);
880 if (object_count
<= unpack_limit
) {
881 if (!loosen_small_pack(pack_data
)) {
882 invalidate_pack_id(pack_id
);
887 close(pack_data
->pack_fd
);
888 idx_name
= keep_pack(create_index());
890 /* Register the packfile with core git's machinery. */
891 new_p
= add_packed_git(idx_name
, strlen(idx_name
), 1);
893 die("core git rejected index %s", idx_name
);
894 all_packs
[pack_id
] = new_p
;
895 install_packed_git(the_repository
, new_p
);
898 /* Print the boundary */
900 fprintf(pack_edges
, "%s:", new_p
->pack_name
);
901 for (i
= 0; i
< branch_table_sz
; i
++) {
902 for (b
= branch_table
[i
]; b
; b
= b
->table_next_branch
) {
903 if (b
->pack_id
== pack_id
)
904 fprintf(pack_edges
, " %s",
905 oid_to_hex(&b
->oid
));
908 for (t
= first_tag
; t
; t
= t
->next_tag
) {
909 if (t
->pack_id
== pack_id
)
910 fprintf(pack_edges
, " %s",
911 oid_to_hex(&t
->oid
));
913 fputc('\n', pack_edges
);
921 close(pack_data
->pack_fd
);
922 unlink_or_warn(pack_data
->pack_name
);
924 FREE_AND_NULL(pack_data
);
927 /* We can't carry a delta across packfiles. */
928 strbuf_release(&last_blob
.data
);
929 last_blob
.offset
= 0;
933 static void cycle_packfile(void)
939 static int store_object(
940 enum object_type type
,
942 struct last_object
*last
,
943 struct object_id
*oidout
,
947 struct object_entry
*e
;
948 unsigned char hdr
[96];
949 struct object_id oid
;
950 unsigned long hdrlen
, deltalen
;
954 hdrlen
= format_object_header((char *)hdr
, sizeof(hdr
), type
,
956 the_hash_algo
->init_fn(&c
);
957 the_hash_algo
->update_fn(&c
, hdr
, hdrlen
);
958 the_hash_algo
->update_fn(&c
, dat
->buf
, dat
->len
);
959 the_hash_algo
->final_oid_fn(&oid
, &c
);
961 oidcpy(oidout
, &oid
);
963 e
= insert_object(&oid
);
965 insert_mark(&marks
, mark
, e
);
967 duplicate_count_by_type
[type
]++;
969 } else if (find_sha1_pack(oid
.hash
,
970 get_all_packs(the_repository
))) {
972 e
->pack_id
= MAX_PACK_ID
;
973 e
->idx
.offset
= 1; /* just not zero! */
974 duplicate_count_by_type
[type
]++;
978 if (last
&& last
->data
.len
&& last
->data
.buf
&& last
->depth
< max_depth
979 && dat
->len
> the_hash_algo
->rawsz
) {
981 delta_count_attempts_by_type
[type
]++;
982 delta
= diff_delta(last
->data
.buf
, last
->data
.len
,
984 &deltalen
, dat
->len
- the_hash_algo
->rawsz
);
988 git_deflate_init(&s
, pack_compression_level
);
991 s
.avail_in
= deltalen
;
993 s
.next_in
= (void *)dat
->buf
;
994 s
.avail_in
= dat
->len
;
996 s
.avail_out
= git_deflate_bound(&s
, s
.avail_in
);
997 s
.next_out
= out
= xmalloc(s
.avail_out
);
998 while (git_deflate(&s
, Z_FINISH
) == Z_OK
)
1000 git_deflate_end(&s
);
1002 /* Determine if we should auto-checkpoint. */
1004 && (pack_size
+ PACK_SIZE_THRESHOLD
+ s
.total_out
) > max_packsize
)
1005 || (pack_size
+ PACK_SIZE_THRESHOLD
+ s
.total_out
) < pack_size
) {
1007 /* This new object needs to *not* have the current pack_id. */
1008 e
->pack_id
= pack_id
+ 1;
1011 /* We cannot carry a delta into the new pack. */
1013 FREE_AND_NULL(delta
);
1015 git_deflate_init(&s
, pack_compression_level
);
1016 s
.next_in
= (void *)dat
->buf
;
1017 s
.avail_in
= dat
->len
;
1018 s
.avail_out
= git_deflate_bound(&s
, s
.avail_in
);
1019 s
.next_out
= out
= xrealloc(out
, s
.avail_out
);
1020 while (git_deflate(&s
, Z_FINISH
) == Z_OK
)
1022 git_deflate_end(&s
);
1027 e
->pack_id
= pack_id
;
1028 e
->idx
.offset
= pack_size
;
1030 object_count_by_type
[type
]++;
1032 crc32_begin(pack_file
);
1035 off_t ofs
= e
->idx
.offset
- last
->offset
;
1036 unsigned pos
= sizeof(hdr
) - 1;
1038 delta_count_by_type
[type
]++;
1039 e
->depth
= last
->depth
+ 1;
1041 hdrlen
= encode_in_pack_object_header(hdr
, sizeof(hdr
),
1042 OBJ_OFS_DELTA
, deltalen
);
1043 hashwrite(pack_file
, hdr
, hdrlen
);
1044 pack_size
+= hdrlen
;
1046 hdr
[pos
] = ofs
& 127;
1048 hdr
[--pos
] = 128 | (--ofs
& 127);
1049 hashwrite(pack_file
, hdr
+ pos
, sizeof(hdr
) - pos
);
1050 pack_size
+= sizeof(hdr
) - pos
;
1053 hdrlen
= encode_in_pack_object_header(hdr
, sizeof(hdr
),
1055 hashwrite(pack_file
, hdr
, hdrlen
);
1056 pack_size
+= hdrlen
;
1059 hashwrite(pack_file
, out
, s
.total_out
);
1060 pack_size
+= s
.total_out
;
1062 e
->idx
.crc32
= crc32_end(pack_file
);
1067 if (last
->no_swap
) {
1070 strbuf_swap(&last
->data
, dat
);
1072 last
->offset
= e
->idx
.offset
;
1073 last
->depth
= e
->depth
;
1078 static void truncate_pack(struct hashfile_checkpoint
*checkpoint
)
1080 if (hashfile_truncate(pack_file
, checkpoint
))
1081 die_errno("cannot truncate pack to skip duplicate");
1082 pack_size
= checkpoint
->offset
;
1085 static void stream_blob(uintmax_t len
, struct object_id
*oidout
, uintmax_t mark
)
1087 size_t in_sz
= 64 * 1024, out_sz
= 64 * 1024;
1088 unsigned char *in_buf
= xmalloc(in_sz
);
1089 unsigned char *out_buf
= xmalloc(out_sz
);
1090 struct object_entry
*e
;
1091 struct object_id oid
;
1092 unsigned long hdrlen
;
1096 struct hashfile_checkpoint checkpoint
;
1099 /* Determine if we should auto-checkpoint. */
1101 && (pack_size
+ PACK_SIZE_THRESHOLD
+ len
) > max_packsize
)
1102 || (pack_size
+ PACK_SIZE_THRESHOLD
+ len
) < pack_size
)
1105 the_hash_algo
->init_fn(&checkpoint
.ctx
);
1106 hashfile_checkpoint(pack_file
, &checkpoint
);
1107 offset
= checkpoint
.offset
;
1109 hdrlen
= format_object_header((char *)out_buf
, out_sz
, OBJ_BLOB
, len
);
1111 the_hash_algo
->init_fn(&c
);
1112 the_hash_algo
->update_fn(&c
, out_buf
, hdrlen
);
1114 crc32_begin(pack_file
);
1116 git_deflate_init(&s
, pack_compression_level
);
1118 hdrlen
= encode_in_pack_object_header(out_buf
, out_sz
, OBJ_BLOB
, len
);
1120 s
.next_out
= out_buf
+ hdrlen
;
1121 s
.avail_out
= out_sz
- hdrlen
;
1123 while (status
!= Z_STREAM_END
) {
1124 if (0 < len
&& !s
.avail_in
) {
1125 size_t cnt
= in_sz
< len
? in_sz
: (size_t)len
;
1126 size_t n
= fread(in_buf
, 1, cnt
, stdin
);
1127 if (!n
&& feof(stdin
))
1128 die("EOF in data (%" PRIuMAX
" bytes remaining)", len
);
1130 the_hash_algo
->update_fn(&c
, in_buf
, n
);
1136 status
= git_deflate(&s
, len
? 0 : Z_FINISH
);
1138 if (!s
.avail_out
|| status
== Z_STREAM_END
) {
1139 size_t n
= s
.next_out
- out_buf
;
1140 hashwrite(pack_file
, out_buf
, n
);
1142 s
.next_out
= out_buf
;
1143 s
.avail_out
= out_sz
;
1152 die("unexpected deflate failure: %d", status
);
1155 git_deflate_end(&s
);
1156 the_hash_algo
->final_oid_fn(&oid
, &c
);
1159 oidcpy(oidout
, &oid
);
1161 e
= insert_object(&oid
);
1164 insert_mark(&marks
, mark
, e
);
1166 if (e
->idx
.offset
) {
1167 duplicate_count_by_type
[OBJ_BLOB
]++;
1168 truncate_pack(&checkpoint
);
1170 } else if (find_sha1_pack(oid
.hash
,
1171 get_all_packs(the_repository
))) {
1173 e
->pack_id
= MAX_PACK_ID
;
1174 e
->idx
.offset
= 1; /* just not zero! */
1175 duplicate_count_by_type
[OBJ_BLOB
]++;
1176 truncate_pack(&checkpoint
);
1181 e
->pack_id
= pack_id
;
1182 e
->idx
.offset
= offset
;
1183 e
->idx
.crc32
= crc32_end(pack_file
);
1185 object_count_by_type
[OBJ_BLOB
]++;
1192 /* All calls must be guarded by find_object() or find_mark() to
1193 * ensure the 'struct object_entry' passed was written by this
1194 * process instance. We unpack the entry by the offset, avoiding
1195 * the need for the corresponding .idx file. This unpacking rule
1196 * works because we only use OBJ_OFS_DELTA within the packfiles
1197 * created by fast-import.
1199 * oe must not be NULL. Such an oe usually comes from giving
1200 * an unknown SHA-1 to find_object() or an undefined mark to
1201 * find_mark(). Callers must test for this condition and use
1202 * the standard read_sha1_file() when it happens.
1204 * oe->pack_id must not be MAX_PACK_ID. Such an oe is usually from
1205 * find_mark(), where the mark was reloaded from an existing marks
1206 * file and is referencing an object that this fast-import process
1207 * instance did not write out to a packfile. Callers must test for
1208 * this condition and use read_sha1_file() instead.
1210 static void *gfi_unpack_entry(
1211 struct object_entry
*oe
,
1212 unsigned long *sizep
)
1214 enum object_type type
;
1215 struct packed_git
*p
= all_packs
[oe
->pack_id
];
1216 if (p
== pack_data
&& p
->pack_size
< (pack_size
+ the_hash_algo
->rawsz
)) {
1217 /* The object is stored in the packfile we are writing to
1218 * and we have modified it since the last time we scanned
1219 * back to read a previously written object. If an old
1220 * window covered [p->pack_size, p->pack_size + rawsz) its
1221 * data is stale and is not valid. Closing all windows
1222 * and updating the packfile length ensures we can read
1223 * the newly written data.
1225 close_pack_windows(p
);
1226 hashflush(pack_file
);
1228 /* We have to offer rawsz bytes additional on the end of
1229 * the packfile as the core unpacker code assumes the
1230 * footer is present at the file end and must promise
1231 * at least rawsz bytes within any window it maps. But
1232 * we don't actually create the footer here.
1234 p
->pack_size
= pack_size
+ the_hash_algo
->rawsz
;
1236 return unpack_entry(the_repository
, p
, oe
->idx
.offset
, &type
, sizep
);
1239 static void load_tree(struct tree_entry
*root
)
1241 struct object_id
*oid
= &root
->versions
[1].oid
;
1242 struct object_entry
*myoe
;
1243 struct tree_content
*t
;
1248 root
->tree
= t
= new_tree_content(8);
1249 if (is_null_oid(oid
))
1252 myoe
= find_object(oid
);
1253 if (myoe
&& myoe
->pack_id
!= MAX_PACK_ID
) {
1254 if (myoe
->type
!= OBJ_TREE
)
1255 die("Not a tree: %s", oid_to_hex(oid
));
1256 t
->delta_depth
= myoe
->depth
;
1257 buf
= gfi_unpack_entry(myoe
, &size
);
1259 die("Can't load tree %s", oid_to_hex(oid
));
1261 enum object_type type
;
1262 buf
= repo_read_object_file(the_repository
, oid
, &type
, &size
);
1263 if (!buf
|| type
!= OBJ_TREE
)
1264 die("Can't load tree %s", oid_to_hex(oid
));
1268 while (c
!= (buf
+ size
)) {
1269 struct tree_entry
*e
= new_tree_entry();
1271 if (t
->entry_count
== t
->entry_capacity
)
1272 root
->tree
= t
= grow_tree_content(t
, t
->entry_count
);
1273 t
->entries
[t
->entry_count
++] = e
;
1276 c
= parse_mode(c
, &e
->versions
[1].mode
);
1278 die("Corrupt mode in %s", oid_to_hex(oid
));
1279 e
->versions
[0].mode
= e
->versions
[1].mode
;
1280 e
->name
= to_atom(c
, strlen(c
));
1281 c
+= e
->name
->str_len
+ 1;
1282 oidread(&e
->versions
[0].oid
, (unsigned char *)c
,
1283 the_repository
->hash_algo
);
1284 oidread(&e
->versions
[1].oid
, (unsigned char *)c
,
1285 the_repository
->hash_algo
);
1286 c
+= the_hash_algo
->rawsz
;
1291 static int tecmp0 (const void *_a
, const void *_b
)
1293 struct tree_entry
*a
= *((struct tree_entry
**)_a
);
1294 struct tree_entry
*b
= *((struct tree_entry
**)_b
);
1295 return base_name_compare(
1296 a
->name
->str_dat
, a
->name
->str_len
, a
->versions
[0].mode
,
1297 b
->name
->str_dat
, b
->name
->str_len
, b
->versions
[0].mode
);
1300 static int tecmp1 (const void *_a
, const void *_b
)
1302 struct tree_entry
*a
= *((struct tree_entry
**)_a
);
1303 struct tree_entry
*b
= *((struct tree_entry
**)_b
);
1304 return base_name_compare(
1305 a
->name
->str_dat
, a
->name
->str_len
, a
->versions
[1].mode
,
1306 b
->name
->str_dat
, b
->name
->str_len
, b
->versions
[1].mode
);
1309 static void mktree(struct tree_content
*t
, int v
, struct strbuf
*b
)
1315 QSORT(t
->entries
, t
->entry_count
, tecmp0
);
1317 QSORT(t
->entries
, t
->entry_count
, tecmp1
);
1319 for (i
= 0; i
< t
->entry_count
; i
++) {
1320 if (t
->entries
[i
]->versions
[v
].mode
)
1321 maxlen
+= t
->entries
[i
]->name
->str_len
+ 34;
1325 strbuf_grow(b
, maxlen
);
1326 for (i
= 0; i
< t
->entry_count
; i
++) {
1327 struct tree_entry
*e
= t
->entries
[i
];
1328 if (!e
->versions
[v
].mode
)
1330 strbuf_addf(b
, "%o %s%c",
1331 (unsigned int)(e
->versions
[v
].mode
& ~NO_DELTA
),
1332 e
->name
->str_dat
, '\0');
1333 strbuf_add(b
, e
->versions
[v
].oid
.hash
, the_hash_algo
->rawsz
);
1337 static void store_tree(struct tree_entry
*root
)
1339 struct tree_content
*t
;
1340 unsigned int i
, j
, del
;
1341 struct last_object lo
= { STRBUF_INIT
, 0, 0, /* no_swap */ 1 };
1342 struct object_entry
*le
= NULL
;
1344 if (!is_null_oid(&root
->versions
[1].oid
))
1351 for (i
= 0; i
< t
->entry_count
; i
++) {
1352 if (t
->entries
[i
]->tree
)
1353 store_tree(t
->entries
[i
]);
1356 if (!(root
->versions
[0].mode
& NO_DELTA
))
1357 le
= find_object(&root
->versions
[0].oid
);
1358 if (S_ISDIR(root
->versions
[0].mode
) && le
&& le
->pack_id
== pack_id
) {
1359 mktree(t
, 0, &old_tree
);
1361 lo
.offset
= le
->idx
.offset
;
1362 lo
.depth
= t
->delta_depth
;
1365 mktree(t
, 1, &new_tree
);
1366 store_object(OBJ_TREE
, &new_tree
, &lo
, &root
->versions
[1].oid
, 0);
1368 t
->delta_depth
= lo
.depth
;
1369 for (i
= 0, j
= 0, del
= 0; i
< t
->entry_count
; i
++) {
1370 struct tree_entry
*e
= t
->entries
[i
];
1371 if (e
->versions
[1].mode
) {
1372 e
->versions
[0].mode
= e
->versions
[1].mode
;
1373 oidcpy(&e
->versions
[0].oid
, &e
->versions
[1].oid
);
1374 t
->entries
[j
++] = e
;
1376 release_tree_entry(e
);
1380 t
->entry_count
-= del
;
1383 static void tree_content_replace(
1384 struct tree_entry
*root
,
1385 const struct object_id
*oid
,
1386 const uint16_t mode
,
1387 struct tree_content
*newtree
)
1390 die("Root cannot be a non-directory");
1391 oidclr(&root
->versions
[0].oid
, the_repository
->hash_algo
);
1392 oidcpy(&root
->versions
[1].oid
, oid
);
1394 release_tree_content_recursive(root
->tree
);
1395 root
->tree
= newtree
;
1398 static int tree_content_set(
1399 struct tree_entry
*root
,
1401 const struct object_id
*oid
,
1402 const uint16_t mode
,
1403 struct tree_content
*subtree
)
1405 struct tree_content
*t
;
1408 struct tree_entry
*e
;
1410 slash1
= strchrnul(p
, '/');
1413 die("Empty path component found in input");
1414 if (!*slash1
&& !S_ISDIR(mode
) && subtree
)
1415 die("Non-directories cannot have subtrees");
1420 for (i
= 0; i
< t
->entry_count
; i
++) {
1422 if (e
->name
->str_len
== n
&& !fspathncmp(p
, e
->name
->str_dat
, n
)) {
1425 && e
->versions
[1].mode
== mode
1426 && oideq(&e
->versions
[1].oid
, oid
))
1428 e
->versions
[1].mode
= mode
;
1429 oidcpy(&e
->versions
[1].oid
, oid
);
1431 release_tree_content_recursive(e
->tree
);
1435 * We need to leave e->versions[0].oid alone
1436 * to avoid modifying the preimage tree used
1437 * when writing out the parent directory.
1438 * But after replacing the subdir with a
1439 * completely different one, it's not a good
1440 * delta base any more, and besides, we've
1441 * thrown away the tree entries needed to
1442 * make a delta against it.
1444 * So let's just explicitly disable deltas
1447 if (S_ISDIR(e
->versions
[0].mode
))
1448 e
->versions
[0].mode
|= NO_DELTA
;
1450 oidclr(&root
->versions
[1].oid
, the_repository
->hash_algo
);
1453 if (!S_ISDIR(e
->versions
[1].mode
)) {
1454 e
->tree
= new_tree_content(8);
1455 e
->versions
[1].mode
= S_IFDIR
;
1459 if (tree_content_set(e
, slash1
+ 1, oid
, mode
, subtree
)) {
1460 oidclr(&root
->versions
[1].oid
, the_repository
->hash_algo
);
1467 if (t
->entry_count
== t
->entry_capacity
)
1468 root
->tree
= t
= grow_tree_content(t
, t
->entry_count
);
1469 e
= new_tree_entry();
1470 e
->name
= to_atom(p
, n
);
1471 e
->versions
[0].mode
= 0;
1472 oidclr(&e
->versions
[0].oid
, the_repository
->hash_algo
);
1473 t
->entries
[t
->entry_count
++] = e
;
1475 e
->tree
= new_tree_content(8);
1476 e
->versions
[1].mode
= S_IFDIR
;
1477 tree_content_set(e
, slash1
+ 1, oid
, mode
, subtree
);
1480 e
->versions
[1].mode
= mode
;
1481 oidcpy(&e
->versions
[1].oid
, oid
);
1483 oidclr(&root
->versions
[1].oid
, the_repository
->hash_algo
);
1487 static int tree_content_remove(
1488 struct tree_entry
*root
,
1490 struct tree_entry
*backup_leaf
,
1493 struct tree_content
*t
;
1496 struct tree_entry
*e
;
1498 slash1
= strchrnul(p
, '/');
1504 if (!*p
&& allow_root
) {
1510 for (i
= 0; i
< t
->entry_count
; i
++) {
1512 if (e
->name
->str_len
== n
&& !fspathncmp(p
, e
->name
->str_dat
, n
)) {
1513 if (*slash1
&& !S_ISDIR(e
->versions
[1].mode
))
1515 * If p names a file in some subdirectory, and a
1516 * file or symlink matching the name of the
1517 * parent directory of p exists, then p cannot
1518 * exist and need not be deleted.
1521 if (!*slash1
|| !S_ISDIR(e
->versions
[1].mode
))
1525 if (tree_content_remove(e
, slash1
+ 1, backup_leaf
, 0)) {
1526 for (n
= 0; n
< e
->tree
->entry_count
; n
++) {
1527 if (e
->tree
->entries
[n
]->versions
[1].mode
) {
1528 oidclr(&root
->versions
[1].oid
,
1529 the_repository
->hash_algo
);
1543 memcpy(backup_leaf
, e
, sizeof(*backup_leaf
));
1545 release_tree_content_recursive(e
->tree
);
1547 e
->versions
[1].mode
= 0;
1548 oidclr(&e
->versions
[1].oid
, the_repository
->hash_algo
);
1549 oidclr(&root
->versions
[1].oid
, the_repository
->hash_algo
);
1553 static int tree_content_get(
1554 struct tree_entry
*root
,
1556 struct tree_entry
*leaf
,
1559 struct tree_content
*t
;
1562 struct tree_entry
*e
;
1564 slash1
= strchrnul(p
, '/');
1566 if (!n
&& !allow_root
)
1567 die("Empty path component found in input");
1578 for (i
= 0; i
< t
->entry_count
; i
++) {
1580 if (e
->name
->str_len
== n
&& !fspathncmp(p
, e
->name
->str_dat
, n
)) {
1583 if (!S_ISDIR(e
->versions
[1].mode
))
1587 return tree_content_get(e
, slash1
+ 1, leaf
, 0);
1593 memcpy(leaf
, e
, sizeof(*leaf
));
1594 if (e
->tree
&& is_null_oid(&e
->versions
[1].oid
))
1595 leaf
->tree
= dup_tree_content(e
->tree
);
1601 static int update_branch(struct branch
*b
)
1603 static const char *msg
= "fast-import";
1604 struct ref_transaction
*transaction
;
1605 struct object_id old_oid
;
1606 struct strbuf err
= STRBUF_INIT
;
1608 if (is_null_oid(&b
->oid
)) {
1610 refs_delete_ref(get_main_ref_store(the_repository
),
1611 NULL
, b
->name
, NULL
, 0);
1614 if (refs_read_ref(get_main_ref_store(the_repository
), b
->name
, &old_oid
))
1615 oidclr(&old_oid
, the_repository
->hash_algo
);
1616 if (!force_update
&& !is_null_oid(&old_oid
)) {
1617 struct commit
*old_cmit
, *new_cmit
;
1620 old_cmit
= lookup_commit_reference_gently(the_repository
,
1622 new_cmit
= lookup_commit_reference_gently(the_repository
,
1624 if (!old_cmit
|| !new_cmit
)
1625 return error("Branch %s is missing commits.", b
->name
);
1627 ret
= repo_in_merge_bases(the_repository
, old_cmit
, new_cmit
);
1631 warning("Not updating %s"
1632 " (new tip %s does not contain %s)",
1633 b
->name
, oid_to_hex(&b
->oid
),
1634 oid_to_hex(&old_oid
));
1638 transaction
= ref_store_transaction_begin(get_main_ref_store(the_repository
),
1641 ref_transaction_update(transaction
, b
->name
, &b
->oid
, &old_oid
,
1642 NULL
, NULL
, 0, msg
, &err
) ||
1643 ref_transaction_commit(transaction
, &err
)) {
1644 ref_transaction_free(transaction
);
1645 error("%s", err
.buf
);
1646 strbuf_release(&err
);
1649 ref_transaction_free(transaction
);
1650 strbuf_release(&err
);
1654 static void dump_branches(void)
1659 for (i
= 0; i
< branch_table_sz
; i
++) {
1660 for (b
= branch_table
[i
]; b
; b
= b
->table_next_branch
)
1661 failure
|= update_branch(b
);
1665 static void dump_tags(void)
1667 static const char *msg
= "fast-import";
1669 struct strbuf ref_name
= STRBUF_INIT
;
1670 struct strbuf err
= STRBUF_INIT
;
1671 struct ref_transaction
*transaction
;
1673 transaction
= ref_store_transaction_begin(get_main_ref_store(the_repository
),
1676 failure
|= error("%s", err
.buf
);
1679 for (t
= first_tag
; t
; t
= t
->next_tag
) {
1680 strbuf_reset(&ref_name
);
1681 strbuf_addf(&ref_name
, "refs/tags/%s", t
->name
);
1683 if (ref_transaction_update(transaction
, ref_name
.buf
,
1684 &t
->oid
, NULL
, NULL
, NULL
,
1686 failure
|= error("%s", err
.buf
);
1690 if (ref_transaction_commit(transaction
, &err
))
1691 failure
|= error("%s", err
.buf
);
1694 ref_transaction_free(transaction
);
1695 strbuf_release(&ref_name
);
1696 strbuf_release(&err
);
1699 static void dump_marks(void)
1701 struct lock_file mark_lock
= LOCK_INIT
;
1704 if (!export_marks_file
|| (import_marks_file
&& !import_marks_file_done
))
1707 if (safe_create_leading_directories_const(export_marks_file
)) {
1708 failure
|= error_errno("unable to create leading directories of %s",
1713 if (hold_lock_file_for_update(&mark_lock
, export_marks_file
, 0) < 0) {
1714 failure
|= error_errno("Unable to write marks file %s",
1719 f
= fdopen_lock_file(&mark_lock
, "w");
1721 int saved_errno
= errno
;
1722 rollback_lock_file(&mark_lock
);
1723 failure
|= error("Unable to write marks file %s: %s",
1724 export_marks_file
, strerror(saved_errno
));
1728 for_each_mark(marks
, 0, dump_marks_fn
, f
);
1729 if (commit_lock_file(&mark_lock
)) {
1730 failure
|= error_errno("Unable to write file %s",
1736 static void insert_object_entry(struct mark_set
**s
, struct object_id
*oid
, uintmax_t mark
)
1738 struct object_entry
*e
;
1739 e
= find_object(oid
);
1741 enum object_type type
= oid_object_info(the_repository
,
1744 die("object not found: %s", oid_to_hex(oid
));
1745 e
= insert_object(oid
);
1747 e
->pack_id
= MAX_PACK_ID
;
1748 e
->idx
.offset
= 1; /* just not zero! */
1750 insert_mark(s
, mark
, e
);
1753 static void insert_oid_entry(struct mark_set
**s
, struct object_id
*oid
, uintmax_t mark
)
1755 insert_mark(s
, mark
, xmemdupz(oid
, sizeof(*oid
)));
1758 static void read_mark_file(struct mark_set
**s
, FILE *f
, mark_set_inserter_t inserter
)
1761 while (fgets(line
, sizeof(line
), f
)) {
1764 struct object_id oid
;
1766 /* Ensure SHA-1 objects are padded with zeros. */
1767 memset(oid
.hash
, 0, sizeof(oid
.hash
));
1769 end
= strchr(line
, '\n');
1770 if (line
[0] != ':' || !end
)
1771 die("corrupt mark line: %s", line
);
1773 mark
= strtoumax(line
+ 1, &end
, 10);
1774 if (!mark
|| end
== line
+ 1
1776 || get_oid_hex_any(end
+ 1, &oid
) == GIT_HASH_UNKNOWN
)
1777 die("corrupt mark line: %s", line
);
1778 inserter(s
, &oid
, mark
);
1782 static void read_marks(void)
1784 FILE *f
= fopen(import_marks_file
, "r");
1787 else if (import_marks_file_ignore_missing
&& errno
== ENOENT
)
1788 goto done
; /* Marks file does not exist */
1790 die_errno("cannot read '%s'", import_marks_file
);
1791 read_mark_file(&marks
, f
, insert_object_entry
);
1794 import_marks_file_done
= 1;
1798 static int read_next_command(void)
1800 static int stdin_eof
= 0;
1803 unread_command_buf
= 0;
1808 if (unread_command_buf
) {
1809 unread_command_buf
= 0;
1811 struct recent_command
*rc
;
1813 stdin_eof
= strbuf_getline_lf(&command_buf
, stdin
);
1817 if (!seen_data_command
1818 && !starts_with(command_buf
.buf
, "feature ")
1819 && !starts_with(command_buf
.buf
, "option ")) {
1828 cmd_hist
.next
= rc
->next
;
1829 cmd_hist
.next
->prev
= &cmd_hist
;
1833 rc
->buf
= xstrdup(command_buf
.buf
);
1834 rc
->prev
= cmd_tail
;
1835 rc
->next
= cmd_hist
.prev
;
1836 rc
->prev
->next
= rc
;
1839 if (command_buf
.buf
[0] == '#')
/*
 * Swallow a single newline from stdin if one is next.
 *
 * Reads one character; a newline is consumed, end-of-input is left
 * alone, and anything else is pushed back with ungetc() so the next
 * read sees it again.
 */
static void skip_optional_lf(void)
{
	int next = fgetc(stdin);

	if (next == '\n' || next == EOF)
		return;
	ungetc(next, stdin);
}
1852 static void parse_mark(void)
1855 if (skip_prefix(command_buf
.buf
, "mark :", &v
)) {
1856 next_mark
= strtoumax(v
, NULL
, 10);
1857 read_next_command();
1863 static void parse_original_identifier(void)
1866 if (skip_prefix(command_buf
.buf
, "original-oid ", &v
))
1867 read_next_command();
1870 static int parse_data(struct strbuf
*sb
, uintmax_t limit
, uintmax_t *len_res
)
1875 if (!skip_prefix(command_buf
.buf
, "data ", &data
))
1876 die("Expected 'data n' command, found: %s", command_buf
.buf
);
1878 if (skip_prefix(data
, "<<", &data
)) {
1879 char *term
= xstrdup(data
);
1880 size_t term_len
= command_buf
.len
- (data
- command_buf
.buf
);
1883 if (strbuf_getline_lf(&command_buf
, stdin
) == EOF
)
1884 die("EOF in data (terminator '%s' not found)", term
);
1885 if (term_len
== command_buf
.len
1886 && !strcmp(term
, command_buf
.buf
))
1888 strbuf_addbuf(sb
, &command_buf
);
1889 strbuf_addch(sb
, '\n');
1894 uintmax_t len
= strtoumax(data
, NULL
, 10);
1895 size_t n
= 0, length
= (size_t)len
;
1897 if (limit
&& limit
< len
) {
1902 die("data is too large to use in this context");
1904 while (n
< length
) {
1905 size_t s
= strbuf_fread(sb
, length
- n
, stdin
);
1906 if (!s
&& feof(stdin
))
1907 die("EOF in data (%lu bytes remaining)",
1908 (unsigned long)(length
- n
));
1917 static int validate_raw_date(const char *src
, struct strbuf
*result
, int strict
)
1919 const char *orig_src
= src
;
1925 num
= strtoul(src
, &endp
, 10);
1927 * NEEDSWORK: perhaps check for reasonable values? For example, we
1928 * could error on values representing times more than a
1929 * day in the future.
1931 if (errno
|| endp
== src
|| *endp
!= ' ')
1935 if (*src
!= '-' && *src
!= '+')
1938 num
= strtoul(src
+ 1, &endp
, 10);
1940 * NEEDSWORK: check for brokenness other than num > 1400, such as
1941 * (num % 100) >= 60, or ((num % 100) % 15) != 0 ?
1943 if (errno
|| endp
== src
+ 1 || *endp
|| /* did not parse */
1944 (strict
&& (1400 < num
)) /* parsed a broken timezone */
1948 strbuf_addstr(result
, orig_src
);
1952 static char *parse_ident(const char *buf
)
1956 struct strbuf ident
= STRBUF_INIT
;
1958 /* ensure there is a space delimiter even if there is no name */
1962 ltgt
= buf
+ strcspn(buf
, "<>");
1964 die("Missing < in ident string: %s", buf
);
1965 if (ltgt
!= buf
&& ltgt
[-1] != ' ')
1966 die("Missing space before < in ident string: %s", buf
);
1967 ltgt
= ltgt
+ 1 + strcspn(ltgt
+ 1, "<>");
1969 die("Missing > in ident string: %s", buf
);
1972 die("Missing space after > in ident string: %s", buf
);
1974 name_len
= ltgt
- buf
;
1975 strbuf_add(&ident
, buf
, name_len
);
1979 if (validate_raw_date(ltgt
, &ident
, 1) < 0)
1980 die("Invalid raw date \"%s\" in ident: %s", ltgt
, buf
);
1982 case WHENSPEC_RAW_PERMISSIVE
:
1983 if (validate_raw_date(ltgt
, &ident
, 0) < 0)
1984 die("Invalid raw date \"%s\" in ident: %s", ltgt
, buf
);
1986 case WHENSPEC_RFC2822
:
1987 if (parse_date(ltgt
, &ident
) < 0)
1988 die("Invalid rfc2822 date \"%s\" in ident: %s", ltgt
, buf
);
1991 if (strcmp("now", ltgt
))
1992 die("Date in ident must be 'now': %s", buf
);
1997 return strbuf_detach(&ident
, NULL
);
2000 static void parse_and_store_blob(
2001 struct last_object
*last
,
2002 struct object_id
*oidout
,
2005 static struct strbuf buf
= STRBUF_INIT
;
2008 if (parse_data(&buf
, big_file_threshold
, &len
))
2009 store_object(OBJ_BLOB
, &buf
, last
, oidout
, mark
);
2012 strbuf_release(&last
->data
);
2016 stream_blob(len
, oidout
, mark
);
2021 static void parse_new_blob(void)
2023 read_next_command();
2025 parse_original_identifier();
2026 parse_and_store_blob(&last_blob
, NULL
, next_mark
);
2029 static void unload_one_branch(void)
2031 while (cur_active_branches
2032 && cur_active_branches
>= max_active_branches
) {
2033 uintmax_t min_commit
= ULONG_MAX
;
2034 struct branch
*e
, *l
= NULL
, *p
= NULL
;
2036 for (e
= active_branches
; e
; e
= e
->active_next_branch
) {
2037 if (e
->last_commit
< min_commit
) {
2039 min_commit
= e
->last_commit
;
2045 e
= p
->active_next_branch
;
2046 p
->active_next_branch
= e
->active_next_branch
;
2048 e
= active_branches
;
2049 active_branches
= e
->active_next_branch
;
2052 e
->active_next_branch
= NULL
;
2053 if (e
->branch_tree
.tree
) {
2054 release_tree_content_recursive(e
->branch_tree
.tree
);
2055 e
->branch_tree
.tree
= NULL
;
2057 cur_active_branches
--;
2061 static void load_branch(struct branch
*b
)
2063 load_tree(&b
->branch_tree
);
2066 b
->active_next_branch
= active_branches
;
2067 active_branches
= b
;
2068 cur_active_branches
++;
2069 branch_load_count
++;
2073 static unsigned char convert_num_notes_to_fanout(uintmax_t num_notes
)
2075 unsigned char fanout
= 0;
2076 while ((num_notes
>>= 8))
2081 static void construct_path_with_fanout(const char *hex_sha1
,
2082 unsigned char fanout
, char *path
)
2084 unsigned int i
= 0, j
= 0;
2085 if (fanout
>= the_hash_algo
->rawsz
)
2086 die("Too large fanout (%u)", fanout
);
2088 path
[i
++] = hex_sha1
[j
++];
2089 path
[i
++] = hex_sha1
[j
++];
2093 memcpy(path
+ i
, hex_sha1
+ j
, the_hash_algo
->hexsz
- j
);
2094 path
[i
+ the_hash_algo
->hexsz
- j
] = '\0';
2097 static uintmax_t do_change_note_fanout(
2098 struct tree_entry
*orig_root
, struct tree_entry
*root
,
2099 char *hex_oid
, unsigned int hex_oid_len
,
2100 char *fullpath
, unsigned int fullpath_len
,
2101 unsigned char fanout
)
2103 struct tree_content
*t
;
2104 struct tree_entry
*e
, leaf
;
2105 unsigned int i
, tmp_hex_oid_len
, tmp_fullpath_len
;
2106 uintmax_t num_notes
= 0;
2107 struct object_id oid
;
2108 /* hex oid + '/' between each pair of hex digits + NUL */
2109 char realpath
[GIT_MAX_HEXSZ
+ ((GIT_MAX_HEXSZ
/ 2) - 1) + 1];
2110 const unsigned hexsz
= the_hash_algo
->hexsz
;
2116 for (i
= 0; t
&& i
< t
->entry_count
; i
++) {
2118 tmp_hex_oid_len
= hex_oid_len
+ e
->name
->str_len
;
2119 tmp_fullpath_len
= fullpath_len
;
2122 * We're interested in EITHER existing note entries (entries
2123 * with exactly hexsz hex chars in path, not including directory
2124 * separators), OR directory entries that may contain note
2125 * entries (with < hexsz hex chars in path).
2126 * Also, each path component in a note entry must be a multiple
2129 if (!e
->versions
[1].mode
||
2130 tmp_hex_oid_len
> hexsz
||
2131 e
->name
->str_len
% 2)
2134 /* This _may_ be a note entry, or a subdir containing notes */
2135 memcpy(hex_oid
+ hex_oid_len
, e
->name
->str_dat
,
2137 if (tmp_fullpath_len
)
2138 fullpath
[tmp_fullpath_len
++] = '/';
2139 memcpy(fullpath
+ tmp_fullpath_len
, e
->name
->str_dat
,
2141 tmp_fullpath_len
+= e
->name
->str_len
;
2142 fullpath
[tmp_fullpath_len
] = '\0';
2144 if (tmp_hex_oid_len
== hexsz
&& !get_oid_hex(hex_oid
, &oid
)) {
2145 /* This is a note entry */
2146 if (fanout
== 0xff) {
2147 /* Counting mode, no rename */
2151 construct_path_with_fanout(hex_oid
, fanout
, realpath
);
2152 if (!strcmp(fullpath
, realpath
)) {
2153 /* Note entry is in correct location */
2158 /* Rename fullpath to realpath */
2159 if (!tree_content_remove(orig_root
, fullpath
, &leaf
, 0))
2160 die("Failed to remove path %s", fullpath
);
2161 tree_content_set(orig_root
, realpath
,
2162 &leaf
.versions
[1].oid
,
2163 leaf
.versions
[1].mode
,
2165 } else if (S_ISDIR(e
->versions
[1].mode
)) {
2166 /* This is a subdir that may contain note entries */
2167 num_notes
+= do_change_note_fanout(orig_root
, e
,
2168 hex_oid
, tmp_hex_oid_len
,
2169 fullpath
, tmp_fullpath_len
, fanout
);
2172 /* The above may have reallocated the current tree_content */
2178 static uintmax_t change_note_fanout(struct tree_entry
*root
,
2179 unsigned char fanout
)
2182 * The size of path is due to one slash between every two hex digits,
2183 * plus the terminating NUL. Note that there is no slash at the end, so
2184 * the number of slashes is one less than half the number of hex
2187 char hex_oid
[GIT_MAX_HEXSZ
], path
[GIT_MAX_HEXSZ
+ (GIT_MAX_HEXSZ
/ 2) - 1 + 1];
2188 return do_change_note_fanout(root
, root
, hex_oid
, 0, path
, 0, fanout
);
2191 static int parse_mapped_oid_hex(const char *hex
, struct object_id
*oid
, const char **end
)
2196 /* Make SHA-1 object IDs have all-zero padding. */
2197 memset(oid
->hash
, 0, sizeof(oid
->hash
));
2199 algo
= parse_oid_hex_any(hex
, oid
, end
);
2200 if (algo
== GIT_HASH_UNKNOWN
)
2203 it
= kh_get_oid_map(sub_oid_map
, *oid
);
2204 /* No such object? */
2205 if (it
== kh_end(sub_oid_map
)) {
2206 /* If we're using the same algorithm, pass it through. */
2207 if (hash_algos
[algo
].format_id
== the_hash_algo
->format_id
)
2211 oidcpy(oid
, kh_value(sub_oid_map
, it
));
2216 * Given a pointer into a string, parse a mark reference:
2218 * idnum ::= ':' bigint;
2220 * Update *endptr to point to the first character after the value.
2222 * Complain if the following character is not what is expected,
2223 * either a space or end of the string.
2225 static uintmax_t parse_mark_ref(const char *p
, char **endptr
)
2231 mark
= strtoumax(p
, endptr
, 10);
2233 die("No value after ':' in mark: %s", command_buf
.buf
);
2238 * Parse the mark reference, and complain if this is not the end of
2241 static uintmax_t parse_mark_ref_eol(const char *p
)
2246 mark
= parse_mark_ref(p
, &end
);
2248 die("Garbage after mark: %s", command_buf
.buf
);
2253 * Parse the mark reference, demanding a trailing space. Update *p to
2254 * point to the first character after the space.
2256 static uintmax_t parse_mark_ref_space(const char **p
)
2261 mark
= parse_mark_ref(*p
, &end
);
2263 die("Missing space after mark: %s", command_buf
.buf
);
2269 * Parse the path string into the strbuf. The path can either be quoted with
2270 * escape sequences or unquoted without escape sequences. Unquoted strings may
2271 * contain spaces only if `is_last_field` is nonzero; otherwise, it stops
2272 * parsing at the first space.
2274 static void parse_path(struct strbuf
*sb
, const char *p
, const char **endp
,
2275 int is_last_field
, const char *field
)
2278 if (unquote_c_style(sb
, p
, endp
))
2279 die("Invalid %s: %s", field
, command_buf
.buf
);
2280 if (strlen(sb
->buf
) != sb
->len
)
2281 die("NUL in %s: %s", field
, command_buf
.buf
);
2284 * Unless we are parsing the last field of a line,
2285 * SP is the end of this field.
2287 *endp
= is_last_field
2289 : strchrnul(p
, ' ');
2290 strbuf_add(sb
, p
, *endp
- p
);
2295 * Parse the path string into the strbuf, and complain if this is not the end of
2296 * the string. Unquoted strings may contain spaces.
2298 static void parse_path_eol(struct strbuf
*sb
, const char *p
, const char *field
)
2302 parse_path(sb
, p
, &end
, 1, field
);
2304 die("Garbage after %s: %s", field
, command_buf
.buf
);
2308 * Parse the path string into the strbuf, and ensure it is followed by a space.
2309 * Unquoted strings may not contain spaces. Update *endp to point to the first
2310 * character after the space.
2312 static void parse_path_space(struct strbuf
*sb
, const char *p
,
2313 const char **endp
, const char *field
)
2315 parse_path(sb
, p
, endp
, 0, field
);
2317 die("Missing space after %s: %s", field
, command_buf
.buf
);
2321 static void file_change_m(const char *p
, struct branch
*b
)
2323 static struct strbuf path
= STRBUF_INIT
;
2324 struct object_entry
*oe
;
2325 struct object_id oid
;
2326 uint16_t mode
, inline_data
= 0;
2328 p
= parse_mode(p
, &mode
);
2330 die("Corrupt mode: %s", command_buf
.buf
);
2335 case S_IFREG
| 0644:
2336 case S_IFREG
| 0755:
2343 die("Corrupt mode: %s", command_buf
.buf
);
2347 oe
= find_mark(marks
, parse_mark_ref_space(&p
));
2348 oidcpy(&oid
, &oe
->idx
.oid
);
2349 } else if (skip_prefix(p
, "inline ", &p
)) {
2351 oe
= NULL
; /* not used with inline_data, but makes gcc happy */
2353 if (parse_mapped_oid_hex(p
, &oid
, &p
))
2354 die("Invalid dataref: %s", command_buf
.buf
);
2355 oe
= find_object(&oid
);
2357 die("Missing space after SHA1: %s", command_buf
.buf
);
2360 strbuf_reset(&path
);
2361 parse_path_eol(&path
, p
, "path");
2363 /* Git does not track empty, non-toplevel directories. */
2364 if (S_ISDIR(mode
) &&
2365 is_empty_tree_oid(&oid
, the_repository
->hash_algo
) &&
2367 tree_content_remove(&b
->branch_tree
, path
.buf
, NULL
, 0);
2371 if (S_ISGITLINK(mode
)) {
2373 die("Git links cannot be specified 'inline': %s",
2376 if (oe
->type
!= OBJ_COMMIT
)
2377 die("Not a commit (actually a %s): %s",
2378 type_name(oe
->type
), command_buf
.buf
);
2381 * Accept the object ID without checking; it is expected to be in
2382 * another repository.
2384 } else if (inline_data
) {
2386 die("Directories cannot be specified 'inline': %s",
2388 while (read_next_command() != EOF
) {
2390 if (skip_prefix(command_buf
.buf
, "cat-blob ", &v
))
2393 parse_and_store_blob(&last_blob
, &oid
, 0);
2398 enum object_type expected
= S_ISDIR(mode
) ?
2400 enum object_type type
= oe
? oe
->type
:
2401 oid_object_info(the_repository
, &oid
,
2404 die("%s not found: %s",
2405 S_ISDIR(mode
) ? "Tree" : "Blob",
2407 if (type
!= expected
)
2408 die("Not a %s (actually a %s): %s",
2409 type_name(expected
), type_name(type
),
2414 tree_content_replace(&b
->branch_tree
, &oid
, mode
, NULL
);
2417 tree_content_set(&b
->branch_tree
, path
.buf
, &oid
, mode
, NULL
);
2420 static void file_change_d(const char *p
, struct branch
*b
)
2422 static struct strbuf path
= STRBUF_INIT
;
2424 strbuf_reset(&path
);
2425 parse_path_eol(&path
, p
, "path");
2426 tree_content_remove(&b
->branch_tree
, path
.buf
, NULL
, 1);
2429 static void file_change_cr(const char *p
, struct branch
*b
, int rename
)
2431 static struct strbuf source
= STRBUF_INIT
;
2432 static struct strbuf dest
= STRBUF_INIT
;
2433 struct tree_entry leaf
;
2435 strbuf_reset(&source
);
2436 parse_path_space(&source
, p
, &p
, "source");
2437 strbuf_reset(&dest
);
2438 parse_path_eol(&dest
, p
, "dest");
2440 memset(&leaf
, 0, sizeof(leaf
));
2442 tree_content_remove(&b
->branch_tree
, source
.buf
, &leaf
, 1);
2444 tree_content_get(&b
->branch_tree
, source
.buf
, &leaf
, 1);
2445 if (!leaf
.versions
[1].mode
)
2446 die("Path %s not in branch", source
.buf
);
2447 if (!*dest
.buf
) { /* C "path/to/subdir" "" */
2448 tree_content_replace(&b
->branch_tree
,
2449 &leaf
.versions
[1].oid
,
2450 leaf
.versions
[1].mode
,
2454 tree_content_set(&b
->branch_tree
, dest
.buf
,
2455 &leaf
.versions
[1].oid
,
2456 leaf
.versions
[1].mode
,
2460 static void note_change_n(const char *p
, struct branch
*b
, unsigned char *old_fanout
)
2462 struct object_entry
*oe
;
2464 struct object_id oid
, commit_oid
;
2465 char path
[GIT_MAX_RAWSZ
* 3];
2466 uint16_t inline_data
= 0;
2467 unsigned char new_fanout
;
2470 * When loading a branch, we don't traverse its tree to count the real
2471 * number of notes (too expensive to do this for all non-note refs).
2472 * This means that recently loaded notes refs might incorrectly have
2473 * b->num_notes == 0, and consequently, old_fanout might be wrong.
2475 * Fix this by traversing the tree and counting the number of notes
2476 * when b->num_notes == 0. If the notes tree is truly empty, the
2477 * calculation should not take long.
2479 if (b
->num_notes
== 0 && *old_fanout
== 0) {
2480 /* Invoke change_note_fanout() in "counting mode". */
2481 b
->num_notes
= change_note_fanout(&b
->branch_tree
, 0xff);
2482 *old_fanout
= convert_num_notes_to_fanout(b
->num_notes
);
2485 /* Now parse the notemodify command. */
2486 /* <dataref> or 'inline' */
2488 oe
= find_mark(marks
, parse_mark_ref_space(&p
));
2489 oidcpy(&oid
, &oe
->idx
.oid
);
2490 } else if (skip_prefix(p
, "inline ", &p
)) {
2492 oe
= NULL
; /* not used with inline_data, but makes gcc happy */
2494 if (parse_mapped_oid_hex(p
, &oid
, &p
))
2495 die("Invalid dataref: %s", command_buf
.buf
);
2496 oe
= find_object(&oid
);
2498 die("Missing space after SHA1: %s", command_buf
.buf
);
2502 s
= lookup_branch(p
);
2504 if (is_null_oid(&s
->oid
))
2505 die("Can't add a note on empty branch.");
2506 oidcpy(&commit_oid
, &s
->oid
);
2507 } else if (*p
== ':') {
2508 uintmax_t commit_mark
= parse_mark_ref_eol(p
);
2509 struct object_entry
*commit_oe
= find_mark(marks
, commit_mark
);
2510 if (commit_oe
->type
!= OBJ_COMMIT
)
2511 die("Mark :%" PRIuMAX
" not a commit", commit_mark
);
2512 oidcpy(&commit_oid
, &commit_oe
->idx
.oid
);
2513 } else if (!repo_get_oid(the_repository
, p
, &commit_oid
)) {
2515 char *buf
= read_object_with_reference(the_repository
,
2519 if (!buf
|| size
< the_hash_algo
->hexsz
+ 6)
2520 die("Not a valid commit: %s", p
);
2523 die("Invalid ref name or SHA1 expression: %s", p
);
2526 read_next_command();
2527 parse_and_store_blob(&last_blob
, &oid
, 0);
2529 if (oe
->type
!= OBJ_BLOB
)
2530 die("Not a blob (actually a %s): %s",
2531 type_name(oe
->type
), command_buf
.buf
);
2532 } else if (!is_null_oid(&oid
)) {
2533 enum object_type type
= oid_object_info(the_repository
, &oid
,
2536 die("Blob not found: %s", command_buf
.buf
);
2537 if (type
!= OBJ_BLOB
)
2538 die("Not a blob (actually a %s): %s",
2539 type_name(type
), command_buf
.buf
);
2542 construct_path_with_fanout(oid_to_hex(&commit_oid
), *old_fanout
, path
);
2543 if (tree_content_remove(&b
->branch_tree
, path
, NULL
, 0))
2546 if (is_null_oid(&oid
))
2547 return; /* nothing to insert */
2550 new_fanout
= convert_num_notes_to_fanout(b
->num_notes
);
2551 construct_path_with_fanout(oid_to_hex(&commit_oid
), new_fanout
, path
);
2552 tree_content_set(&b
->branch_tree
, path
, &oid
, S_IFREG
| 0644, NULL
);
2555 static void file_change_deleteall(struct branch
*b
)
2557 release_tree_content_recursive(b
->branch_tree
.tree
);
2558 oidclr(&b
->branch_tree
.versions
[0].oid
, the_repository
->hash_algo
);
2559 oidclr(&b
->branch_tree
.versions
[1].oid
, the_repository
->hash_algo
);
2560 load_tree(&b
->branch_tree
);
2564 static void parse_from_commit(struct branch
*b
, char *buf
, unsigned long size
)
2566 if (!buf
|| size
< the_hash_algo
->hexsz
+ 6)
2567 die("Not a valid commit: %s", oid_to_hex(&b
->oid
));
2568 if (memcmp("tree ", buf
, 5)
2569 || get_oid_hex(buf
+ 5, &b
->branch_tree
.versions
[1].oid
))
2570 die("The commit %s is corrupt", oid_to_hex(&b
->oid
));
2571 oidcpy(&b
->branch_tree
.versions
[0].oid
,
2572 &b
->branch_tree
.versions
[1].oid
);
2575 static void parse_from_existing(struct branch
*b
)
2577 if (is_null_oid(&b
->oid
)) {
2578 oidclr(&b
->branch_tree
.versions
[0].oid
, the_repository
->hash_algo
);
2579 oidclr(&b
->branch_tree
.versions
[1].oid
, the_repository
->hash_algo
);
2584 buf
= read_object_with_reference(the_repository
,
2585 &b
->oid
, OBJ_COMMIT
, &size
,
2587 parse_from_commit(b
, buf
, size
);
2592 static int parse_objectish(struct branch
*b
, const char *objectish
)
2595 struct object_id oid
;
2597 oidcpy(&oid
, &b
->branch_tree
.versions
[1].oid
);
2599 s
= lookup_branch(objectish
);
2601 die("Can't create a branch from itself: %s", b
->name
);
2603 struct object_id
*t
= &s
->branch_tree
.versions
[1].oid
;
2604 oidcpy(&b
->oid
, &s
->oid
);
2605 oidcpy(&b
->branch_tree
.versions
[0].oid
, t
);
2606 oidcpy(&b
->branch_tree
.versions
[1].oid
, t
);
2607 } else if (*objectish
== ':') {
2608 uintmax_t idnum
= parse_mark_ref_eol(objectish
);
2609 struct object_entry
*oe
= find_mark(marks
, idnum
);
2610 if (oe
->type
!= OBJ_COMMIT
)
2611 die("Mark :%" PRIuMAX
" not a commit", idnum
);
2612 if (!oideq(&b
->oid
, &oe
->idx
.oid
)) {
2613 oidcpy(&b
->oid
, &oe
->idx
.oid
);
2614 if (oe
->pack_id
!= MAX_PACK_ID
) {
2616 char *buf
= gfi_unpack_entry(oe
, &size
);
2617 parse_from_commit(b
, buf
, size
);
2620 parse_from_existing(b
);
2622 } else if (!repo_get_oid(the_repository
, objectish
, &b
->oid
)) {
2623 parse_from_existing(b
);
2624 if (is_null_oid(&b
->oid
))
2628 die("Invalid ref name or SHA1 expression: %s", objectish
);
2630 if (b
->branch_tree
.tree
&& !oideq(&oid
, &b
->branch_tree
.versions
[1].oid
)) {
2631 release_tree_content_recursive(b
->branch_tree
.tree
);
2632 b
->branch_tree
.tree
= NULL
;
2635 read_next_command();
2639 static int parse_from(struct branch
*b
)
2643 if (!skip_prefix(command_buf
.buf
, "from ", &from
))
2646 return parse_objectish(b
, from
);
2649 static int parse_objectish_with_prefix(struct branch
*b
, const char *prefix
)
2653 if (!skip_prefix(command_buf
.buf
, prefix
, &base
))
2656 return parse_objectish(b
, base
);
2659 static struct hash_list
*parse_merge(unsigned int *count
)
2661 struct hash_list
*list
= NULL
, **tail
= &list
, *n
;
2666 while (skip_prefix(command_buf
.buf
, "merge ", &from
)) {
2667 n
= xmalloc(sizeof(*n
));
2668 s
= lookup_branch(from
);
2670 oidcpy(&n
->oid
, &s
->oid
);
2671 else if (*from
== ':') {
2672 uintmax_t idnum
= parse_mark_ref_eol(from
);
2673 struct object_entry
*oe
= find_mark(marks
, idnum
);
2674 if (oe
->type
!= OBJ_COMMIT
)
2675 die("Mark :%" PRIuMAX
" not a commit", idnum
);
2676 oidcpy(&n
->oid
, &oe
->idx
.oid
);
2677 } else if (!repo_get_oid(the_repository
, from
, &n
->oid
)) {
2679 char *buf
= read_object_with_reference(the_repository
,
2683 if (!buf
|| size
< the_hash_algo
->hexsz
+ 6)
2684 die("Not a valid commit: %s", from
);
2687 die("Invalid ref name or SHA1 expression: %s", from
);
2694 read_next_command();
/*
 * Handle a "commit <ref>" command; arg is the ref name.
 *
 * Visible steps, in order: find or create the branch, read the optional
 * original identifier, an optional "author", the mandatory "committer"
 * (fatal if absent), an optional "encoding", the message data and any
 * merge parents. Then process file-change commands (M, D, R, C, N,
 * deleteall, ls, cat-blob) until a command that is none of these is
 * pushed back via unread_command_buf. Finally adjust the notes fanout if
 * it changed, store the tree, assemble the commit text in new_data and
 * store it as an OBJ_COMMIT object, recording the result on the branch.
 */
2699 static void parse_new_commit(const char *arg
)
2701 static struct strbuf msg
= STRBUF_INIT
;
2703 char *author
= NULL
;
2704 char *committer
= NULL
;
2705 char *encoding
= NULL
;
2706 struct hash_list
*merge_list
= NULL
;
2707 unsigned int merge_count
;
2708 unsigned char prev_fanout
, new_fanout
;
2711 b
= lookup_branch(arg
);
2713 b
= new_branch(arg
);
2715 read_next_command();
2717 parse_original_identifier();
2718 if (skip_prefix(command_buf
.buf
, "author ", &v
)) {
2719 author
= parse_ident(v
);
2720 read_next_command();
2722 if (skip_prefix(command_buf
.buf
, "committer ", &v
)) {
2723 committer
= parse_ident(v
);
2724 read_next_command();
2727 die("Expected committer but didn't get one");
2728 if (skip_prefix(command_buf
.buf
, "encoding ", &v
)) {
2729 encoding
= xstrdup(v
);
2730 read_next_command();
2732 parse_data(&msg
, 0, NULL
);
2733 read_next_command();
2735 merge_list
= parse_merge(&merge_count
);
2737 /* ensure the branch is active/loaded */
2738 if (!b
->branch_tree
.tree
|| !max_active_branches
) {
2739 unload_one_branch();
2743 prev_fanout
= convert_num_notes_to_fanout(b
->num_notes
);
2746 while (command_buf
.len
> 0) {
2747 if (skip_prefix(command_buf
.buf
, "M ", &v
))
2748 file_change_m(v
, b
);
2749 else if (skip_prefix(command_buf
.buf
, "D ", &v
))
2750 file_change_d(v
, b
);
2751 else if (skip_prefix(command_buf
.buf
, "R ", &v
))
2752 file_change_cr(v
, b
, 1);
2753 else if (skip_prefix(command_buf
.buf
, "C ", &v
))
2754 file_change_cr(v
, b
, 0);
2755 else if (skip_prefix(command_buf
.buf
, "N ", &v
))
2756 note_change_n(v
, b
, &prev_fanout
);
2757 else if (!strcmp("deleteall", command_buf
.buf
))
2758 file_change_deleteall(b
);
2759 else if (skip_prefix(command_buf
.buf
, "ls ", &v
))
2761 else if (skip_prefix(command_buf
.buf
, "cat-blob ", &v
))
2764 unread_command_buf
= 1;
2767 if (read_next_command() == EOF
)
2771 new_fanout
= convert_num_notes_to_fanout(b
->num_notes
);
2772 if (new_fanout
!= prev_fanout
)
2773 b
->num_notes
= change_note_fanout(&b
->branch_tree
, new_fanout
);
2775 /* build the tree and the commit */
2776 store_tree(&b
->branch_tree
);
2777 oidcpy(&b
->branch_tree
.versions
[0].oid
,
2778 &b
->branch_tree
.versions
[1].oid
);
2780 strbuf_reset(&new_data
);
2781 strbuf_addf(&new_data
, "tree %s\n",
2782 oid_to_hex(&b
->branch_tree
.versions
[1].oid
));
2783 if (!is_null_oid(&b
->oid
))
2784 strbuf_addf(&new_data
, "parent %s\n",
2785 oid_to_hex(&b
->oid
));
2786 while (merge_list
) {
2787 struct hash_list
*next
= merge_list
->next
;
2788 strbuf_addf(&new_data
, "parent %s\n",
2789 oid_to_hex(&merge_list
->oid
));
2793 strbuf_addf(&new_data
,
2796 author
? author
: committer
, committer
);
2798 strbuf_addf(&new_data
,
2801 strbuf_addch(&new_data
, '\n');
2802 strbuf_addbuf(&new_data
, &msg
);
2807 if (!store_object(OBJ_COMMIT
, &new_data
, NULL
, &b
->oid
, next_mark
))
2808 b
->pack_id
= pack_id
;
2809 b
->last_commit
= object_count_by_type
[OBJ_COMMIT
];
/*
 * Handle a "tag <name>" command; arg is the tag name.
 *
 * Allocates a struct tag from fi_mem_pool and links it after last_tag.
 * A "from" command is mandatory; its operand is resolved as a branch
 * (which must not be empty), a ":<mark>", or anything repo_get_oid()
 * accepts. After the optional original identifier and "tagger" line, the
 * message data is read, the tag text is assembled in new_data and stored
 * as an OBJ_TAG object. t->pack_id is set to MAX_PACK_ID or to the
 * current pack_id depending on store_object()'s return value.
 */
2812 static void parse_new_tag(const char *arg
)
2814 static struct strbuf msg
= STRBUF_INIT
;
2819 uintmax_t from_mark
= 0;
2820 struct object_id oid
;
2821 enum object_type type
;
2824 t
= mem_pool_calloc(&fi_mem_pool
, 1, sizeof(struct tag
));
2825 t
->name
= mem_pool_strdup(&fi_mem_pool
, arg
);
2827 last_tag
->next_tag
= t
;
2831 read_next_command();
2835 if (!skip_prefix(command_buf
.buf
, "from ", &from
))
2836 die("Expected from command, got %s", command_buf
.buf
);
2837 s
= lookup_branch(from
);
2839 if (is_null_oid(&s
->oid
))
2840 die("Can't tag an empty branch.");
2841 oidcpy(&oid
, &s
->oid
);
2843 } else if (*from
== ':') {
2844 struct object_entry
*oe
;
2845 from_mark
= parse_mark_ref_eol(from
);
2846 oe
= find_mark(marks
, from_mark
);
2848 oidcpy(&oid
, &oe
->idx
.oid
);
2849 } else if (!repo_get_oid(the_repository
, from
, &oid
)) {
2850 struct object_entry
*oe
= find_object(&oid
);
2852 type
= oid_object_info(the_repository
, &oid
, NULL
);
2854 die("Not a valid object: %s", from
);
2858 die("Invalid ref name or SHA1 expression: %s", from
);
2859 read_next_command();
2861 /* original-oid ... */
2862 parse_original_identifier();
2865 if (skip_prefix(command_buf
.buf
, "tagger ", &v
)) {
2866 tagger
= parse_ident(v
);
2867 read_next_command();
2871 /* tag payload/message */
2872 parse_data(&msg
, 0, NULL
);
2874 /* build the tag object */
2875 strbuf_reset(&new_data
);
2877 strbuf_addf(&new_data
,
2881 oid_to_hex(&oid
), type_name(type
), t
->name
);
2883 strbuf_addf(&new_data
,
2884 "tagger %s\n", tagger
);
2885 strbuf_addch(&new_data
, '\n');
2886 strbuf_addbuf(&new_data
, &msg
);
2889 if (store_object(OBJ_TAG
, &new_data
, NULL
, &t
->oid
, next_mark
))
2890 t
->pack_id
= MAX_PACK_ID
;
2892 t
->pack_id
= pack_id
;
/*
 * Handle a "reset <ref>" command; arg is the ref name.
 *
 * For a branch found by lookup_branch(), clears its commit oid and both
 * tree versions and releases any loaded tree; new_branch(arg) is the
 * other visible way b is obtained. After reading the next command, a
 * branch flagged for deletion whose name lies under "refs/tags/" has the
 * matching entry unlinked from the tag list. A non-empty pending command
 * is pushed back via unread_command_buf.
 */
2895 static void parse_reset_branch(const char *arg
)
2898 const char *tag_name
;
2900 b
= lookup_branch(arg
);
2902 oidclr(&b
->oid
, the_repository
->hash_algo
);
2903 oidclr(&b
->branch_tree
.versions
[0].oid
, the_repository
->hash_algo
);
2904 oidclr(&b
->branch_tree
.versions
[1].oid
, the_repository
->hash_algo
);
2905 if (b
->branch_tree
.tree
) {
2906 release_tree_content_recursive(b
->branch_tree
.tree
);
2907 b
->branch_tree
.tree
= NULL
;
2911 b
= new_branch(arg
);
2912 read_next_command();
2914 if (b
->delete && skip_prefix(b
->name
, "refs/tags/", &tag_name
)) {
2916 * Elsewhere, we call dump_branches() before dump_tags(),
2917 * and dump_branches() will handle ref deletions first, so
2918 * in order to make sure the deletion actually takes effect,
2919 * we need to remove the tag from our list of tags to update.
2921 * NEEDSWORK: replace list of tags with hashmap for faster
2924 struct tag
*t
, *prev
= NULL
;
2925 for (t
= first_tag
; t
; t
= t
->next_tag
) {
2926 if (!strcmp(t
->name
, tag_name
))
2932 prev
->next_tag
= t
->next_tag
;
2934 first_tag
= t
->next_tag
;
2937 /* There is no mem_pool_free(t) function to call. */
2940 if (command_buf
.len
> 0)
2941 unread_command_buf
= 1;
2944 static void cat_blob_write(const char *buf
, unsigned long size
)
2946 if (write_in_full(cat_blob_fd
, buf
, size
) < 0)
2947 die_errno("Write to frontend failed");
/*
 * Send the blob named by oid to the frontend through cat_blob_write().
 *
 * The content is read with repo_read_object_file() when oe is NULL or its
 * pack_id is MAX_PACK_ID, otherwise with gfi_unpack_entry(). The visible
 * outputs are a "<oid> missing" line, or a "<oid> <type> <size>" header
 * followed by the content and a newline. An unreadable object or a
 * non-blob type is fatal. When oe belongs to the pack currently being
 * written (oe->pack_id == pack_id), the buffer is attached to last_blob
 * together with the entry's offset and depth.
 */
2950 static void cat_blob(struct object_entry
*oe
, struct object_id
*oid
)
2952 struct strbuf line
= STRBUF_INIT
;
2954 enum object_type type
= 0;
2957 if (!oe
|| oe
->pack_id
== MAX_PACK_ID
) {
2958 buf
= repo_read_object_file(the_repository
, oid
, &type
, &size
);
2961 buf
= gfi_unpack_entry(oe
, &size
);
2965 * Output based on batch_one_object() from cat-file.c.
2968 strbuf_reset(&line
);
2969 strbuf_addf(&line
, "%s missing\n", oid_to_hex(oid
));
2970 cat_blob_write(line
.buf
, line
.len
);
2971 strbuf_release(&line
);
2976 die("Can't read object %s", oid_to_hex(oid
));
2977 if (type
!= OBJ_BLOB
)
2978 die("Object %s is a %s but a blob was expected.",
2979 oid_to_hex(oid
), type_name(type
));
2980 strbuf_reset(&line
);
2981 strbuf_addf(&line
, "%s %s %"PRIuMAX
"\n", oid_to_hex(oid
),
2982 type_name(type
), (uintmax_t)size
);
2983 cat_blob_write(line
.buf
, line
.len
);
2984 strbuf_release(&line
);
2985 cat_blob_write(buf
, size
);
2986 cat_blob_write("\n", 1);
2987 if (oe
&& oe
->pack_id
== pack_id
) {
2988 last_blob
.offset
= oe
->idx
.offset
;
2989 strbuf_attach(&last_blob
.data
, buf
, size
, size
);
2990 last_blob
.depth
= oe
->depth
;
/*
 * Handle "get-mark SP <object> LF"; p is the text after the command name.
 *
 * Looks the mark up with find_mark() and writes the object's hex oid
 * followed by a newline (hexsz + 1 bytes) through cat_blob_write().
 * The two visible die() calls report "Not a mark" and "Unknown mark".
 */
2995 static void parse_get_mark(const char *p
)
2997 struct object_entry
*oe
;
2998 char output
[GIT_MAX_HEXSZ
+ 2];
3000 /* get-mark SP <object> LF */
3002 die("Not a mark: %s", p
);
3004 oe
= find_mark(marks
, parse_mark_ref_eol(p
));
3006 die("Unknown mark: %s", command_buf
.buf
);
3008 xsnprintf(output
, sizeof(output
), "%s\n", oid_to_hex(&oe
->idx
.oid
));
3009 cat_blob_write(output
, the_hash_algo
->hexsz
+ 1);
/*
 * Handle "cat-blob SP <object> LF"; p is the text after the command name.
 *
 * The operand is resolved either through find_mark() (an unknown mark is
 * fatal) or by parsing a hex object name with parse_mapped_oid_hex() and
 * looking it up with find_object(). An invalid dataref or trailing
 * garbage after the object name is fatal.
 */
3012 static void parse_cat_blob(const char *p
)
3014 struct object_entry
*oe
;
3015 struct object_id oid
;
3017 /* cat-blob SP <object> LF */
3019 oe
= find_mark(marks
, parse_mark_ref_eol(p
));
3021 die("Unknown mark: %s", command_buf
.buf
);
3022 oidcpy(&oid
, &oe
->idx
.oid
);
3024 if (parse_mapped_oid_hex(p
, &oid
, &p
))
3025 die("Invalid dataref: %s", command_buf
.buf
);
3027 die("Garbage after SHA1: %s", command_buf
.buf
);
3028 oe
= find_object(&oid
);
/*
 * Peel one layer off the object named by *oid.
 *
 * An object not yet known is looked up with oid_object_info() (fatal if
 * not found) and registered via insert_object() with pack_id set to
 * MAX_PACK_ID. The object body is read with gfi_unpack_entry() when it
 * lives in a pack being written, otherwise with repo_read_object_file().
 * *oid is then overwritten with the hex name that follows "object " (for
 * a tag) or "tree " (for a commit), and the entry find_object() returns
 * for the new *oid is handed back. Anything that is not a tree-ish is
 * fatal.
 */
3034 static struct object_entry
*dereference(struct object_entry
*oe
,
3035 struct object_id
*oid
)
3039 const unsigned hexsz
= the_hash_algo
->hexsz
;
3042 enum object_type type
= oid_object_info(the_repository
, oid
,
3045 die("object not found: %s", oid_to_hex(oid
));
3047 oe
= insert_object(oid
);
3049 oe
->pack_id
= MAX_PACK_ID
;
3053 case OBJ_TREE
: /* easy case. */
3059 die("Not a tree-ish: %s", command_buf
.buf
);
3062 if (oe
->pack_id
!= MAX_PACK_ID
) { /* in a pack being written */
3063 buf
= gfi_unpack_entry(oe
, &size
);
3065 enum object_type unused
;
3066 buf
= repo_read_object_file(the_repository
, oid
, &unused
,
3070 die("Can't load object %s", oid_to_hex(oid
));
3072 /* Peel one layer. */
3075 if (size
< hexsz
+ strlen("object ") ||
3076 get_oid_hex(buf
+ strlen("object "), oid
))
3077 die("Invalid SHA1 in tag: %s", command_buf
.buf
);
3080 if (size
< hexsz
+ strlen("tree ") ||
3081 get_oid_hex(buf
+ strlen("tree "), oid
))
3082 die("Invalid SHA1 in commit: %s", command_buf
.buf
);
3086 return find_object(oid
);
/*
 * for_each_mark() callback used by build_mark_map_one().
 *
 * object is the object_id stored under mark in the source set; cbp is the
 * mark set in which the same mark is looked up with find_mark(). The
 * result is recorded in sub_oid_map as a mapping from the source oid to
 * the looked-up oid.
 */
3089 static void insert_mapped_mark(uintmax_t mark
, void *object
, void *cbp
)
3091 struct object_id
*fromoid
= object
;
3092 struct object_id
*tooid
= find_mark(cbp
, mark
);
3096 it
= kh_put_oid_map(sub_oid_map
, *fromoid
, &ret
);
3097 /* We've already seen this object. */
3100 kh_value(sub_oid_map
, it
) = tooid
;
3103 static void build_mark_map_one(struct mark_set
*from
, struct mark_set
*to
)
3105 for_each_mark(from
, 0, insert_mapped_mark
, to
);
/*
 * Initialize sub_oid_map and fill it from the per-submodule mark sets.
 *
 * For every item in "from", the item with the same string is looked up
 * in "to" and the two mark sets (stored in ->util) are combined with
 * build_mark_map_one(). Missing marks on either side are fatal.
 */
3108 static void build_mark_map(struct string_list
*from
, struct string_list
*to
)
3110 struct string_list_item
*fromp
, *top
;
3112 sub_oid_map
= kh_init_oid_map();
3114 for_each_string_list_item(fromp
, from
) {
3115 top
= string_list_lookup(to
, fromp
->string
);
3117 die(_("Missing from marks for submodule '%s'"), fromp
->string
);
3118 } else if (!top
|| !top
->util
) {
3119 die(_("Missing to marks for submodule '%s'"), fromp
->string
);
3121 build_mark_map_one(fromp
->util
, top
->util
);
/*
 * Parse a tree-ish at *p, given either as ":<mark>" or as a hex object
 * name, advancing *p past it.
 *
 * An unknown mark, an invalid dataref, or a missing space after the
 * tree-ish is fatal. The resolved entry is peeled with dereference()
 * until it is of type OBJ_TREE.
 */
3125 static struct object_entry
*parse_treeish_dataref(const char **p
)
3127 struct object_id oid
;
3128 struct object_entry
*e
;
3130 if (**p
== ':') { /* <mark> */
3131 e
= find_mark(marks
, parse_mark_ref_space(p
));
3133 die("Unknown mark: %s", command_buf
.buf
);
3134 oidcpy(&oid
, &e
->idx
.oid
);
3135 } else { /* <sha1> */
3136 if (parse_mapped_oid_hex(*p
, &oid
, p
))
3137 die("Invalid dataref: %s", command_buf
.buf
);
3138 e
= find_object(&oid
);
3140 die("Missing space after tree-ish: %s", command_buf
.buf
);
3143 while (!e
|| e
->type
!= OBJ_TREE
)
3144 e
= dereference(e
, &oid
);
/*
 * Write one "ls" response line through cat_blob_write().
 *
 * The line is either "missing SP path LF" or
 * "mode SP type SP object_name TAB path LF", with the path quoted by
 * quote_c_style(). The NO_DELTA bit is masked out of the printed mode.
 * The type string is chosen from the mode (gitlink -> commit_type,
 * directory -> tree_type are the visible cases).
 */
3148 static void print_ls(int mode
, const unsigned char *hash
, const char *path
)
3150 static struct strbuf line
= STRBUF_INIT
;
3152 /* See show_tree(). */
3154 S_ISGITLINK(mode
) ? commit_type
:
3155 S_ISDIR(mode
) ? tree_type
:
3159 /* missing SP path LF */
3160 strbuf_reset(&line
);
3161 strbuf_addstr(&line
, "missing ");
3162 quote_c_style(path
, &line
, NULL
, 0);
3163 strbuf_addch(&line
, '\n');
3165 /* mode SP type SP object_name TAB path LF */
3166 strbuf_reset(&line
);
3167 strbuf_addf(&line
, "%06o %s %s\t",
3168 mode
& ~NO_DELTA
, type
, hash_to_hex(hash
));
3169 quote_c_style(path
, &line
, NULL
, 0);
3170 strbuf_addch(&line
, '\n');
3172 cat_blob_write(line
.buf
, line
.len
);
/*
 * Handle "ls SP (<tree-ish> SP)? <path>"; p is the text after "ls ".
 *
 * The root is either the branch's own tree (&b->branch_tree; the
 * "Not in a commit" error belongs to this form) or a temporary tree
 * entry created from an explicit tree-ish. The path is looked up with
 * tree_content_get() and the result printed with print_ls(). The leaf's
 * tree content is released afterwards, and so is the root unless it is
 * the branch's own tree.
 */
3175 static void parse_ls(const char *p
, struct branch
*b
)
3177 static struct strbuf path
= STRBUF_INIT
;
3178 struct tree_entry
*root
= NULL
;
3179 struct tree_entry leaf
= {NULL
};
3181 /* ls SP (<tree-ish> SP)? <path> */
3184 die("Not in a commit: %s", command_buf
.buf
);
3185 root
= &b
->branch_tree
;
3187 struct object_entry
*e
= parse_treeish_dataref(&p
);
3188 root
= new_tree_entry();
3189 oidcpy(&root
->versions
[1].oid
, &e
->idx
.oid
);
3190 if (!is_null_oid(&root
->versions
[1].oid
))
3191 root
->versions
[1].mode
= S_IFDIR
;
3194 strbuf_reset(&path
);
3195 parse_path_eol(&path
, p
, "path");
3196 tree_content_get(root
, path
.buf
, &leaf
, 1);
3198 * A directory in preparation would have a sha1 of zero
3199 * until it is saved. Save, for simplicity.
3201 if (S_ISDIR(leaf
.versions
[1].mode
))
3204 print_ls(leaf
.versions
[1].mode
, leaf
.versions
[1].oid
.hash
, path
.buf
);
3206 release_tree_content_recursive(leaf
.tree
);
3207 if (!b
|| root
!= &b
->branch_tree
)
3208 release_tree_entry(root
);
/*
 * Perform a checkpoint. The only statement visible here clears the
 * checkpoint_requested flag.
 */
3211 static void checkpoint(void)
3213 checkpoint_requested
= 0;
/*
 * Handle the "checkpoint" command by setting checkpoint_requested; the
 * main command loop in cmd_fast_import() tests that flag after each
 * command.
 */
3222 static void parse_checkpoint(void)
3224 checkpoint_requested
= 1;
/*
 * Handle a "progress" command by echoing the whole command line held in
 * command_buf, followed by a newline, to stdout.
 */
3228 static void parse_progress(void)
3230 fwrite(command_buf
.buf
, 1, command_buf
.len
, stdout
);
3231 fputc('\n', stdout
);
/*
 * Handle the "alias" command: assign a mark to an existing object.
 *
 * Expects a 'mark' command followed by a "to <objectish>" line (each is
 * fatal if absent). The objectish is resolved into a zeroed scratch
 * struct branch with parse_objectish_with_prefix(), the object is looked
 * up with find_object(), and it is registered under next_mark.
 */
3236 static void parse_alias(void)
3238 struct object_entry
*e
;
3242 read_next_command();
3247 die(_("Expected 'mark' command, got %s"), command_buf
.buf
);
3250 memset(&b
, 0, sizeof(b
));
3251 if (!parse_objectish_with_prefix(&b
, "to "))
3252 die(_("Expected 'to' command, got %s"), command_buf
.buf
);
3253 e
= find_object(&b
.oid
);
3255 insert_mark(&marks
, next_mark
, e
);
3258 static char* make_fast_import_path(const char *path
)
3260 if (!relative_marks_paths
|| is_absolute_path(path
))
3261 return prefix_filename(global_prefix
, path
);
3262 return git_pathdup("info/fast-import/%s", path
);
/*
 * Record the marks file to import.
 *
 * marks is the path argument, from_stream says whether the request came
 * from the input stream, and ignore_missing is stored for later use.
 * When a marks file was already set, the visible code can die with
 * "Only one import-marks command allowed per stream" and checks
 * import_marks_file_from_stream before replacing it. The previous path
 * is freed and the new one is built with make_fast_import_path().
 */
3265 static void option_import_marks(const char *marks
,
3266 int from_stream
, int ignore_missing
)
3268 if (import_marks_file
) {
3270 die("Only one import-marks command allowed per stream");
3272 /* read previous mark file */
3273 if(!import_marks_file_from_stream
)
3277 free(import_marks_file
);
3278 import_marks_file
= make_fast_import_path(marks
);
3279 import_marks_file_from_stream
= from_stream
;
3280 import_marks_file_ignore_missing
= ignore_missing
;
3283 static void option_date_format(const char *fmt
)
3285 if (!strcmp(fmt
, "raw"))
3286 whenspec
= WHENSPEC_RAW
;
3287 else if (!strcmp(fmt
, "raw-permissive"))
3288 whenspec
= WHENSPEC_RAW_PERMISSIVE
;
3289 else if (!strcmp(fmt
, "rfc2822"))
3290 whenspec
= WHENSPEC_RFC2822
;
3291 else if (!strcmp(fmt
, "now"))
3292 whenspec
= WHENSPEC_NOW
;
3294 die("unknown --date-format argument %s", fmt
);
/*
 * Parse arg as a non-negative integer for the named option.
 *
 * The number is read with strtoul() using base auto-detection (base 0).
 * The argument is rejected, fatally, when it contains a '-' anywhere,
 * when no digits were consumed, or when trailing characters remain.
 */
static unsigned long ulong_arg(const char *option, const char *arg)
{
	char *tail;
	unsigned long value = strtoul(arg, &tail, 0);
	int has_minus = strchr(arg, '-') != NULL;
	int fully_parsed = tail != arg && !*tail;

	if (has_minus || !fully_parsed)
		die("%s: argument must be a non-negative integer", option);
	return value;
}
3306 static void option_depth(const char *depth
)
3308 max_depth
= ulong_arg("--depth", depth
);
3309 if (max_depth
> MAX_DEPTH
)
3310 die("--depth cannot exceed %u", MAX_DEPTH
);
3313 static void option_active_branches(const char *branches
)
3315 max_active_branches
= ulong_arg("--active-branches", branches
);
3318 static void option_export_marks(const char *marks
)
3320 free(export_marks_file
);
3321 export_marks_file
= make_fast_import_path(marks
);
3324 static void option_cat_blob_fd(const char *fd
)
3326 unsigned long n
= ulong_arg("--cat-blob-fd", fd
);
3327 if (n
> (unsigned long) INT_MAX
)
3328 die("--cat-blob-fd cannot exceed %d", INT_MAX
);
3329 cat_blob_fd
= (int) n
;
/*
 * Handle --export-pack-edges=<file>: resolve the file name against
 * global_prefix and open it in append mode, storing the stream in
 * pack_edges.
 */
3332 static void option_export_pack_edges(const char *edges
)
3334 char *fn
= prefix_filename(global_prefix
, edges
);
3337 pack_edges
= xfopen(fn
, "a");
/*
 * Handle a rewrite-submodules-{from,to}=<name>:<filename> argument.
 *
 * arg is split at the first ':'; a missing separator is fatal. A fresh
 * mark_set is allocated and filled by read_mark_file() from the named
 * file (resolved against global_prefix; failure to read it is fatal),
 * then stored as ->util of the entry string_list_insert() returns for
 * the duplicated string s.
 */
3341 static void option_rewrite_submodules(const char *arg
, struct string_list
*list
)
3343 struct mark_set
*ms
;
3345 char *s
= xstrdup(arg
);
3346 char *f
= strchr(s
, ':');
3348 die(_("Expected format name:filename for submodule rewrite option"));
3351 CALLOC_ARRAY(ms
, 1);
3353 f
= prefix_filename(global_prefix
, f
);
3356 die_errno("cannot read '%s'", f
);
3357 read_mark_file(&ms
, fp
, insert_oid_entry
);
3361 string_list_insert(list
, s
)->util
= ms
;
/*
 * Try to interpret option (without any leading "--") as one of the
 * options shared between the command line and "option git" stream lines.
 *
 * Recognized here: max-pack-size=, big-file-threshold=, depth=,
 * active-branches=, export-pack-edges=, quiet, stats and
 * allow-unsafe-features (the last is a no-op because it is handled
 * during early option parsing). Callers treat a non-zero return as
 * "handled".
 */
3366 static int parse_one_option(const char *option
)
3368 if (skip_prefix(option
, "max-pack-size=", &option
)) {
3370 if (!git_parse_ulong(option
, &v
))
3373 warning("max-pack-size is now in bytes, assuming --max-pack-size=%lum", v
);
3375 } else if (v
< 1024 * 1024) {
3376 warning("minimum max-pack-size is 1 MiB");
3380 } else if (skip_prefix(option
, "big-file-threshold=", &option
)) {
3382 if (!git_parse_ulong(option
, &v
))
3384 big_file_threshold
= v
;
3385 } else if (skip_prefix(option
, "depth=", &option
)) {
3386 option_depth(option
);
3387 } else if (skip_prefix(option
, "active-branches=", &option
)) {
3388 option_active_branches(option
);
3389 } else if (skip_prefix(option
, "export-pack-edges=", &option
)) {
3390 option_export_pack_edges(option
);
3391 } else if (!strcmp(option
, "quiet")) {
3393 } else if (!strcmp(option
, "stats")) {
3395 } else if (!strcmp(option
, "allow-unsafe-features")) {
3396 ; /* already handled during early option parsing */
3404 static void check_unsafe_feature(const char *feature
, int from_stream
)
3406 if (from_stream
&& !allow_unsafe_features
)
3407 die(_("feature '%s' forbidden in input without --allow-unsafe-features"),
/*
 * Try to interpret feature as one of the supported "feature" names.
 *
 * from_stream is non-zero when the request comes from the input stream;
 * import-marks, import-marks-if-exists and export-marks are passed
 * through check_unsafe_feature() first. Features that need no action
 * (alias, get-mark, cat-blob, notes, ls) are accepted silently. Callers
 * treat a non-zero return as "handled".
 */
3411 static int parse_one_feature(const char *feature
, int from_stream
)
3415 if (skip_prefix(feature
, "date-format=", &arg
)) {
3416 option_date_format(arg
);
3417 } else if (skip_prefix(feature
, "import-marks=", &arg
)) {
3418 check_unsafe_feature("import-marks", from_stream
);
3419 option_import_marks(arg
, from_stream
, 0);
3420 } else if (skip_prefix(feature
, "import-marks-if-exists=", &arg
)) {
3421 check_unsafe_feature("import-marks-if-exists", from_stream
);
3422 option_import_marks(arg
, from_stream
, 1);
3423 } else if (skip_prefix(feature
, "export-marks=", &arg
)) {
3424 check_unsafe_feature(feature
, from_stream
);
3425 option_export_marks(arg
);
3426 } else if (!strcmp(feature
, "alias")) {
3427 ; /* Don't die - this feature is supported */
3428 } else if (skip_prefix(feature
, "rewrite-submodules-to=", &arg
)) {
3429 option_rewrite_submodules(arg
, &sub_marks_to
);
3430 } else if (skip_prefix(feature
, "rewrite-submodules-from=", &arg
)) {
3431 option_rewrite_submodules(arg
, &sub_marks_from
);
3432 } else if (!strcmp(feature
, "get-mark")) {
3433 ; /* Don't die - this feature is supported */
3434 } else if (!strcmp(feature
, "cat-blob")) {
3435 ; /* Don't die - this feature is supported */
3436 } else if (!strcmp(feature
, "relative-marks")) {
3437 relative_marks_paths
= 1;
3438 } else if (!strcmp(feature
, "no-relative-marks")) {
3439 relative_marks_paths
= 0;
3440 } else if (!strcmp(feature
, "done")) {
3441 require_explicit_termination
= 1;
3442 } else if (!strcmp(feature
, "force")) {
3444 } else if (!strcmp(feature
, "notes") || !strcmp(feature
, "ls")) {
3445 ; /* do nothing; we have the feature */
3453 static void parse_feature(const char *feature
)
3455 if (seen_data_command
)
3456 die("Got feature command '%s' after data command", feature
);
3458 if (parse_one_feature(feature
, 1))
3461 die("This version of fast-import does not support feature %s.", feature
);
3464 static void parse_option(const char *option
)
3466 if (seen_data_command
)
3467 die("Got option command '%s' after data command", option
);
3469 if (parse_one_option(option
))
3472 die("This version of fast-import does not support option: %s", option
);
/*
 * Load pack-related settings from the git configuration.
 *
 * Reads pack.depth (clamped to MAX_DEPTH), pack.indexversion (a value
 * above 2 is a fatal config error), pack.packsizelimit, and the unpack
 * limit from fastimport.unpacklimit, falling back to
 * transfer.unpacklimit. Finishes by running git_config() with
 * git_default_config.
 */
3475 static void git_pack_config(void)
3477 int indexversion_value
;
3479 unsigned long packsizelimit_value
;
3481 if (!git_config_get_ulong("pack.depth", &max_depth
)) {
3482 if (max_depth
> MAX_DEPTH
)
3483 max_depth
= MAX_DEPTH
;
3485 if (!git_config_get_int("pack.indexversion", &indexversion_value
)) {
3486 pack_idx_opts
.version
= indexversion_value
;
3487 if (pack_idx_opts
.version
> 2)
3488 git_die_config(the_repository
, "pack.indexversion",
3489 "bad pack.indexVersion=%"PRIu32
, pack_idx_opts
.version
);
3491 if (!git_config_get_ulong("pack.packsizelimit", &packsizelimit_value
))
3492 max_packsize
= packsizelimit_value
;
3494 if (!git_config_get_int("fastimport.unpacklimit", &limit
))
3495 unpack_limit
= limit
;
3496 else if (!git_config_get_int("transfer.unpacklimit", &limit
))
3497 unpack_limit
= limit
;
3499 git_config(git_default_config
, NULL
);
/* One-line usage synopsis passed to usage(). */
static const char fast_import_usage[] =
	"git fast-import"
	" [--date-format=<f>]"
	" [--max-pack-size=<n>]"
	" [--big-file-threshold=<n>]"
	" [--depth=<n>]"
	" [--active-branches=<n>]"
	" [--export-marks=<marks.file>]";
/*
 * Parse the saved command line (global_argc / global_argv).
 *
 * Each argument starting with "--" is tried, in order, as a shared
 * option (parse_one_option), as a feature given on the command line
 * (parse_one_feature with from_stream == 0), and as --cat-blob-fd=;
 * anything else is fatal. Leftover non-option arguments lead to the
 * usage message. Afterwards seen_data_command is set, and the submodule
 * mark map is built from sub_marks_from and sub_marks_to.
 */
3505 static void parse_argv(void)
3509 for (i
= 1; i
< global_argc
; i
++) {
3510 const char *a
= global_argv
[i
];
3512 if (*a
!= '-' || !strcmp(a
, "--"))
3515 if (!skip_prefix(a
, "--", &a
))
3516 die("unknown option %s", a
);
3518 if (parse_one_option(a
))
3521 if (parse_one_feature(a
, 0))
3524 if (skip_prefix(a
, "cat-blob-fd=", &a
)) {
3525 option_cat_blob_fd(a
);
3529 die("unknown option --%s", a
);
3531 if (i
!= global_argc
)
3532 usage(fast_import_usage
);
3534 seen_data_command
= 1;
3535 if (import_marks_file
)
3537 build_mark_map(&sub_marks_from
, &sub_marks_to
);
/*
 * Entry point of the fast-import builtin.
 *
 * Prints the usage message for a lone "-h". Otherwise it initializes the
 * pack index options, object pool, command buffer, the atom / branch /
 * tree tables, the mark set and the object hashmap, and pre-scans argv
 * for --allow-unsafe-features. It then installs die_nicely and the
 * checkpoint signal handler and dispatches every command returned by
 * read_next_command() to its parser; an unsupported command is fatal.
 * With require_explicit_termination set, reaching end of input on stdin
 * is fatal ("stream ends early"). The statistics block writes object,
 * branch, mark, atom and memory counters to stderr. Returns 1 when
 * failure is set, else 0.
 */
3540 int cmd_fast_import(int argc
,
3543 struct repository
*repo UNUSED
)
3547 if (argc
== 2 && !strcmp(argv
[1], "-h"))
3548 usage(fast_import_usage
);
3550 reset_pack_idx_option(&pack_idx_opts
);
3553 alloc_objects(object_entry_alloc
);
3554 strbuf_init(&command_buf
, 0);
3555 CALLOC_ARRAY(atom_table
, atom_table_sz
);
3556 CALLOC_ARRAY(branch_table
, branch_table_sz
);
3557 CALLOC_ARRAY(avail_tree_table
, avail_tree_table_sz
);
3558 marks
= mem_pool_calloc(&fi_mem_pool
, 1, sizeof(struct mark_set
));
3560 hashmap_init(&object_table
, object_entry_hashcmp
, NULL
, 0);
3563 * We don't parse most options until after we've seen the set of
3564 * "feature" lines at the start of the stream (which allows the command
3565 * line to override stream data). But we must do an early parse of any
3566 * command-line options that impact how we interpret the feature lines.
3568 for (i
= 1; i
< argc
; i
++) {
3569 const char *arg
= argv
[i
];
3570 if (*arg
!= '-' || !strcmp(arg
, "--"))
3572 if (!strcmp(arg
, "--allow-unsafe-features"))
3573 allow_unsafe_features
= 1;
3578 global_prefix
= prefix
;
3580 rc_free
= mem_pool_alloc(&fi_mem_pool
, cmd_save
* sizeof(*rc_free
));
3581 for (i
= 0; i
< (cmd_save
- 1); i
++)
3582 rc_free
[i
].next
= &rc_free
[i
+ 1];
3583 rc_free
[cmd_save
- 1].next
= NULL
;
3586 set_die_routine(die_nicely
);
3587 set_checkpoint_signal();
3588 while (read_next_command() != EOF
) {
3590 if (!strcmp("blob", command_buf
.buf
))
3592 else if (skip_prefix(command_buf
.buf
, "commit ", &v
))
3593 parse_new_commit(v
);
3594 else if (skip_prefix(command_buf
.buf
, "tag ", &v
))
3596 else if (skip_prefix(command_buf
.buf
, "reset ", &v
))
3597 parse_reset_branch(v
);
3598 else if (skip_prefix(command_buf
.buf
, "ls ", &v
))
3600 else if (skip_prefix(command_buf
.buf
, "cat-blob ", &v
))
3602 else if (skip_prefix(command_buf
.buf
, "get-mark ", &v
))
3604 else if (!strcmp("checkpoint", command_buf
.buf
))
3606 else if (!strcmp("done", command_buf
.buf
))
3608 else if (!strcmp("alias", command_buf
.buf
))
3610 else if (starts_with(command_buf
.buf
, "progress "))
3612 else if (skip_prefix(command_buf
.buf
, "feature ", &v
))
3614 else if (skip_prefix(command_buf
.buf
, "option git ", &v
))
3616 else if (starts_with(command_buf
.buf
, "option "))
3617 /* ignore non-git options*/;
3619 die("Unsupported command: %s", command_buf
.buf
);
3621 if (checkpoint_requested
)
3625 /* argv hasn't been parsed yet, do so */
3626 if (!seen_data_command
)
3629 if (require_explicit_termination
&& feof(stdin
))
3630 die("stream ends early");
3643 uintmax_t total_count
= 0, duplicate_count
= 0;
3644 for (i
= 0; i
< ARRAY_SIZE(object_count_by_type
); i
++)
3645 total_count
+= object_count_by_type
[i
];
3646 for (i
= 0; i
< ARRAY_SIZE(duplicate_count_by_type
); i
++)
3647 duplicate_count
+= duplicate_count_by_type
[i
];
3649 fprintf(stderr
, "%s statistics:\n", argv
[0]);
3650 fprintf(stderr
, "---------------------------------------------------------------------\n");
3651 fprintf(stderr
, "Alloc'd objects: %10" PRIuMAX
"\n", alloc_count
);
3652 fprintf(stderr
, "Total objects: %10" PRIuMAX
" (%10" PRIuMAX
" duplicates )\n", total_count
, duplicate_count
);
3653 fprintf(stderr
, " blobs : %10" PRIuMAX
" (%10" PRIuMAX
" duplicates %10" PRIuMAX
" deltas of %10" PRIuMAX
" attempts)\n", object_count_by_type
[OBJ_BLOB
], duplicate_count_by_type
[OBJ_BLOB
], delta_count_by_type
[OBJ_BLOB
], delta_count_attempts_by_type
[OBJ_BLOB
]);
3654 fprintf(stderr
, " trees : %10" PRIuMAX
" (%10" PRIuMAX
" duplicates %10" PRIuMAX
" deltas of %10" PRIuMAX
" attempts)\n", object_count_by_type
[OBJ_TREE
], duplicate_count_by_type
[OBJ_TREE
], delta_count_by_type
[OBJ_TREE
], delta_count_attempts_by_type
[OBJ_TREE
]);
3655 fprintf(stderr
, " commits: %10" PRIuMAX
" (%10" PRIuMAX
" duplicates %10" PRIuMAX
" deltas of %10" PRIuMAX
" attempts)\n", object_count_by_type
[OBJ_COMMIT
], duplicate_count_by_type
[OBJ_COMMIT
], delta_count_by_type
[OBJ_COMMIT
], delta_count_attempts_by_type
[OBJ_COMMIT
]);
3656 fprintf(stderr
, " tags : %10" PRIuMAX
" (%10" PRIuMAX
" duplicates %10" PRIuMAX
" deltas of %10" PRIuMAX
" attempts)\n", object_count_by_type
[OBJ_TAG
], duplicate_count_by_type
[OBJ_TAG
], delta_count_by_type
[OBJ_TAG
], delta_count_attempts_by_type
[OBJ_TAG
]);
3657 fprintf(stderr
, "Total branches: %10lu (%10lu loads )\n", branch_count
, branch_load_count
);
3658 fprintf(stderr
, " marks: %10" PRIuMAX
" (%10" PRIuMAX
" unique )\n", (((uintmax_t)1) << marks
->shift
) * 1024, marks_set_count
);
3659 fprintf(stderr
, " atoms: %10u\n", atom_cnt
);
3660 fprintf(stderr
, "Memory total: %10" PRIuMAX
" KiB\n", (tree_entry_allocd
+ fi_mem_pool
.pool_alloc
+ alloc_count
*sizeof(struct object_entry
))/1024);
3661 fprintf(stderr
, " pools: %10lu KiB\n", (unsigned long)((tree_entry_allocd
+ fi_mem_pool
.pool_alloc
) /1024));
3662 fprintf(stderr
, " objects: %10" PRIuMAX
" KiB\n", (alloc_count
*sizeof(struct object_entry
))/1024);
3663 fprintf(stderr
, "---------------------------------------------------------------------\n");
3665 fprintf(stderr
, "---------------------------------------------------------------------\n");
3666 fprintf(stderr
, "\n");
3669 return failure
? 1 : 0;