13 #include "streaming.h"
14 #include "thread-utils.h"
16 #include "object-store.h"
17 #include "promisor-remote.h"
19 static const char index_pack_usage
[] =
20 "git index-pack [-v] [-o <index-file>] [--keep | --keep=<msg>] [--verify] [--strict] (<pack-file> | --stdin [--fix-thin] [<pack-file>])";
23 struct pack_idx_entry idx
;
25 unsigned char hdr_size
;
27 signed char real_type
;
36 struct base_data
*base
;
37 struct base_data
*child
;
38 struct object_entry
*obj
;
41 int ref_first
, ref_last
;
42 int ofs_first
, ofs_last
;
47 struct base_data
*base_cache
;
48 size_t base_cache_used
;
52 /* Remember to update object flag allocation in object.h */
53 #define FLAG_LINK (1u<<20)
54 #define FLAG_CHECKED (1u<<21)
56 struct ofs_delta_entry
{
61 struct ref_delta_entry
{
66 static struct object_entry
*objects
;
67 static struct object_stat
*obj_stat
;
68 static struct ofs_delta_entry
*ofs_deltas
;
69 static struct ref_delta_entry
*ref_deltas
;
70 static struct thread_local nothread_data
;
71 static int nr_objects
;
72 static int nr_ofs_deltas
;
73 static int nr_ref_deltas
;
74 static int ref_deltas_alloc
;
75 static int nr_resolved_deltas
;
76 static int nr_threads
;
78 static int from_stdin
;
80 static int do_fsck_object
;
81 static struct fsck_options fsck_options
= FSCK_OPTIONS_STRICT
;
83 static int show_resolving_progress
;
85 static int check_self_contained_and_connected
;
87 static struct progress
*progress
;
89 /* We always read in 4kB chunks. */
90 static unsigned char input_buffer
[4096];
91 static unsigned int input_offset
, input_len
;
92 static off_t consumed_bytes
;
93 static off_t max_input_size
;
94 static unsigned deepest_delta
;
95 static git_hash_ctx input_ctx
;
96 static uint32_t input_crc32
;
97 static int input_fd
, output_fd
;
98 static const char *curr_pack
;
100 static struct thread_local
*thread_data
;
101 static int nr_dispatched
;
102 static int threads_active
;
104 static pthread_mutex_t read_mutex
;
105 #define read_lock() lock_mutex(&read_mutex)
106 #define read_unlock() unlock_mutex(&read_mutex)
108 static pthread_mutex_t counter_mutex
;
109 #define counter_lock() lock_mutex(&counter_mutex)
110 #define counter_unlock() unlock_mutex(&counter_mutex)
112 static pthread_mutex_t work_mutex
;
113 #define work_lock() lock_mutex(&work_mutex)
114 #define work_unlock() unlock_mutex(&work_mutex)
116 static pthread_mutex_t deepest_delta_mutex
;
117 #define deepest_delta_lock() lock_mutex(&deepest_delta_mutex)
118 #define deepest_delta_unlock() unlock_mutex(&deepest_delta_mutex)
120 static pthread_mutex_t type_cas_mutex
;
121 #define type_cas_lock() lock_mutex(&type_cas_mutex)
122 #define type_cas_unlock() unlock_mutex(&type_cas_mutex)
124 static pthread_key_t key
;
126 static inline void lock_mutex(pthread_mutex_t
*mutex
)
129 pthread_mutex_lock(mutex
);
132 static inline void unlock_mutex(pthread_mutex_t
*mutex
)
135 pthread_mutex_unlock(mutex
);
139 * Mutex and conditional variable can't be statically-initialized on Windows.
141 static void init_thread(void)
144 init_recursive_mutex(&read_mutex
);
145 pthread_mutex_init(&counter_mutex
, NULL
);
146 pthread_mutex_init(&work_mutex
, NULL
);
147 pthread_mutex_init(&type_cas_mutex
, NULL
);
149 pthread_mutex_init(&deepest_delta_mutex
, NULL
);
150 pthread_key_create(&key
, NULL
);
151 thread_data
= xcalloc(nr_threads
, sizeof(*thread_data
));
152 for (i
= 0; i
< nr_threads
; i
++) {
153 thread_data
[i
].pack_fd
= open(curr_pack
, O_RDONLY
);
154 if (thread_data
[i
].pack_fd
== -1)
155 die_errno(_("unable to open %s"), curr_pack
);
161 static void cleanup_thread(void)
167 pthread_mutex_destroy(&read_mutex
);
168 pthread_mutex_destroy(&counter_mutex
);
169 pthread_mutex_destroy(&work_mutex
);
170 pthread_mutex_destroy(&type_cas_mutex
);
172 pthread_mutex_destroy(&deepest_delta_mutex
);
173 for (i
= 0; i
< nr_threads
; i
++)
174 close(thread_data
[i
].pack_fd
);
175 pthread_key_delete(key
);
179 static int mark_link(struct object
*obj
, int type
, void *data
, struct fsck_options
*options
)
184 if (type
!= OBJ_ANY
&& obj
->type
!= type
)
185 die(_("object type mismatch at %s"), oid_to_hex(&obj
->oid
));
187 obj
->flags
|= FLAG_LINK
;
191 /* The content of each linked object must have been checked
192 or it must be already present in the object database */
193 static unsigned check_object(struct object
*obj
)
198 if (!(obj
->flags
& FLAG_LINK
))
201 if (!(obj
->flags
& FLAG_CHECKED
)) {
203 int type
= oid_object_info(the_repository
, &obj
->oid
, &size
);
205 die(_("did not receive expected object %s"),
206 oid_to_hex(&obj
->oid
));
207 if (type
!= obj
->type
)
208 die(_("object %s: expected type %s, found %s"),
209 oid_to_hex(&obj
->oid
),
210 type_name(obj
->type
), type_name(type
));
211 obj
->flags
|= FLAG_CHECKED
;
218 static unsigned check_objects(void)
220 unsigned i
, max
, foreign_nr
= 0;
222 max
= get_max_object_index();
225 progress
= start_delayed_progress(_("Checking objects"), max
);
227 for (i
= 0; i
< max
; i
++) {
228 foreign_nr
+= check_object(get_indexed_object(i
));
229 display_progress(progress
, i
+ 1);
232 stop_progress(&progress
);
237 /* Discard current buffer used content. */
238 static void flush(void)
242 write_or_die(output_fd
, input_buffer
, input_offset
);
243 the_hash_algo
->update_fn(&input_ctx
, input_buffer
, input_offset
);
244 memmove(input_buffer
, input_buffer
+ input_offset
, input_len
);
250 * Make sure at least "min" bytes are available in the buffer, and
251 * return the pointer to the buffer.
253 static void *fill(int min
)
255 if (min
<= input_len
)
256 return input_buffer
+ input_offset
;
257 if (min
> sizeof(input_buffer
))
258 die(Q_("cannot fill %d byte",
259 "cannot fill %d bytes",
264 ssize_t ret
= xread(input_fd
, input_buffer
+ input_len
,
265 sizeof(input_buffer
) - input_len
);
269 die_errno(_("read error on input"));
273 display_throughput(progress
, consumed_bytes
+ input_len
);
274 } while (input_len
< min
);
278 static void use(int bytes
)
280 if (bytes
> input_len
)
281 die(_("used more bytes than were available"));
282 input_crc32
= crc32(input_crc32
, input_buffer
+ input_offset
, bytes
);
284 input_offset
+= bytes
;
286 /* make sure off_t is sufficiently large not to wrap */
287 if (signed_add_overflows(consumed_bytes
, bytes
))
288 die(_("pack too large for current definition of off_t"));
289 consumed_bytes
+= bytes
;
290 if (max_input_size
&& consumed_bytes
> max_input_size
)
291 die(_("pack exceeds maximum allowed size"));
294 static const char *open_pack_file(const char *pack_name
)
299 struct strbuf tmp_file
= STRBUF_INIT
;
300 output_fd
= odb_mkstemp(&tmp_file
,
301 "pack/tmp_pack_XXXXXX");
302 pack_name
= strbuf_detach(&tmp_file
, NULL
);
304 output_fd
= open(pack_name
, O_CREAT
|O_EXCL
|O_RDWR
, 0600);
306 die_errno(_("unable to create '%s'"), pack_name
);
308 nothread_data
.pack_fd
= output_fd
;
310 input_fd
= open(pack_name
, O_RDONLY
);
312 die_errno(_("cannot open packfile '%s'"), pack_name
);
314 nothread_data
.pack_fd
= input_fd
;
316 the_hash_algo
->init_fn(&input_ctx
);
320 static void parse_pack_header(void)
322 struct pack_header
*hdr
= fill(sizeof(struct pack_header
));
324 /* Header consistency check */
325 if (hdr
->hdr_signature
!= htonl(PACK_SIGNATURE
))
326 die(_("pack signature mismatch"));
327 if (!pack_version_ok(hdr
->hdr_version
))
328 die(_("pack version %"PRIu32
" unsupported"),
329 ntohl(hdr
->hdr_version
));
331 nr_objects
= ntohl(hdr
->hdr_entries
);
332 use(sizeof(struct pack_header
));
335 static NORETURN
void bad_object(off_t offset
, const char *format
,
336 ...) __attribute__((format (printf
, 2, 3)));
338 static NORETURN
void bad_object(off_t offset
, const char *format
, ...)
343 va_start(params
, format
);
344 vsnprintf(buf
, sizeof(buf
), format
, params
);
346 die(_("pack has bad object at offset %"PRIuMAX
": %s"),
347 (uintmax_t)offset
, buf
);
350 static inline struct thread_local
*get_thread_data(void)
354 return pthread_getspecific(key
);
355 assert(!threads_active
&&
356 "This should only be reached when all threads are gone");
358 return ¬hread_data
;
361 static void set_thread_data(struct thread_local
*data
)
364 pthread_setspecific(key
, data
);
367 static struct base_data
*alloc_base_data(void)
369 struct base_data
*base
= xcalloc(1, sizeof(struct base_data
));
375 static void free_base_data(struct base_data
*c
)
378 FREE_AND_NULL(c
->data
);
379 get_thread_data()->base_cache_used
-= c
->size
;
383 static void prune_base_data(struct base_data
*retain
)
386 struct thread_local
*data
= get_thread_data();
387 for (b
= data
->base_cache
;
388 data
->base_cache_used
> delta_base_cache_limit
&& b
;
390 if (b
->data
&& b
!= retain
)
395 static void link_base_data(struct base_data
*base
, struct base_data
*c
)
400 get_thread_data()->base_cache
= c
;
405 get_thread_data()->base_cache_used
+= c
->size
;
409 static void unlink_base_data(struct base_data
*c
)
411 struct base_data
*base
= c
->base
;
415 get_thread_data()->base_cache
= NULL
;
419 static int is_delta_type(enum object_type type
)
421 return (type
== OBJ_REF_DELTA
|| type
== OBJ_OFS_DELTA
);
424 static void *unpack_entry_data(off_t offset
, unsigned long size
,
425 enum object_type type
, struct object_id
*oid
)
427 static char fixed_buf
[8192];
435 if (!is_delta_type(type
)) {
436 hdrlen
= xsnprintf(hdr
, sizeof(hdr
), "%s %"PRIuMAX
,
437 type_name(type
),(uintmax_t)size
) + 1;
438 the_hash_algo
->init_fn(&c
);
439 the_hash_algo
->update_fn(&c
, hdr
, hdrlen
);
442 if (type
== OBJ_BLOB
&& size
> big_file_threshold
)
445 buf
= xmallocz(size
);
447 memset(&stream
, 0, sizeof(stream
));
448 git_inflate_init(&stream
);
449 stream
.next_out
= buf
;
450 stream
.avail_out
= buf
== fixed_buf
? sizeof(fixed_buf
) : size
;
453 unsigned char *last_out
= stream
.next_out
;
454 stream
.next_in
= fill(1);
455 stream
.avail_in
= input_len
;
456 status
= git_inflate(&stream
, 0);
457 use(input_len
- stream
.avail_in
);
459 the_hash_algo
->update_fn(&c
, last_out
, stream
.next_out
- last_out
);
460 if (buf
== fixed_buf
) {
461 stream
.next_out
= buf
;
462 stream
.avail_out
= sizeof(fixed_buf
);
464 } while (status
== Z_OK
);
465 if (stream
.total_out
!= size
|| status
!= Z_STREAM_END
)
466 bad_object(offset
, _("inflate returned %d"), status
);
467 git_inflate_end(&stream
);
469 the_hash_algo
->final_fn(oid
->hash
, &c
);
470 return buf
== fixed_buf
? NULL
: buf
;
473 static void *unpack_raw_entry(struct object_entry
*obj
,
475 struct object_id
*ref_oid
,
476 struct object_id
*oid
)
479 unsigned long size
, c
;
484 obj
->idx
.offset
= consumed_bytes
;
485 input_crc32
= crc32(0, NULL
, 0);
490 obj
->type
= (c
>> 4) & 7;
497 size
+= (c
& 0x7f) << shift
;
504 hashcpy(ref_oid
->hash
, fill(the_hash_algo
->rawsz
));
505 use(the_hash_algo
->rawsz
);
511 base_offset
= c
& 127;
514 if (!base_offset
|| MSB(base_offset
, 7))
515 bad_object(obj
->idx
.offset
, _("offset value overflow for delta base object"));
519 base_offset
= (base_offset
<< 7) + (c
& 127);
521 *ofs_offset
= obj
->idx
.offset
- base_offset
;
522 if (*ofs_offset
<= 0 || *ofs_offset
>= obj
->idx
.offset
)
523 bad_object(obj
->idx
.offset
, _("delta base offset is out of bound"));
531 bad_object(obj
->idx
.offset
, _("unknown object type %d"), obj
->type
);
533 obj
->hdr_size
= consumed_bytes
- obj
->idx
.offset
;
535 data
= unpack_entry_data(obj
->idx
.offset
, obj
->size
, obj
->type
, oid
);
536 obj
->idx
.crc32
= input_crc32
;
540 static void *unpack_data(struct object_entry
*obj
,
541 int (*consume
)(const unsigned char *, unsigned long, void *),
544 off_t from
= obj
[0].idx
.offset
+ obj
[0].hdr_size
;
545 off_t len
= obj
[1].idx
.offset
- from
;
546 unsigned char *data
, *inbuf
;
550 data
= xmallocz(consume
? 64*1024 : obj
->size
);
551 inbuf
= xmalloc((len
< 64*1024) ? (int)len
: 64*1024);
553 memset(&stream
, 0, sizeof(stream
));
554 git_inflate_init(&stream
);
555 stream
.next_out
= data
;
556 stream
.avail_out
= consume
? 64*1024 : obj
->size
;
559 ssize_t n
= (len
< 64*1024) ? (ssize_t
)len
: 64*1024;
560 n
= xpread(get_thread_data()->pack_fd
, inbuf
, n
, from
);
562 die_errno(_("cannot pread pack file"));
564 die(Q_("premature end of pack file, %"PRIuMAX
" byte missing",
565 "premature end of pack file, %"PRIuMAX
" bytes missing",
570 stream
.next_in
= inbuf
;
573 status
= git_inflate(&stream
, 0);
576 status
= git_inflate(&stream
, 0);
577 if (consume(data
, stream
.next_out
- data
, cb_data
)) {
582 stream
.next_out
= data
;
583 stream
.avail_out
= 64*1024;
584 } while (status
== Z_OK
&& stream
.avail_in
);
586 } while (len
&& status
== Z_OK
&& !stream
.avail_in
);
588 /* This has been inflated OK when first encountered, so... */
589 if (status
!= Z_STREAM_END
|| stream
.total_out
!= obj
->size
)
590 die(_("serious inflate inconsistency"));
592 git_inflate_end(&stream
);
600 static void *get_data_from_pack(struct object_entry
*obj
)
602 return unpack_data(obj
, NULL
, NULL
);
605 static int compare_ofs_delta_bases(off_t offset1
, off_t offset2
,
606 enum object_type type1
,
607 enum object_type type2
)
609 int cmp
= type1
- type2
;
612 return offset1
< offset2
? -1 :
613 offset1
> offset2
? 1 :
617 static int find_ofs_delta(const off_t offset
, enum object_type type
)
619 int first
= 0, last
= nr_ofs_deltas
;
621 while (first
< last
) {
622 int next
= first
+ (last
- first
) / 2;
623 struct ofs_delta_entry
*delta
= &ofs_deltas
[next
];
626 cmp
= compare_ofs_delta_bases(offset
, delta
->offset
,
627 type
, objects
[delta
->obj_no
].type
);
639 static void find_ofs_delta_children(off_t offset
,
640 int *first_index
, int *last_index
,
641 enum object_type type
)
643 int first
= find_ofs_delta(offset
, type
);
645 int end
= nr_ofs_deltas
- 1;
652 while (first
> 0 && ofs_deltas
[first
- 1].offset
== offset
)
654 while (last
< end
&& ofs_deltas
[last
+ 1].offset
== offset
)
656 *first_index
= first
;
660 static int compare_ref_delta_bases(const struct object_id
*oid1
,
661 const struct object_id
*oid2
,
662 enum object_type type1
,
663 enum object_type type2
)
665 int cmp
= type1
- type2
;
668 return oidcmp(oid1
, oid2
);
671 static int find_ref_delta(const struct object_id
*oid
, enum object_type type
)
673 int first
= 0, last
= nr_ref_deltas
;
675 while (first
< last
) {
676 int next
= first
+ (last
- first
) / 2;
677 struct ref_delta_entry
*delta
= &ref_deltas
[next
];
680 cmp
= compare_ref_delta_bases(oid
, &delta
->oid
,
681 type
, objects
[delta
->obj_no
].type
);
693 static void find_ref_delta_children(const struct object_id
*oid
,
694 int *first_index
, int *last_index
,
695 enum object_type type
)
697 int first
= find_ref_delta(oid
, type
);
699 int end
= nr_ref_deltas
- 1;
706 while (first
> 0 && oideq(&ref_deltas
[first
- 1].oid
, oid
))
708 while (last
< end
&& oideq(&ref_deltas
[last
+ 1].oid
, oid
))
710 *first_index
= first
;
714 struct compare_data
{
715 struct object_entry
*entry
;
716 struct git_istream
*st
;
718 unsigned long buf_size
;
721 static int compare_objects(const unsigned char *buf
, unsigned long size
,
724 struct compare_data
*data
= cb_data
;
726 if (data
->buf_size
< size
) {
728 data
->buf
= xmalloc(size
);
729 data
->buf_size
= size
;
733 ssize_t len
= read_istream(data
->st
, data
->buf
, size
);
735 die(_("SHA1 COLLISION FOUND WITH %s !"),
736 oid_to_hex(&data
->entry
->idx
.oid
));
738 die(_("unable to read %s"),
739 oid_to_hex(&data
->entry
->idx
.oid
));
740 if (memcmp(buf
, data
->buf
, len
))
741 die(_("SHA1 COLLISION FOUND WITH %s !"),
742 oid_to_hex(&data
->entry
->idx
.oid
));
749 static int check_collison(struct object_entry
*entry
)
751 struct compare_data data
;
752 enum object_type type
;
755 if (entry
->size
<= big_file_threshold
|| entry
->type
!= OBJ_BLOB
)
758 memset(&data
, 0, sizeof(data
));
760 data
.st
= open_istream(&entry
->idx
.oid
, &type
, &size
, NULL
);
763 if (size
!= entry
->size
|| type
!= entry
->type
)
764 die(_("SHA1 COLLISION FOUND WITH %s !"),
765 oid_to_hex(&entry
->idx
.oid
));
766 unpack_data(entry
, compare_objects
, &data
);
767 close_istream(data
.st
);
772 static void sha1_object(const void *data
, struct object_entry
*obj_entry
,
773 unsigned long size
, enum object_type type
,
774 const struct object_id
*oid
)
776 void *new_data
= NULL
;
777 int collision_test_needed
= 0;
779 assert(data
|| obj_entry
);
781 if (startup_info
->have_repository
) {
783 collision_test_needed
=
784 has_object_file_with_flags(oid
, OBJECT_INFO_QUICK
);
788 if (collision_test_needed
&& !data
) {
790 if (!check_collison(obj_entry
))
791 collision_test_needed
= 0;
794 if (collision_test_needed
) {
796 enum object_type has_type
;
797 unsigned long has_size
;
799 has_type
= oid_object_info(the_repository
, oid
, &has_size
);
801 die(_("cannot read existing object info %s"), oid_to_hex(oid
));
802 if (has_type
!= type
|| has_size
!= size
)
803 die(_("SHA1 COLLISION FOUND WITH %s !"), oid_to_hex(oid
));
804 has_data
= read_object_file(oid
, &has_type
, &has_size
);
807 data
= new_data
= get_data_from_pack(obj_entry
);
809 die(_("cannot read existing object %s"), oid_to_hex(oid
));
810 if (size
!= has_size
|| type
!= has_type
||
811 memcmp(data
, has_data
, size
) != 0)
812 die(_("SHA1 COLLISION FOUND WITH %s !"), oid_to_hex(oid
));
816 if (strict
|| do_fsck_object
) {
818 if (type
== OBJ_BLOB
) {
819 struct blob
*blob
= lookup_blob(the_repository
, oid
);
821 blob
->object
.flags
|= FLAG_CHECKED
;
823 die(_("invalid blob object %s"), oid_to_hex(oid
));
824 if (do_fsck_object
&&
825 fsck_object(&blob
->object
, (void *)data
, size
, &fsck_options
))
826 die(_("fsck error in packed object"));
830 void *buf
= (void *) data
;
832 assert(data
&& "data can only be NULL for large _blobs_");
835 * we do not need to free the memory here, as the
836 * buf is deleted by the caller.
838 obj
= parse_object_buffer(the_repository
, oid
, type
,
842 die(_("invalid %s"), type_name(type
));
843 if (do_fsck_object
&&
844 fsck_object(obj
, buf
, size
, &fsck_options
))
845 die(_("fsck error in packed object"));
846 if (strict
&& fsck_walk(obj
, NULL
, &fsck_options
))
847 die(_("Not all child objects of %s are reachable"), oid_to_hex(&obj
->oid
));
849 if (obj
->type
== OBJ_TREE
) {
850 struct tree
*item
= (struct tree
*) obj
;
854 if (obj
->type
== OBJ_COMMIT
) {
855 struct commit
*commit
= (struct commit
*) obj
;
856 if (detach_commit_buffer(commit
, NULL
) != data
)
857 BUG("parse_object_buffer transmogrified our buffer");
859 obj
->flags
|= FLAG_CHECKED
;
868 * This function is part of find_unresolved_deltas(). There are two
869 * walkers going in the opposite ways.
871 * The first one in find_unresolved_deltas() traverses down from
872 * parent node to children, deflating nodes along the way. However,
873 * memory for deflated nodes is limited by delta_base_cache_limit, so
874 * at some point parent node's deflated content may be freed.
876 * The second walker is this function, which goes from current node up
877 * to top parent if necessary to deflate the node. In normal
878 * situation, its parent node would be already deflated, so it just
879 * needs to apply delta.
881 * In the worst case scenario, parent node is no longer deflated because
882 * we're running out of delta_base_cache_limit; we need to re-deflate
883 * parents, possibly up to the top base.
885 * All deflated objects here are subject to be freed if we exceed
886 * delta_base_cache_limit, just like in find_unresolved_deltas(), we
887 * just need to make sure the last node is not freed.
889 static void *get_base_data(struct base_data
*c
)
892 struct object_entry
*obj
= c
->obj
;
893 struct base_data
**delta
= NULL
;
894 int delta_nr
= 0, delta_alloc
= 0;
896 while (is_delta_type(c
->obj
->type
) && !c
->data
) {
897 ALLOC_GROW(delta
, delta_nr
+ 1, delta_alloc
);
898 delta
[delta_nr
++] = c
;
902 c
->data
= get_data_from_pack(obj
);
904 get_thread_data()->base_cache_used
+= c
->size
;
907 for (; delta_nr
> 0; delta_nr
--) {
909 c
= delta
[delta_nr
- 1];
911 base
= get_base_data(c
->base
);
912 raw
= get_data_from_pack(obj
);
913 c
->data
= patch_delta(
919 bad_object(obj
->idx
.offset
, _("failed to apply delta"));
920 get_thread_data()->base_cache_used
+= c
->size
;
928 static void resolve_delta(struct object_entry
*delta_obj
,
929 struct base_data
*base
, struct base_data
*result
)
931 void *base_data
, *delta_data
;
934 int i
= delta_obj
- objects
;
935 int j
= base
->obj
- objects
;
936 obj_stat
[i
].delta_depth
= obj_stat
[j
].delta_depth
+ 1;
937 deepest_delta_lock();
938 if (deepest_delta
< obj_stat
[i
].delta_depth
)
939 deepest_delta
= obj_stat
[i
].delta_depth
;
940 deepest_delta_unlock();
941 obj_stat
[i
].base_object_no
= j
;
943 delta_data
= get_data_from_pack(delta_obj
);
944 base_data
= get_base_data(base
);
945 result
->obj
= delta_obj
;
946 result
->data
= patch_delta(base_data
, base
->size
,
947 delta_data
, delta_obj
->size
, &result
->size
);
950 bad_object(delta_obj
->idx
.offset
, _("failed to apply delta"));
951 hash_object_file(result
->data
, result
->size
,
952 type_name(delta_obj
->real_type
), &delta_obj
->idx
.oid
);
953 sha1_object(result
->data
, NULL
, result
->size
, delta_obj
->real_type
,
954 &delta_obj
->idx
.oid
);
956 nr_resolved_deltas
++;
961 * Standard boolean compare-and-swap: atomically check whether "*type" is
962 * "want"; if so, swap in "set" and return true. Otherwise, leave it untouched
965 static int compare_and_swap_type(signed char *type
,
966 enum object_type want
,
967 enum object_type set
)
969 enum object_type old
;
980 static struct base_data
*find_unresolved_deltas_1(struct base_data
*base
,
981 struct base_data
*prev_base
)
983 if (base
->ref_last
== -1 && base
->ofs_last
== -1) {
984 find_ref_delta_children(&base
->obj
->idx
.oid
,
985 &base
->ref_first
, &base
->ref_last
,
988 find_ofs_delta_children(base
->obj
->idx
.offset
,
989 &base
->ofs_first
, &base
->ofs_last
,
992 if (base
->ref_last
== -1 && base
->ofs_last
== -1) {
997 link_base_data(prev_base
, base
);
1000 if (base
->ref_first
<= base
->ref_last
) {
1001 struct object_entry
*child
= objects
+ ref_deltas
[base
->ref_first
].obj_no
;
1002 struct base_data
*result
= alloc_base_data();
1004 if (!compare_and_swap_type(&child
->real_type
, OBJ_REF_DELTA
,
1005 base
->obj
->real_type
))
1006 BUG("child->real_type != OBJ_REF_DELTA");
1008 resolve_delta(child
, base
, result
);
1009 if (base
->ref_first
== base
->ref_last
&& base
->ofs_last
== -1)
1010 free_base_data(base
);
1016 if (base
->ofs_first
<= base
->ofs_last
) {
1017 struct object_entry
*child
= objects
+ ofs_deltas
[base
->ofs_first
].obj_no
;
1018 struct base_data
*result
= alloc_base_data();
1020 assert(child
->real_type
== OBJ_OFS_DELTA
);
1021 child
->real_type
= base
->obj
->real_type
;
1022 resolve_delta(child
, base
, result
);
1023 if (base
->ofs_first
== base
->ofs_last
)
1024 free_base_data(base
);
1030 unlink_base_data(base
);
1034 static void find_unresolved_deltas(struct base_data
*base
)
1036 struct base_data
*new_base
, *prev_base
= NULL
;
1038 new_base
= find_unresolved_deltas_1(base
, prev_base
);
1048 prev_base
= base
->base
;
1053 static int compare_ofs_delta_entry(const void *a
, const void *b
)
1055 const struct ofs_delta_entry
*delta_a
= a
;
1056 const struct ofs_delta_entry
*delta_b
= b
;
1058 return delta_a
->offset
< delta_b
->offset
? -1 :
1059 delta_a
->offset
> delta_b
->offset
? 1 :
1063 static int compare_ref_delta_entry(const void *a
, const void *b
)
1065 const struct ref_delta_entry
*delta_a
= a
;
1066 const struct ref_delta_entry
*delta_b
= b
;
1068 return oidcmp(&delta_a
->oid
, &delta_b
->oid
);
1071 static void resolve_base(struct object_entry
*obj
)
1073 struct base_data
*base_obj
= alloc_base_data();
1074 base_obj
->obj
= obj
;
1075 base_obj
->data
= NULL
;
1076 find_unresolved_deltas(base_obj
);
1079 static void *threaded_second_pass(void *data
)
1081 set_thread_data(data
);
1085 display_progress(progress
, nr_resolved_deltas
);
1088 while (nr_dispatched
< nr_objects
&&
1089 is_delta_type(objects
[nr_dispatched
].type
))
1091 if (nr_dispatched
>= nr_objects
) {
1095 i
= nr_dispatched
++;
1098 resolve_base(&objects
[i
]);
1105 * - find locations of all objects;
1106 * - calculate SHA1 of all non-delta objects;
1107 * - remember base (SHA1 or offset) for all deltas.
1109 static void parse_pack_objects(unsigned char *hash
)
1111 int i
, nr_delays
= 0;
1112 struct ofs_delta_entry
*ofs_delta
= ofs_deltas
;
1113 struct object_id ref_delta_oid
;
1117 progress
= start_progress(
1118 from_stdin
? _("Receiving objects") : _("Indexing objects"),
1120 for (i
= 0; i
< nr_objects
; i
++) {
1121 struct object_entry
*obj
= &objects
[i
];
1122 void *data
= unpack_raw_entry(obj
, &ofs_delta
->offset
,
1125 obj
->real_type
= obj
->type
;
1126 if (obj
->type
== OBJ_OFS_DELTA
) {
1128 ofs_delta
->obj_no
= i
;
1130 } else if (obj
->type
== OBJ_REF_DELTA
) {
1131 ALLOC_GROW(ref_deltas
, nr_ref_deltas
+ 1, ref_deltas_alloc
);
1132 oidcpy(&ref_deltas
[nr_ref_deltas
].oid
, &ref_delta_oid
);
1133 ref_deltas
[nr_ref_deltas
].obj_no
= i
;
1136 /* large blobs, check later */
1137 obj
->real_type
= OBJ_BAD
;
1140 sha1_object(data
, NULL
, obj
->size
, obj
->type
,
1143 display_progress(progress
, i
+1);
1145 objects
[i
].idx
.offset
= consumed_bytes
;
1146 stop_progress(&progress
);
1148 /* Check pack integrity */
1150 the_hash_algo
->final_fn(hash
, &input_ctx
);
1151 if (!hasheq(fill(the_hash_algo
->rawsz
), hash
))
1152 die(_("pack is corrupted (SHA1 mismatch)"));
1153 use(the_hash_algo
->rawsz
);
1155 /* If input_fd is a file, we should have reached its end now. */
1156 if (fstat(input_fd
, &st
))
1157 die_errno(_("cannot fstat packfile"));
1158 if (S_ISREG(st
.st_mode
) &&
1159 lseek(input_fd
, 0, SEEK_CUR
) - input_len
!= st
.st_size
)
1160 die(_("pack has junk at the end"));
1162 for (i
= 0; i
< nr_objects
; i
++) {
1163 struct object_entry
*obj
= &objects
[i
];
1164 if (obj
->real_type
!= OBJ_BAD
)
1166 obj
->real_type
= obj
->type
;
1167 sha1_object(NULL
, obj
, obj
->size
, obj
->type
,
1172 die(_("confusion beyond insanity in parse_pack_objects()"));
1177 * - for all non-delta objects, look if it is used as a base for
1179 * - if used as a base, uncompress the object and apply all deltas,
1180 * recursively checking if the resulting object is used as a base
1181 * for some more deltas.
1183 static void resolve_deltas(void)
1187 if (!nr_ofs_deltas
&& !nr_ref_deltas
)
1190 /* Sort deltas by base SHA1/offset for fast searching */
1191 QSORT(ofs_deltas
, nr_ofs_deltas
, compare_ofs_delta_entry
);
1192 QSORT(ref_deltas
, nr_ref_deltas
, compare_ref_delta_entry
);
1194 if (verbose
|| show_resolving_progress
)
1195 progress
= start_progress(_("Resolving deltas"),
1196 nr_ref_deltas
+ nr_ofs_deltas
);
1199 if (nr_threads
> 1 || getenv("GIT_FORCE_THREADS")) {
1201 for (i
= 0; i
< nr_threads
; i
++) {
1202 int ret
= pthread_create(&thread_data
[i
].thread
, NULL
,
1203 threaded_second_pass
, thread_data
+ i
);
1205 die(_("unable to create thread: %s"),
1208 for (i
= 0; i
< nr_threads
; i
++)
1209 pthread_join(thread_data
[i
].thread
, NULL
);
1214 for (i
= 0; i
< nr_objects
; i
++) {
1215 struct object_entry
*obj
= &objects
[i
];
1217 if (is_delta_type(obj
->type
))
1220 display_progress(progress
, nr_resolved_deltas
);
1226 * - append objects to convert thin pack to full pack if required
1227 * - write the final pack hash
1229 static void fix_unresolved_deltas(struct hashfile
*f
);
1230 static void conclude_pack(int fix_thin_pack
, const char *curr_pack
, unsigned char *pack_hash
)
1232 if (nr_ref_deltas
+ nr_ofs_deltas
== nr_resolved_deltas
) {
1233 stop_progress(&progress
);
1234 /* Flush remaining pack final hash. */
1239 if (fix_thin_pack
) {
1241 unsigned char read_hash
[GIT_MAX_RAWSZ
], tail_hash
[GIT_MAX_RAWSZ
];
1242 struct strbuf msg
= STRBUF_INIT
;
1243 int nr_unresolved
= nr_ofs_deltas
+ nr_ref_deltas
- nr_resolved_deltas
;
1244 int nr_objects_initial
= nr_objects
;
1245 if (nr_unresolved
<= 0)
1246 die(_("confusion beyond insanity"));
1247 REALLOC_ARRAY(objects
, nr_objects
+ nr_unresolved
+ 1);
1248 memset(objects
+ nr_objects
+ 1, 0,
1249 nr_unresolved
* sizeof(*objects
));
1250 f
= hashfd(output_fd
, curr_pack
);
1251 fix_unresolved_deltas(f
);
1252 strbuf_addf(&msg
, Q_("completed with %d local object",
1253 "completed with %d local objects",
1254 nr_objects
- nr_objects_initial
),
1255 nr_objects
- nr_objects_initial
);
1256 stop_progress_msg(&progress
, msg
.buf
);
1257 strbuf_release(&msg
);
1258 finalize_hashfile(f
, tail_hash
, 0);
1259 hashcpy(read_hash
, pack_hash
);
1260 fixup_pack_header_footer(output_fd
, pack_hash
,
1261 curr_pack
, nr_objects
,
1262 read_hash
, consumed_bytes
-the_hash_algo
->rawsz
);
1263 if (!hasheq(read_hash
, tail_hash
))
1264 die(_("Unexpected tail checksum for %s "
1265 "(disk corruption?)"), curr_pack
);
1267 if (nr_ofs_deltas
+ nr_ref_deltas
!= nr_resolved_deltas
)
1268 die(Q_("pack has %d unresolved delta",
1269 "pack has %d unresolved deltas",
1270 nr_ofs_deltas
+ nr_ref_deltas
- nr_resolved_deltas
),
1271 nr_ofs_deltas
+ nr_ref_deltas
- nr_resolved_deltas
);
1274 static int write_compressed(struct hashfile
*f
, void *in
, unsigned int size
)
1278 unsigned char outbuf
[4096];
1280 git_deflate_init(&stream
, zlib_compression_level
);
1281 stream
.next_in
= in
;
1282 stream
.avail_in
= size
;
1285 stream
.next_out
= outbuf
;
1286 stream
.avail_out
= sizeof(outbuf
);
1287 status
= git_deflate(&stream
, Z_FINISH
);
1288 hashwrite(f
, outbuf
, sizeof(outbuf
) - stream
.avail_out
);
1289 } while (status
== Z_OK
);
1291 if (status
!= Z_STREAM_END
)
1292 die(_("unable to deflate appended object (%d)"), status
);
1293 size
= stream
.total_out
;
1294 git_deflate_end(&stream
);
1298 static struct object_entry
*append_obj_to_pack(struct hashfile
*f
,
1299 const unsigned char *sha1
, void *buf
,
1300 unsigned long size
, enum object_type type
)
1302 struct object_entry
*obj
= &objects
[nr_objects
++];
1303 unsigned char header
[10];
1304 unsigned long s
= size
;
1306 unsigned char c
= (type
<< 4) | (s
& 15);
1309 header
[n
++] = c
| 0x80;
1315 hashwrite(f
, header
, n
);
1317 obj
[0].hdr_size
= n
;
1319 obj
[0].real_type
= type
;
1320 obj
[1].idx
.offset
= obj
[0].idx
.offset
+ n
;
1321 obj
[1].idx
.offset
+= write_compressed(f
, buf
, size
);
1322 obj
[0].idx
.crc32
= crc32_end(f
);
1324 hashcpy(obj
->idx
.oid
.hash
, sha1
);
1328 static int delta_pos_compare(const void *_a
, const void *_b
)
1330 struct ref_delta_entry
*a
= *(struct ref_delta_entry
**)_a
;
1331 struct ref_delta_entry
*b
= *(struct ref_delta_entry
**)_b
;
1332 return a
->obj_no
- b
->obj_no
;
1335 static void fix_unresolved_deltas(struct hashfile
*f
)
1337 struct ref_delta_entry
**sorted_by_pos
;
1341 * Since many unresolved deltas may well be themselves base objects
1342 * for more unresolved deltas, we really want to include the
1343 * smallest number of base objects that would cover as much delta
1344 * as possible by picking the
1345 * trunc deltas first, allowing for other deltas to resolve without
1346 * additional base objects. Since most base objects are to be found
1347 * before deltas depending on them, a good heuristic is to start
1348 * resolving deltas in the same order as their position in the pack.
1350 ALLOC_ARRAY(sorted_by_pos
, nr_ref_deltas
);
1351 for (i
= 0; i
< nr_ref_deltas
; i
++)
1352 sorted_by_pos
[i
] = &ref_deltas
[i
];
1353 QSORT(sorted_by_pos
, nr_ref_deltas
, delta_pos_compare
);
1355 if (has_promisor_remote()) {
1357 * Prefetch the delta bases.
1359 struct oid_array to_fetch
= OID_ARRAY_INIT
;
1360 for (i
= 0; i
< nr_ref_deltas
; i
++) {
1361 struct ref_delta_entry
*d
= sorted_by_pos
[i
];
1362 if (!oid_object_info_extended(the_repository
, &d
->oid
,
1364 OBJECT_INFO_FOR_PREFETCH
))
1366 oid_array_append(&to_fetch
, &d
->oid
);
1369 promisor_remote_get_direct(the_repository
,
1370 to_fetch
.oid
, to_fetch
.nr
);
1371 oid_array_clear(&to_fetch
);
1374 for (i
= 0; i
< nr_ref_deltas
; i
++) {
1375 struct ref_delta_entry
*d
= sorted_by_pos
[i
];
1376 enum object_type type
;
1377 struct base_data
*base_obj
= alloc_base_data();
1379 if (objects
[d
->obj_no
].real_type
!= OBJ_REF_DELTA
)
1381 base_obj
->data
= read_object_file(&d
->oid
, &type
,
1383 if (!base_obj
->data
)
1386 if (check_object_signature(&d
->oid
, base_obj
->data
,
1387 base_obj
->size
, type_name(type
)))
1388 die(_("local object %s is corrupt"), oid_to_hex(&d
->oid
));
1389 base_obj
->obj
= append_obj_to_pack(f
, d
->oid
.hash
,
1390 base_obj
->data
, base_obj
->size
, type
);
1391 find_unresolved_deltas(base_obj
);
1392 display_progress(progress
, nr_resolved_deltas
);
1394 free(sorted_by_pos
);
1397 static const char *derive_filename(const char *pack_name
, const char *suffix
,
1401 if (!strip_suffix(pack_name
, ".pack", &len
))
1402 die(_("packfile name '%s' does not end with '.pack'"),
1404 strbuf_add(buf
, pack_name
, len
);
1405 strbuf_addch(buf
, '.');
1406 strbuf_addstr(buf
, suffix
);
1410 static void write_special_file(const char *suffix
, const char *msg
,
1411 const char *pack_name
, const unsigned char *hash
,
1412 const char **report
)
1414 struct strbuf name_buf
= STRBUF_INIT
;
1415 const char *filename
;
1417 int msg_len
= strlen(msg
);
1420 filename
= derive_filename(pack_name
, suffix
, &name_buf
);
1422 filename
= odb_pack_name(&name_buf
, hash
, suffix
);
1424 fd
= odb_pack_keep(filename
);
1426 if (errno
!= EEXIST
)
1427 die_errno(_("cannot write %s file '%s'"),
1431 write_or_die(fd
, msg
, msg_len
);
1432 write_or_die(fd
, "\n", 1);
1435 die_errno(_("cannot close written %s file '%s'"),
1440 strbuf_release(&name_buf
);
1443 static void final(const char *final_pack_name
, const char *curr_pack_name
,
1444 const char *final_index_name
, const char *curr_index_name
,
1445 const char *keep_msg
, const char *promisor_msg
,
1446 unsigned char *hash
)
1448 const char *report
= "pack";
1449 struct strbuf pack_name
= STRBUF_INIT
;
1450 struct strbuf index_name
= STRBUF_INIT
;
1456 fsync_or_die(output_fd
, curr_pack_name
);
1457 err
= close(output_fd
);
1459 die_errno(_("error while closing pack file"));
1463 write_special_file("keep", keep_msg
, final_pack_name
, hash
,
1466 write_special_file("promisor", promisor_msg
, final_pack_name
,
1469 if (final_pack_name
!= curr_pack_name
) {
1470 if (!final_pack_name
)
1471 final_pack_name
= odb_pack_name(&pack_name
, hash
, "pack");
1472 if (finalize_object_file(curr_pack_name
, final_pack_name
))
1473 die(_("cannot store pack file"));
1474 } else if (from_stdin
)
1475 chmod(final_pack_name
, 0444);
1477 if (final_index_name
!= curr_index_name
) {
1478 if (!final_index_name
)
1479 final_index_name
= odb_pack_name(&index_name
, hash
, "idx");
1480 if (finalize_object_file(curr_index_name
, final_index_name
))
1481 die(_("cannot store index file"));
1483 chmod(final_index_name
, 0444);
1485 if (do_fsck_object
) {
1486 struct packed_git
*p
;
1487 p
= add_packed_git(final_index_name
, strlen(final_index_name
), 0);
1489 install_packed_git(the_repository
, p
);
1493 printf("%s\n", hash_to_hex(hash
));
1495 struct strbuf buf
= STRBUF_INIT
;
1497 strbuf_addf(&buf
, "%s\t%s\n", report
, hash_to_hex(hash
));
1498 write_or_die(1, buf
.buf
, buf
.len
);
1499 strbuf_release(&buf
);
1502 * Let's just mimic git-unpack-objects here and write
1503 * the last part of the input buffer to stdout.
1506 err
= xwrite(1, input_buffer
+ input_offset
, input_len
);
1510 input_offset
+= err
;
1514 strbuf_release(&index_name
);
1515 strbuf_release(&pack_name
);
1518 static int git_index_pack_config(const char *k
, const char *v
, void *cb
)
1520 struct pack_idx_option
*opts
= cb
;
1522 if (!strcmp(k
, "pack.indexversion")) {
1523 opts
->version
= git_config_int(k
, v
);
1524 if (opts
->version
> 2)
1525 die(_("bad pack.indexversion=%"PRIu32
), opts
->version
);
1528 if (!strcmp(k
, "pack.threads")) {
1529 nr_threads
= git_config_int(k
, v
);
1531 die(_("invalid number of threads specified (%d)"),
1533 if (!HAVE_THREADS
&& nr_threads
!= 1) {
1534 warning(_("no threads support, ignoring %s"), k
);
1539 return git_default_config(k
, v
, cb
);
/*
 * qsort()-style comparator for uint32_t values, ascending.
 * Returns -1, 0 or 1.  The values are compared rather than subtracted
 * because an unsigned difference cannot be represented as a signed
 * result in general.
 */
static int cmp_uint32(const void *a_, const void *b_)
{
	const uint32_t a = *(const uint32_t *)a_;
	const uint32_t b = *(const uint32_t *)b_;

	if (a < b)
		return -1;
	return a != b;
}
1550 static void read_v2_anomalous_offsets(struct packed_git
*p
,
1551 struct pack_idx_option
*opts
)
1553 const uint32_t *idx1
, *idx2
;
1555 const uint32_t hashwords
= the_hash_algo
->rawsz
/ sizeof(uint32_t);
1557 /* The address of the 4-byte offset table */
1558 idx1
= (((const uint32_t *)p
->index_data
)
1559 + 2 /* 8-byte header */
1561 + hashwords
* p
->num_objects
/* object ID table */
1562 + p
->num_objects
/* CRC32 table */
1565 /* The address of the 8-byte offset table */
1566 idx2
= idx1
+ p
->num_objects
;
1568 for (i
= 0; i
< p
->num_objects
; i
++) {
1569 uint32_t off
= ntohl(idx1
[i
]);
1570 if (!(off
& 0x80000000))
1572 off
= off
& 0x7fffffff;
1573 check_pack_index_ptr(p
, &idx2
[off
* 2]);
1577 * The real offset is ntohl(idx2[off * 2]) in high 4
1578 * octets, and ntohl(idx2[off * 2 + 1]) in low 4
1579 * octets. But idx2[off * 2] is Zero!!!
1581 ALLOC_GROW(opts
->anomaly
, opts
->anomaly_nr
+ 1, opts
->anomaly_alloc
);
1582 opts
->anomaly
[opts
->anomaly_nr
++] = ntohl(idx2
[off
* 2 + 1]);
1585 QSORT(opts
->anomaly
, opts
->anomaly_nr
, cmp_uint32
);
1588 static void read_idx_option(struct pack_idx_option
*opts
, const char *pack_name
)
1590 struct packed_git
*p
= add_packed_git(pack_name
, strlen(pack_name
), 1);
1593 die(_("Cannot open existing pack file '%s'"), pack_name
);
1594 if (open_pack_index(p
))
1595 die(_("Cannot open existing pack idx file for '%s'"), pack_name
);
1597 /* Read the attributes from the existing idx file */
1598 opts
->version
= p
->index_version
;
1600 if (opts
->version
== 2)
1601 read_v2_anomalous_offsets(p
, opts
);
1604 * Get rid of the idx file as we do not need it anymore.
1605 * NEEDSWORK: extract this bit from free_pack_by_name() in
1606 * sha1-file.c, perhaps? It shouldn't matter very much as we
1607 * know we haven't installed this pack (hence we never have
1608 * read anything from it).
1610 close_pack_index(p
);
1614 static void show_pack_info(int stat_only
)
1616 int i
, baseobjects
= nr_objects
- nr_ref_deltas
- nr_ofs_deltas
;
1617 unsigned long *chain_histogram
= NULL
;
1620 chain_histogram
= xcalloc(deepest_delta
, sizeof(unsigned long));
1622 for (i
= 0; i
< nr_objects
; i
++) {
1623 struct object_entry
*obj
= &objects
[i
];
1625 if (is_delta_type(obj
->type
))
1626 chain_histogram
[obj_stat
[i
].delta_depth
- 1]++;
1629 printf("%s %-6s %"PRIuMAX
" %"PRIuMAX
" %"PRIuMAX
,
1630 oid_to_hex(&obj
->idx
.oid
),
1631 type_name(obj
->real_type
), (uintmax_t)obj
->size
,
1632 (uintmax_t)(obj
[1].idx
.offset
- obj
->idx
.offset
),
1633 (uintmax_t)obj
->idx
.offset
);
1634 if (is_delta_type(obj
->type
)) {
1635 struct object_entry
*bobj
= &objects
[obj_stat
[i
].base_object_no
];
1636 printf(" %u %s", obj_stat
[i
].delta_depth
,
1637 oid_to_hex(&bobj
->idx
.oid
));
1643 printf_ln(Q_("non delta: %d object",
1644 "non delta: %d objects",
1647 for (i
= 0; i
< deepest_delta
; i
++) {
1648 if (!chain_histogram
[i
])
1650 printf_ln(Q_("chain length = %d: %lu object",
1651 "chain length = %d: %lu objects",
1652 chain_histogram
[i
]),
1654 chain_histogram
[i
]);
1658 int cmd_index_pack(int argc
, const char **argv
, const char *prefix
)
1660 int i
, fix_thin_pack
= 0, verify
= 0, stat_only
= 0;
1661 const char *curr_index
;
1662 const char *index_name
= NULL
, *pack_name
= NULL
;
1663 const char *keep_msg
= NULL
;
1664 const char *promisor_msg
= NULL
;
1665 struct strbuf index_name_buf
= STRBUF_INIT
;
1666 struct pack_idx_entry
**idx_objects
;
1667 struct pack_idx_option opts
;
1668 unsigned char pack_hash
[GIT_MAX_RAWSZ
];
1669 unsigned foreign_nr
= 1; /* zero is a "good" value, assume bad */
1670 int report_end_of_input
= 0;
1673 * index-pack never needs to fetch missing objects except when
1674 * REF_DELTA bases are missing (which are explicitly handled). It only
1675 * accesses the repo to do hash collision checks and to check which
1676 * REF_DELTA bases need to be fetched.
1678 fetch_if_missing
= 0;
1680 if (argc
== 2 && !strcmp(argv
[1], "-h"))
1681 usage(index_pack_usage
);
1683 read_replace_refs
= 0;
1684 fsck_options
.walk
= mark_link
;
1686 reset_pack_idx_option(&opts
);
1687 git_config(git_index_pack_config
, &opts
);
1688 if (prefix
&& chdir(prefix
))
1689 die(_("Cannot come back to cwd"));
1691 for (i
= 1; i
< argc
; i
++) {
1692 const char *arg
= argv
[i
];
1695 if (!strcmp(arg
, "--stdin")) {
1697 } else if (!strcmp(arg
, "--fix-thin")) {
1699 } else if (skip_to_optional_arg(arg
, "--strict", &arg
)) {
1702 fsck_set_msg_types(&fsck_options
, arg
);
1703 } else if (!strcmp(arg
, "--check-self-contained-and-connected")) {
1705 check_self_contained_and_connected
= 1;
1706 } else if (!strcmp(arg
, "--fsck-objects")) {
1708 } else if (!strcmp(arg
, "--verify")) {
1710 } else if (!strcmp(arg
, "--verify-stat")) {
1713 } else if (!strcmp(arg
, "--verify-stat-only")) {
1717 } else if (skip_to_optional_arg(arg
, "--keep", &keep_msg
)) {
1718 ; /* nothing to do */
1719 } else if (skip_to_optional_arg(arg
, "--promisor", &promisor_msg
)) {
1720 ; /* already parsed */
1721 } else if (starts_with(arg
, "--threads=")) {
1723 nr_threads
= strtoul(arg
+10, &end
, 0);
1724 if (!arg
[10] || *end
|| nr_threads
< 0)
1725 usage(index_pack_usage
);
1726 if (!HAVE_THREADS
&& nr_threads
!= 1) {
1727 warning(_("no threads support, ignoring %s"), arg
);
1730 } else if (starts_with(arg
, "--pack_header=")) {
1731 struct pack_header
*hdr
;
1734 hdr
= (struct pack_header
*)input_buffer
;
1735 hdr
->hdr_signature
= htonl(PACK_SIGNATURE
);
1736 hdr
->hdr_version
= htonl(strtoul(arg
+ 14, &c
, 10));
1738 die(_("bad %s"), arg
);
1739 hdr
->hdr_entries
= htonl(strtoul(c
+ 1, &c
, 10));
1741 die(_("bad %s"), arg
);
1742 input_len
= sizeof(*hdr
);
1743 } else if (!strcmp(arg
, "-v")) {
1745 } else if (!strcmp(arg
, "--show-resolving-progress")) {
1746 show_resolving_progress
= 1;
1747 } else if (!strcmp(arg
, "--report-end-of-input")) {
1748 report_end_of_input
= 1;
1749 } else if (!strcmp(arg
, "-o")) {
1750 if (index_name
|| (i
+1) >= argc
)
1751 usage(index_pack_usage
);
1752 index_name
= argv
[++i
];
1753 } else if (starts_with(arg
, "--index-version=")) {
1755 opts
.version
= strtoul(arg
+ 16, &c
, 10);
1756 if (opts
.version
> 2)
1757 die(_("bad %s"), arg
);
1759 opts
.off32_limit
= strtoul(c
+1, &c
, 0);
1760 if (*c
|| opts
.off32_limit
& 0x80000000)
1761 die(_("bad %s"), arg
);
1762 } else if (skip_prefix(arg
, "--max-input-size=", &arg
)) {
1763 max_input_size
= strtoumax(arg
, NULL
, 10);
1765 usage(index_pack_usage
);
1770 usage(index_pack_usage
);
1774 if (!pack_name
&& !from_stdin
)
1775 usage(index_pack_usage
);
1776 if (fix_thin_pack
&& !from_stdin
)
1777 die(_("--fix-thin cannot be used without --stdin"));
1778 if (from_stdin
&& !startup_info
->have_repository
)
1779 die(_("--stdin requires a git repository"));
1780 if (!index_name
&& pack_name
)
1781 index_name
= derive_filename(pack_name
, "idx", &index_name_buf
);
1785 die(_("--verify with no packfile name given"));
1786 read_idx_option(&opts
, index_name
);
1787 opts
.flags
|= WRITE_IDX_VERIFY
| WRITE_IDX_STRICT
;
1790 opts
.flags
|= WRITE_IDX_STRICT
;
1792 if (HAVE_THREADS
&& !nr_threads
) {
1793 nr_threads
= online_cpus();
1794 /* An experiment showed that more threads does not mean faster */
1799 curr_pack
= open_pack_file(pack_name
);
1800 parse_pack_header();
1801 objects
= xcalloc(st_add(nr_objects
, 1), sizeof(struct object_entry
));
1803 obj_stat
= xcalloc(st_add(nr_objects
, 1), sizeof(struct object_stat
));
1804 ofs_deltas
= xcalloc(nr_objects
, sizeof(struct ofs_delta_entry
));
1805 parse_pack_objects(pack_hash
);
1806 if (report_end_of_input
)
1807 write_in_full(2, "\0", 1);
1809 conclude_pack(fix_thin_pack
, curr_pack
, pack_hash
);
1813 foreign_nr
= check_objects();
1816 show_pack_info(stat_only
);
1818 ALLOC_ARRAY(idx_objects
, nr_objects
);
1819 for (i
= 0; i
< nr_objects
; i
++)
1820 idx_objects
[i
] = &objects
[i
].idx
;
1821 curr_index
= write_idx_file(index_name
, idx_objects
, nr_objects
, &opts
, pack_hash
);
1825 final(pack_name
, curr_pack
,
1826 index_name
, curr_index
,
1827 keep_msg
, promisor_msg
,
1832 if (do_fsck_object
&& fsck_finish(&fsck_options
))
1833 die(_("fsck error in pack objects"));
1836 strbuf_release(&index_name_buf
);
1837 if (pack_name
== NULL
)
1838 free((void *) curr_pack
);
1839 if (index_name
== NULL
)
1840 free((void *) curr_index
);
1843 * Let the caller know this pack is not self contained
1845 if (check_self_contained_and_connected
&& foreign_nr
)