4 #include "commit-graph.h"
5 #include "repository.h"
6 #include "object-store.h"
13 #include "gpg-interface.h"
14 #include "mergesort.h"
15 #include "commit-slab.h"
16 #include "prio-queue.h"
17 #include "hash-lookup.h"
18 #include "wt-status.h"
21 #include "commit-reach.h"
22 #include "run-command.h"
26 static struct commit_extra_header
*read_commit_extra_header_lines(const char *buf
, size_t len
, const char **);
28 int save_commit_buffer
= 1;
29 int no_graft_file_deprecated_advice
;
31 const char *commit_type
= "commit";
33 struct commit
*lookup_commit_reference_gently(struct repository
*r
,
34 const struct object_id
*oid
, int quiet
)
36 struct object
*obj
= deref_tag(r
,
42 return object_as_type(obj
, OBJ_COMMIT
, quiet
);
45 struct commit
*lookup_commit_reference(struct repository
*r
, const struct object_id
*oid
)
47 return lookup_commit_reference_gently(r
, oid
, 0);
50 struct commit
*lookup_commit_or_die(const struct object_id
*oid
, const char *ref_name
)
52 struct commit
*c
= lookup_commit_reference(the_repository
, oid
);
54 die(_("could not parse %s"), ref_name
);
55 if (!oideq(oid
, &c
->object
.oid
)) {
56 warning(_("%s %s is not a commit!"),
57 ref_name
, oid_to_hex(oid
));
62 struct commit
*lookup_commit_object(struct repository
*r
,
63 const struct object_id
*oid
)
65 struct object
*obj
= parse_object(r
, oid
);
66 return obj
? object_as_type(obj
, OBJ_COMMIT
, 0) : NULL
;
70 struct commit
*lookup_commit(struct repository
*r
, const struct object_id
*oid
)
72 struct object
*obj
= lookup_object(r
, oid
);
74 return create_object(r
, oid
, alloc_commit_node(r
));
75 return object_as_type(obj
, OBJ_COMMIT
, 0);
78 struct commit
*lookup_commit_reference_by_name(const char *name
)
81 struct commit
*commit
;
83 if (get_oid_committish(name
, &oid
))
85 commit
= lookup_commit_reference(the_repository
, &oid
);
86 if (parse_commit(commit
))
91 static timestamp_t
parse_commit_date(const char *buf
, const char *tail
)
97 if (memcmp(buf
, "author", 6))
99 while (buf
< tail
&& *buf
++ != '\n')
103 if (memcmp(buf
, "committer", 9))
105 while (buf
< tail
&& *buf
++ != '>')
110 while (buf
< tail
&& *buf
++ != '\n')
114 /* dateptr < buf && buf[-1] == '\n', so parsing will stop at buf-1 */
115 return parse_timestamp(dateptr
, NULL
, 10);
118 static const struct object_id
*commit_graft_oid_access(size_t index
, const void *table
)
120 const struct commit_graft
* const *commit_graft_table
= table
;
121 return &commit_graft_table
[index
]->oid
;
124 int commit_graft_pos(struct repository
*r
, const struct object_id
*oid
)
126 return oid_pos(oid
, r
->parsed_objects
->grafts
,
127 r
->parsed_objects
->grafts_nr
,
128 commit_graft_oid_access
);
131 static void unparse_commit(struct repository
*r
, const struct object_id
*oid
)
133 struct commit
*c
= lookup_commit(r
, oid
);
135 if (!c
->object
.parsed
)
137 free_commit_list(c
->parents
);
139 c
->object
.parsed
= 0;
142 int register_commit_graft(struct repository
*r
, struct commit_graft
*graft
,
145 int pos
= commit_graft_pos(r
, &graft
->oid
);
151 free(r
->parsed_objects
->grafts
[pos
]);
152 r
->parsed_objects
->grafts
[pos
] = graft
;
157 ALLOC_GROW(r
->parsed_objects
->grafts
,
158 r
->parsed_objects
->grafts_nr
+ 1,
159 r
->parsed_objects
->grafts_alloc
);
160 r
->parsed_objects
->grafts_nr
++;
161 if (pos
< r
->parsed_objects
->grafts_nr
)
162 memmove(r
->parsed_objects
->grafts
+ pos
+ 1,
163 r
->parsed_objects
->grafts
+ pos
,
164 (r
->parsed_objects
->grafts_nr
- pos
- 1) *
165 sizeof(*r
->parsed_objects
->grafts
));
166 r
->parsed_objects
->grafts
[pos
] = graft
;
167 unparse_commit(r
, &graft
->oid
);
171 struct commit_graft
*read_graft_line(struct strbuf
*line
)
173 /* The format is just "Commit Parent1 Parent2 ...\n" */
175 const char *tail
= NULL
;
176 struct commit_graft
*graft
= NULL
;
177 struct object_id dummy_oid
, *oid
;
180 if (!line
->len
|| line
->buf
[0] == '#')
183 * phase 0 verifies line, counts hashes in line and allocates graft
184 * phase 1 fills graft
186 for (phase
= 0; phase
< 2; phase
++) {
187 oid
= graft
? &graft
->oid
: &dummy_oid
;
188 if (parse_oid_hex(line
->buf
, oid
, &tail
))
190 for (i
= 0; *tail
!= '\0'; i
++) {
191 oid
= graft
? &graft
->parent
[i
] : &dummy_oid
;
192 if (!isspace(*tail
++) || parse_oid_hex(tail
, oid
, &tail
))
196 graft
= xmalloc(st_add(sizeof(*graft
),
197 st_mult(sizeof(struct object_id
), i
)));
198 graft
->nr_parent
= i
;
204 error("bad graft data: %s", line
->buf
);
209 static int read_graft_file(struct repository
*r
, const char *graft_file
)
211 FILE *fp
= fopen_or_warn(graft_file
, "r");
212 struct strbuf buf
= STRBUF_INIT
;
215 if (!no_graft_file_deprecated_advice
&&
216 advice_enabled(ADVICE_GRAFT_FILE_DEPRECATED
))
217 advise(_("Support for <GIT_DIR>/info/grafts is deprecated\n"
218 "and will be removed in a future Git version.\n"
220 "Please use \"git replace --convert-graft-file\"\n"
221 "to convert the grafts into replace refs.\n"
223 "Turn this message off by running\n"
224 "\"git config advice.graftFileDeprecated false\""));
225 while (!strbuf_getwholeline(&buf
, fp
, '\n')) {
226 /* The format is just "Commit Parent1 Parent2 ...\n" */
227 struct commit_graft
*graft
= read_graft_line(&buf
);
230 if (register_commit_graft(r
, graft
, 1))
231 error("duplicate graft data: %s", buf
.buf
);
234 strbuf_release(&buf
);
238 void prepare_commit_graft(struct repository
*r
)
242 if (r
->parsed_objects
->commit_graft_prepared
)
244 if (!startup_info
->have_repository
)
247 graft_file
= get_graft_file(r
);
248 read_graft_file(r
, graft_file
);
249 /* make sure shallows are read */
250 is_repository_shallow(r
);
251 r
->parsed_objects
->commit_graft_prepared
= 1;
254 struct commit_graft
*lookup_commit_graft(struct repository
*r
, const struct object_id
*oid
)
257 prepare_commit_graft(r
);
258 pos
= commit_graft_pos(r
, oid
);
261 return r
->parsed_objects
->grafts
[pos
];
264 int for_each_commit_graft(each_commit_graft_fn fn
, void *cb_data
)
267 for (i
= ret
= 0; i
< the_repository
->parsed_objects
->grafts_nr
&& !ret
; i
++)
268 ret
= fn(the_repository
->parsed_objects
->grafts
[i
], cb_data
);
272 void reset_commit_grafts(struct repository
*r
)
276 for (i
= 0; i
< r
->parsed_objects
->grafts_nr
; i
++) {
277 unparse_commit(r
, &r
->parsed_objects
->grafts
[i
]->oid
);
278 free(r
->parsed_objects
->grafts
[i
]);
280 r
->parsed_objects
->grafts_nr
= 0;
281 r
->parsed_objects
->commit_graft_prepared
= 0;
284 struct commit_buffer
{
288 define_commit_slab(buffer_slab
, struct commit_buffer
);
290 struct buffer_slab
*allocate_commit_buffer_slab(void)
292 struct buffer_slab
*bs
= xmalloc(sizeof(*bs
));
293 init_buffer_slab(bs
);
297 void free_commit_buffer_slab(struct buffer_slab
*bs
)
299 clear_buffer_slab(bs
);
303 void set_commit_buffer(struct repository
*r
, struct commit
*commit
, void *buffer
, unsigned long size
)
305 struct commit_buffer
*v
= buffer_slab_at(
306 r
->parsed_objects
->buffer_slab
, commit
);
311 const void *get_cached_commit_buffer(struct repository
*r
, const struct commit
*commit
, unsigned long *sizep
)
313 struct commit_buffer
*v
= buffer_slab_peek(
314 r
->parsed_objects
->buffer_slab
, commit
);
325 const void *repo_get_commit_buffer(struct repository
*r
,
326 const struct commit
*commit
,
327 unsigned long *sizep
)
329 const void *ret
= get_cached_commit_buffer(r
, commit
, sizep
);
331 enum object_type type
;
333 ret
= repo_read_object_file(r
, &commit
->object
.oid
, &type
, &size
);
335 die("cannot read commit object %s",
336 oid_to_hex(&commit
->object
.oid
));
337 if (type
!= OBJ_COMMIT
)
338 die("expected commit for %s, got %s",
339 oid_to_hex(&commit
->object
.oid
), type_name(type
));
346 void repo_unuse_commit_buffer(struct repository
*r
,
347 const struct commit
*commit
,
350 struct commit_buffer
*v
= buffer_slab_peek(
351 r
->parsed_objects
->buffer_slab
, commit
);
352 if (!(v
&& v
->buffer
== buffer
))
353 free((void *)buffer
);
356 void free_commit_buffer(struct parsed_object_pool
*pool
, struct commit
*commit
)
358 struct commit_buffer
*v
= buffer_slab_peek(
359 pool
->buffer_slab
, commit
);
361 FREE_AND_NULL(v
->buffer
);
366 static inline void set_commit_tree(struct commit
*c
, struct tree
*t
)
371 struct tree
*repo_get_commit_tree(struct repository
*r
,
372 const struct commit
*commit
)
374 if (commit
->maybe_tree
|| !commit
->object
.parsed
)
375 return commit
->maybe_tree
;
377 if (commit_graph_position(commit
) != COMMIT_NOT_FROM_GRAPH
)
378 return get_commit_tree_in_graph(r
, commit
);
383 struct object_id
*get_commit_tree_oid(const struct commit
*commit
)
385 struct tree
*tree
= get_commit_tree(commit
);
386 return tree
? &tree
->object
.oid
: NULL
;
389 void release_commit_memory(struct parsed_object_pool
*pool
, struct commit
*c
)
391 set_commit_tree(c
, NULL
);
392 free_commit_buffer(pool
, c
);
394 free_commit_list(c
->parents
);
396 c
->object
.parsed
= 0;
399 const void *detach_commit_buffer(struct commit
*commit
, unsigned long *sizep
)
401 struct commit_buffer
*v
= buffer_slab_peek(
402 the_repository
->parsed_objects
->buffer_slab
, commit
);
419 int parse_commit_buffer(struct repository
*r
, struct commit
*item
, const void *buffer
, unsigned long size
, int check_graph
)
421 const char *tail
= buffer
;
422 const char *bufptr
= buffer
;
423 struct object_id parent
;
424 struct commit_list
**pptr
;
425 struct commit_graft
*graft
;
426 const int tree_entry_len
= the_hash_algo
->hexsz
+ 5;
427 const int parent_entry_len
= the_hash_algo
->hexsz
+ 7;
430 if (item
->object
.parsed
)
433 * Presumably this is leftover from an earlier failed parse;
434 * clear it out in preparation for us re-parsing (we'll hit the
435 * same error, but that's good, since it lets our caller know
436 * the result cannot be trusted.
438 free_commit_list(item
->parents
);
439 item
->parents
= NULL
;
442 if (tail
<= bufptr
+ tree_entry_len
+ 1 || memcmp(bufptr
, "tree ", 5) ||
443 bufptr
[tree_entry_len
] != '\n')
444 return error("bogus commit object %s", oid_to_hex(&item
->object
.oid
));
445 if (get_oid_hex(bufptr
+ 5, &parent
) < 0)
446 return error("bad tree pointer in commit %s",
447 oid_to_hex(&item
->object
.oid
));
448 tree
= lookup_tree(r
, &parent
);
450 return error("bad tree pointer %s in commit %s",
452 oid_to_hex(&item
->object
.oid
));
453 set_commit_tree(item
, tree
);
454 bufptr
+= tree_entry_len
+ 1; /* "tree " + "hex sha1" + "\n" */
455 pptr
= &item
->parents
;
457 graft
= lookup_commit_graft(r
, &item
->object
.oid
);
459 r
->parsed_objects
->substituted_parent
= 1;
460 while (bufptr
+ parent_entry_len
< tail
&& !memcmp(bufptr
, "parent ", 7)) {
461 struct commit
*new_parent
;
463 if (tail
<= bufptr
+ parent_entry_len
+ 1 ||
464 get_oid_hex(bufptr
+ 7, &parent
) ||
465 bufptr
[parent_entry_len
] != '\n')
466 return error("bad parents in commit %s", oid_to_hex(&item
->object
.oid
));
467 bufptr
+= parent_entry_len
+ 1;
469 * The clone is shallow if nr_parent < 0, and we must
470 * not traverse its real parents even when we unhide them.
472 if (graft
&& (graft
->nr_parent
< 0 || grafts_replace_parents
))
474 new_parent
= lookup_commit(r
, &parent
);
476 return error("bad parent %s in commit %s",
478 oid_to_hex(&item
->object
.oid
));
479 pptr
= &commit_list_insert(new_parent
, pptr
)->next
;
483 struct commit
*new_parent
;
484 for (i
= 0; i
< graft
->nr_parent
; i
++) {
485 new_parent
= lookup_commit(r
,
488 return error("bad graft parent %s in commit %s",
489 oid_to_hex(&graft
->parent
[i
]),
490 oid_to_hex(&item
->object
.oid
));
491 pptr
= &commit_list_insert(new_parent
, pptr
)->next
;
494 item
->date
= parse_commit_date(bufptr
, tail
);
497 load_commit_graph_info(r
, item
);
499 item
->object
.parsed
= 1;
503 int repo_parse_commit_internal(struct repository
*r
,
505 int quiet_on_missing
,
506 int use_commit_graph
)
508 enum object_type type
;
511 struct object_info oi
= {
517 * Git does not support partial clones that exclude commits, so set
518 * OBJECT_INFO_SKIP_FETCH_OBJECT to fail fast when an object is missing.
520 int flags
= OBJECT_INFO_LOOKUP_REPLACE
| OBJECT_INFO_SKIP_FETCH_OBJECT
|
521 OBJECT_INFO_DIE_IF_CORRUPT
;
526 if (item
->object
.parsed
)
528 if (use_commit_graph
&& parse_commit_in_graph(r
, item
))
531 if (oid_object_info_extended(r
, &item
->object
.oid
, &oi
, flags
) < 0)
532 return quiet_on_missing
? -1 :
533 error("Could not read %s",
534 oid_to_hex(&item
->object
.oid
));
535 if (type
!= OBJ_COMMIT
) {
537 return error("Object %s not a commit",
538 oid_to_hex(&item
->object
.oid
));
541 ret
= parse_commit_buffer(r
, item
, buffer
, size
, 0);
542 if (save_commit_buffer
&& !ret
) {
543 set_commit_buffer(r
, item
, buffer
, size
);
550 int repo_parse_commit_gently(struct repository
*r
,
551 struct commit
*item
, int quiet_on_missing
)
553 return repo_parse_commit_internal(r
, item
, quiet_on_missing
, 1);
556 void parse_commit_or_die(struct commit
*item
)
558 if (parse_commit(item
))
559 die("unable to parse commit %s",
560 item
? oid_to_hex(&item
->object
.oid
) : "(null)");
563 int find_commit_subject(const char *commit_buffer
, const char **subject
)
566 const char *p
= commit_buffer
;
568 while (*p
&& (*p
!= '\n' || p
[1] != '\n'))
571 p
= skip_blank_lines(p
+ 2);
572 eol
= strchrnul(p
, '\n');
581 size_t commit_subject_length(const char *body
)
583 const char *p
= body
;
585 const char *next
= skip_blank_lines(p
);
588 p
= strchrnul(p
, '\n');
595 struct commit_list
*commit_list_insert(struct commit
*item
, struct commit_list
**list_p
)
597 struct commit_list
*new_list
= xmalloc(sizeof(struct commit_list
));
598 new_list
->item
= item
;
599 new_list
->next
= *list_p
;
604 int commit_list_contains(struct commit
*item
, struct commit_list
*list
)
607 if (list
->item
== item
)
615 unsigned commit_list_count(const struct commit_list
*l
)
618 for (; l
; l
= l
->next
)
623 struct commit_list
*copy_commit_list(struct commit_list
*list
)
625 struct commit_list
*head
= NULL
;
626 struct commit_list
**pp
= &head
;
628 pp
= commit_list_append(list
->item
, pp
);
634 struct commit_list
*reverse_commit_list(struct commit_list
*list
)
636 struct commit_list
*next
= NULL
, *current
, *backup
;
637 for (current
= list
; current
; current
= backup
) {
638 backup
= current
->next
;
639 current
->next
= next
;
645 void free_commit_list(struct commit_list
*list
)
651 struct commit_list
* commit_list_insert_by_date(struct commit
*item
, struct commit_list
**list
)
653 struct commit_list
**pp
= list
;
654 struct commit_list
*p
;
655 while ((p
= *pp
) != NULL
) {
656 if (p
->item
->date
< item
->date
) {
661 return commit_list_insert(item
, pp
);
664 static int commit_list_compare_by_date(const struct commit_list
*a
,
665 const struct commit_list
*b
)
667 timestamp_t a_date
= a
->item
->date
;
668 timestamp_t b_date
= b
->item
->date
;
676 DEFINE_LIST_SORT(static, commit_list_sort
, struct commit_list
, next
);
678 void commit_list_sort_by_date(struct commit_list
**list
)
680 commit_list_sort(list
, commit_list_compare_by_date
);
683 struct commit
*pop_most_recent_commit(struct commit_list
**list
,
686 struct commit
*ret
= pop_commit(list
);
687 struct commit_list
*parents
= ret
->parents
;
690 struct commit
*commit
= parents
->item
;
691 if (!parse_commit(commit
) && !(commit
->object
.flags
& mark
)) {
692 commit
->object
.flags
|= mark
;
693 commit_list_insert_by_date(commit
, list
);
695 parents
= parents
->next
;
700 static void clear_commit_marks_1(struct commit_list
**plist
,
701 struct commit
*commit
, unsigned int mark
)
704 struct commit_list
*parents
;
706 if (!(mark
& commit
->object
.flags
))
709 commit
->object
.flags
&= ~mark
;
711 parents
= commit
->parents
;
715 while ((parents
= parents
->next
)) {
716 if (parents
->item
->object
.flags
& mark
)
717 commit_list_insert(parents
->item
, plist
);
720 commit
= commit
->parents
->item
;
724 void clear_commit_marks_many(int nr
, struct commit
**commit
, unsigned int mark
)
726 struct commit_list
*list
= NULL
;
729 clear_commit_marks_1(&list
, *commit
, mark
);
733 clear_commit_marks_1(&list
, pop_commit(&list
), mark
);
736 void clear_commit_marks(struct commit
*commit
, unsigned int mark
)
738 clear_commit_marks_many(1, &commit
, mark
);
741 struct commit
*pop_commit(struct commit_list
**stack
)
743 struct commit_list
*top
= *stack
;
744 struct commit
*item
= top
? top
->item
: NULL
;
754 * Topological sort support
757 /* count number of children that have not been emitted */
758 define_commit_slab(indegree_slab
, int);
760 define_commit_slab(author_date_slab
, timestamp_t
);
762 void record_author_date(struct author_date_slab
*author_date
,
763 struct commit
*commit
)
765 const char *buffer
= get_commit_buffer(commit
, NULL
);
766 struct ident_split ident
;
767 const char *ident_line
;
772 ident_line
= find_commit_header(buffer
, "author", &ident_len
);
774 goto fail_exit
; /* no author line */
775 if (split_ident_line(&ident
, ident_line
, ident_len
) ||
776 !ident
.date_begin
|| !ident
.date_end
)
777 goto fail_exit
; /* malformed "author" line */
779 date
= parse_timestamp(ident
.date_begin
, &date_end
, 10);
780 if (date_end
!= ident
.date_end
)
781 goto fail_exit
; /* malformed date */
782 *(author_date_slab_at(author_date
, commit
)) = date
;
785 unuse_commit_buffer(commit
, buffer
);
788 int compare_commits_by_author_date(const void *a_
, const void *b_
,
791 const struct commit
*a
= a_
, *b
= b_
;
792 struct author_date_slab
*author_date
= cb_data
;
793 timestamp_t a_date
= *(author_date_slab_at(author_date
, a
));
794 timestamp_t b_date
= *(author_date_slab_at(author_date
, b
));
796 /* newer commits with larger date first */
799 else if (a_date
> b_date
)
804 int compare_commits_by_gen_then_commit_date(const void *a_
, const void *b_
, void *unused
)
806 const struct commit
*a
= a_
, *b
= b_
;
807 const timestamp_t generation_a
= commit_graph_generation(a
),
808 generation_b
= commit_graph_generation(b
);
810 /* newer commits first */
811 if (generation_a
< generation_b
)
813 else if (generation_a
> generation_b
)
816 /* use date as a heuristic when generations are equal */
817 if (a
->date
< b
->date
)
819 else if (a
->date
> b
->date
)
824 int compare_commits_by_commit_date(const void *a_
, const void *b_
, void *unused
)
826 const struct commit
*a
= a_
, *b
= b_
;
827 /* newer commits with larger date first */
828 if (a
->date
< b
->date
)
830 else if (a
->date
> b
->date
)
836 * Performs an in-place topological sort on the list supplied.
838 void sort_in_topological_order(struct commit_list
**list
, enum rev_sort_order sort_order
)
840 struct commit_list
*next
, *orig
= *list
;
841 struct commit_list
**pptr
;
842 struct indegree_slab indegree
;
843 struct prio_queue queue
;
844 struct commit
*commit
;
845 struct author_date_slab author_date
;
851 init_indegree_slab(&indegree
);
852 memset(&queue
, '\0', sizeof(queue
));
854 switch (sort_order
) {
855 default: /* REV_SORT_IN_GRAPH_ORDER */
856 queue
.compare
= NULL
;
858 case REV_SORT_BY_COMMIT_DATE
:
859 queue
.compare
= compare_commits_by_commit_date
;
861 case REV_SORT_BY_AUTHOR_DATE
:
862 init_author_date_slab(&author_date
);
863 queue
.compare
= compare_commits_by_author_date
;
864 queue
.cb_data
= &author_date
;
868 /* Mark them and clear the indegree */
869 for (next
= orig
; next
; next
= next
->next
) {
870 struct commit
*commit
= next
->item
;
871 *(indegree_slab_at(&indegree
, commit
)) = 1;
872 /* also record the author dates, if needed */
873 if (sort_order
== REV_SORT_BY_AUTHOR_DATE
)
874 record_author_date(&author_date
, commit
);
877 /* update the indegree */
878 for (next
= orig
; next
; next
= next
->next
) {
879 struct commit_list
*parents
= next
->item
->parents
;
881 struct commit
*parent
= parents
->item
;
882 int *pi
= indegree_slab_at(&indegree
, parent
);
886 parents
= parents
->next
;
893 * tips are nodes not reachable from any other node in the list
895 * the tips serve as a starting set for the work queue.
897 for (next
= orig
; next
; next
= next
->next
) {
898 struct commit
*commit
= next
->item
;
900 if (*(indegree_slab_at(&indegree
, commit
)) == 1)
901 prio_queue_put(&queue
, commit
);
905 * This is unfortunate; the initial tips need to be shown
906 * in the order given from the revision traversal machinery.
908 if (sort_order
== REV_SORT_IN_GRAPH_ORDER
)
909 prio_queue_reverse(&queue
);
911 /* We no longer need the commit list */
912 free_commit_list(orig
);
916 while ((commit
= prio_queue_get(&queue
)) != NULL
) {
917 struct commit_list
*parents
;
919 for (parents
= commit
->parents
; parents
; parents
= parents
->next
) {
920 struct commit
*parent
= parents
->item
;
921 int *pi
= indegree_slab_at(&indegree
, parent
);
927 * parents are only enqueued for emission
928 * when all their children have been emitted thereby
929 * guaranteeing topological order.
932 prio_queue_put(&queue
, parent
);
935 * all children of commit have already been
936 * emitted. we can emit it now.
938 *(indegree_slab_at(&indegree
, commit
)) = 0;
940 pptr
= &commit_list_insert(commit
, pptr
)->next
;
943 clear_indegree_slab(&indegree
);
944 clear_prio_queue(&queue
);
945 if (sort_order
== REV_SORT_BY_AUTHOR_DATE
)
946 clear_author_date_slab(&author_date
);
950 struct commit
**commit
;
953 unsigned int initial
: 1;
956 static void add_one_commit(struct object_id
*oid
, struct rev_collect
*revs
)
958 struct commit
*commit
;
960 if (is_null_oid(oid
))
963 commit
= lookup_commit(the_repository
, oid
);
965 (commit
->object
.flags
& TMP_MARK
) ||
966 parse_commit(commit
))
969 ALLOC_GROW(revs
->commit
, revs
->nr
+ 1, revs
->alloc
);
970 revs
->commit
[revs
->nr
++] = commit
;
971 commit
->object
.flags
|= TMP_MARK
;
974 static int collect_one_reflog_ent(struct object_id
*ooid
, struct object_id
*noid
,
975 const char *ident UNUSED
,
976 timestamp_t timestamp UNUSED
, int tz UNUSED
,
977 const char *message UNUSED
, void *cbdata
)
979 struct rev_collect
*revs
= cbdata
;
983 add_one_commit(ooid
, revs
);
985 add_one_commit(noid
, revs
);
989 struct commit
*get_fork_point(const char *refname
, struct commit
*commit
)
991 struct object_id oid
;
992 struct rev_collect revs
;
993 struct commit_list
*bases
;
995 struct commit
*ret
= NULL
;
998 switch (dwim_ref(refname
, strlen(refname
), &oid
, &full_refname
, 0)) {
1000 die("No such ref: '%s'", refname
);
1004 die("Ambiguous refname: '%s'", refname
);
1007 memset(&revs
, 0, sizeof(revs
));
1009 for_each_reflog_ent(full_refname
, collect_one_reflog_ent
, &revs
);
1012 add_one_commit(&oid
, &revs
);
1014 for (i
= 0; i
< revs
.nr
; i
++)
1015 revs
.commit
[i
]->object
.flags
&= ~TMP_MARK
;
1017 bases
= get_merge_bases_many(commit
, revs
.nr
, revs
.commit
);
1020 * There should be one and only one merge base, when we found
1021 * a common ancestor among reflog entries.
1023 if (!bases
|| bases
->next
)
1024 goto cleanup_return
;
1026 /* And the found one must be one of the reflog entries */
1027 for (i
= 0; i
< revs
.nr
; i
++)
1028 if (&bases
->item
->object
== &revs
.commit
[i
]->object
)
1031 goto cleanup_return
;
1037 free_commit_list(bases
);
1043 * Indexed by hash algorithm identifier.
1045 static const char *gpg_sig_headers
[] = {
1051 int sign_with_header(struct strbuf
*buf
, const char *keyid
)
1053 struct strbuf sig
= STRBUF_INIT
;
1054 int inspos
, copypos
;
1056 const char *gpg_sig_header
= gpg_sig_headers
[hash_algo_by_ptr(the_hash_algo
)];
1057 int gpg_sig_header_len
= strlen(gpg_sig_header
);
1059 /* find the end of the header */
1060 eoh
= strstr(buf
->buf
, "\n\n");
1064 inspos
= eoh
- buf
->buf
+ 1;
1066 if (!keyid
|| !*keyid
)
1067 keyid
= get_signing_key();
1068 if (sign_buffer(buf
, &sig
, keyid
)) {
1069 strbuf_release(&sig
);
1073 for (copypos
= 0; sig
.buf
[copypos
]; ) {
1074 const char *bol
= sig
.buf
+ copypos
;
1075 const char *eol
= strchrnul(bol
, '\n');
1076 int len
= (eol
- bol
) + !!*eol
;
1079 strbuf_insert(buf
, inspos
, gpg_sig_header
, gpg_sig_header_len
);
1080 inspos
+= gpg_sig_header_len
;
1082 strbuf_insertstr(buf
, inspos
++, " ");
1083 strbuf_insert(buf
, inspos
, bol
, len
);
1087 strbuf_release(&sig
);
1093 int parse_signed_commit(const struct commit
*commit
,
1094 struct strbuf
*payload
, struct strbuf
*signature
,
1095 const struct git_hash_algo
*algop
)
1098 const char *buffer
= get_commit_buffer(commit
, &size
);
1099 int ret
= parse_buffer_signed_by_header(buffer
, size
, payload
, signature
, algop
);
1101 unuse_commit_buffer(commit
, buffer
);
1105 int parse_buffer_signed_by_header(const char *buffer
,
1107 struct strbuf
*payload
,
1108 struct strbuf
*signature
,
1109 const struct git_hash_algo
*algop
)
1111 int in_signature
= 0, saw_signature
= 0, other_signature
= 0;
1112 const char *line
, *tail
, *p
;
1113 const char *gpg_sig_header
= gpg_sig_headers
[hash_algo_by_ptr(algop
)];
1116 tail
= buffer
+ size
;
1117 while (line
< tail
) {
1118 const char *sig
= NULL
;
1119 const char *next
= memchr(line
, '\n', tail
- line
);
1121 next
= next
? next
+ 1 : tail
;
1122 if (in_signature
&& line
[0] == ' ')
1124 else if (skip_prefix(line
, gpg_sig_header
, &p
) &&
1126 sig
= line
+ strlen(gpg_sig_header
) + 1;
1127 other_signature
= 0;
1129 else if (starts_with(line
, "gpgsig"))
1130 other_signature
= 1;
1131 else if (other_signature
&& line
[0] != ' ')
1132 other_signature
= 0;
1134 strbuf_add(signature
, sig
, next
- sig
);
1139 /* dump the whole remainder of the buffer */
1141 if (!other_signature
)
1142 strbuf_add(payload
, line
, next
- line
);
1147 return saw_signature
;
1150 int remove_signature(struct strbuf
*buf
)
1152 const char *line
= buf
->buf
;
1153 const char *tail
= buf
->buf
+ buf
->len
;
1154 int in_signature
= 0;
1158 } sigs
[2], *sigp
= &sigs
[0];
1160 const char *orig_buf
= buf
->buf
;
1162 memset(sigs
, 0, sizeof(sigs
));
1164 while (line
< tail
) {
1165 const char *next
= memchr(line
, '\n', tail
- line
);
1166 next
= next
? next
+ 1 : tail
;
1168 if (in_signature
&& line
[0] == ' ')
1170 else if (starts_with(line
, "gpgsig")) {
1172 for (i
= 1; i
< GIT_HASH_NALGOS
; i
++) {
1174 if (skip_prefix(line
, gpg_sig_headers
[i
], &p
) &&
1183 /* dump the whole remainder of the buffer */
1185 if (in_signature
&& sigp
- sigs
!= ARRAY_SIZE(sigs
))
1192 for (i
= ARRAY_SIZE(sigs
) - 1; i
>= 0; i
--)
1194 strbuf_remove(buf
, sigs
[i
].start
- orig_buf
, sigs
[i
].end
- sigs
[i
].start
);
1196 return sigs
[0].start
!= NULL
;
1199 static void handle_signed_tag(struct commit
*parent
, struct commit_extra_header
***tail
)
1201 struct merge_remote_desc
*desc
;
1202 struct commit_extra_header
*mergetag
;
1205 enum object_type type
;
1206 struct strbuf payload
= STRBUF_INIT
;
1207 struct strbuf signature
= STRBUF_INIT
;
1209 desc
= merge_remote_util(parent
);
1210 if (!desc
|| !desc
->obj
)
1212 buf
= read_object_file(&desc
->obj
->oid
, &type
, &size
);
1213 if (!buf
|| type
!= OBJ_TAG
)
1215 if (!parse_signature(buf
, size
, &payload
, &signature
))
1218 * We could verify this signature and either omit the tag when
1219 * it does not validate, but the integrator may not have the
1220 * public key of the signer of the tag being merged, while a
1221 * later auditor may have it while auditing, so let's not run
1222 * verify-signed-buffer here for now...
1224 * if (verify_signed_buffer(buf, len, buf + len, size - len, ...))
1225 * warn("warning: signed tag unverified.");
1227 CALLOC_ARRAY(mergetag
, 1);
1228 mergetag
->key
= xstrdup("mergetag");
1229 mergetag
->value
= buf
;
1230 mergetag
->len
= size
;
1233 *tail
= &mergetag
->next
;
1234 strbuf_release(&payload
);
1235 strbuf_release(&signature
);
1242 int check_commit_signature(const struct commit
*commit
, struct signature_check
*sigc
)
1244 struct strbuf payload
= STRBUF_INIT
;
1245 struct strbuf signature
= STRBUF_INIT
;
1250 if (parse_signed_commit(commit
, &payload
, &signature
, the_hash_algo
) <= 0)
1253 sigc
->payload_type
= SIGNATURE_PAYLOAD_COMMIT
;
1254 sigc
->payload
= strbuf_detach(&payload
, &sigc
->payload_len
);
1255 ret
= check_signature(sigc
, signature
.buf
, signature
.len
);
1258 strbuf_release(&payload
);
1259 strbuf_release(&signature
);
1264 void verify_merge_signature(struct commit
*commit
, int verbosity
,
1267 char hex
[GIT_MAX_HEXSZ
+ 1];
1268 struct signature_check signature_check
;
1270 memset(&signature_check
, 0, sizeof(signature_check
));
1272 ret
= check_commit_signature(commit
, &signature_check
);
1274 find_unique_abbrev_r(hex
, &commit
->object
.oid
, DEFAULT_ABBREV
);
1275 switch (signature_check
.result
) {
1277 if (ret
|| (check_trust
&& signature_check
.trust_level
< TRUST_MARGINAL
))
1278 die(_("Commit %s has an untrusted GPG signature, "
1279 "allegedly by %s."), hex
, signature_check
.signer
);
1282 die(_("Commit %s has a bad GPG signature "
1283 "allegedly by %s."), hex
, signature_check
.signer
);
1285 die(_("Commit %s does not have a GPG signature."), hex
);
1287 if (verbosity
>= 0 && signature_check
.result
== 'G')
1288 printf(_("Commit %s has a good GPG signature by %s\n"),
1289 hex
, signature_check
.signer
);
1291 signature_check_clear(&signature_check
);
1294 void append_merge_tag_headers(struct commit_list
*parents
,
1295 struct commit_extra_header
***tail
)
1298 struct commit
*parent
= parents
->item
;
1299 handle_signed_tag(parent
, tail
);
1300 parents
= parents
->next
;
1304 static void add_extra_header(struct strbuf
*buffer
,
1305 struct commit_extra_header
*extra
)
1307 strbuf_addstr(buffer
, extra
->key
);
1309 strbuf_add_lines(buffer
, " ", extra
->value
, extra
->len
);
1311 strbuf_addch(buffer
, '\n');
1314 struct commit_extra_header
*read_commit_extra_headers(struct commit
*commit
,
1315 const char **exclude
)
1317 struct commit_extra_header
*extra
= NULL
;
1319 const char *buffer
= get_commit_buffer(commit
, &size
);
1320 extra
= read_commit_extra_header_lines(buffer
, size
, exclude
);
1321 unuse_commit_buffer(commit
, buffer
);
1325 int for_each_mergetag(each_mergetag_fn fn
, struct commit
*commit
, void *data
)
1327 struct commit_extra_header
*extra
, *to_free
;
1330 to_free
= read_commit_extra_headers(commit
, NULL
);
1331 for (extra
= to_free
; !res
&& extra
; extra
= extra
->next
) {
1332 if (strcmp(extra
->key
, "mergetag"))
1333 continue; /* not a merge tag */
1334 res
= fn(commit
, extra
, data
);
1336 free_commit_extra_headers(to_free
);
1340 static inline int standard_header_field(const char *field
, size_t len
)
1342 return ((len
== 4 && !memcmp(field
, "tree", 4)) ||
1343 (len
== 6 && !memcmp(field
, "parent", 6)) ||
1344 (len
== 6 && !memcmp(field
, "author", 6)) ||
1345 (len
== 9 && !memcmp(field
, "committer", 9)) ||
1346 (len
== 8 && !memcmp(field
, "encoding", 8)));
1349 static int excluded_header_field(const char *field
, size_t len
, const char **exclude
)
1355 size_t xlen
= strlen(*exclude
);
1356 if (len
== xlen
&& !memcmp(field
, *exclude
, xlen
))
1363 static struct commit_extra_header
*read_commit_extra_header_lines(
1364 const char *buffer
, size_t size
,
1365 const char **exclude
)
1367 struct commit_extra_header
*extra
= NULL
, **tail
= &extra
, *it
= NULL
;
1368 const char *line
, *next
, *eof
, *eob
;
1369 struct strbuf buf
= STRBUF_INIT
;
1371 for (line
= buffer
, eob
= line
+ size
;
1372 line
< eob
&& *line
!= '\n';
1374 next
= memchr(line
, '\n', eob
- line
);
1375 next
= next
? next
+ 1 : eob
;
1379 strbuf_add(&buf
, line
+ 1, next
- (line
+ 1));
1383 it
->value
= strbuf_detach(&buf
, &it
->len
);
1387 eof
= memchr(line
, ' ', next
- line
);
1390 else if (standard_header_field(line
, eof
- line
) ||
1391 excluded_header_field(line
, eof
- line
, exclude
))
1394 CALLOC_ARRAY(it
, 1);
1395 it
->key
= xmemdupz(line
, eof
-line
);
1399 strbuf_add(&buf
, eof
+ 1, next
- (eof
+ 1));
1402 it
->value
= strbuf_detach(&buf
, &it
->len
);
1406 void free_commit_extra_headers(struct commit_extra_header
*extra
)
1409 struct commit_extra_header
*next
= extra
->next
;
/*
 * Convenience front end for commit_tree_extended(): builds the extra
 * header list with append_merge_tag_headers() from the parents, passes a
 * NULL committer, and frees the extra headers afterwards.
 *
 * Returns whatever commit_tree_extended() returned.
 */
int commit_tree(const char *msg, size_t msg_len, const struct object_id *tree,
		struct commit_list *parents, struct object_id *ret,
		const char *author, const char *sign_commit)
{
	struct commit_extra_header *mergetags = NULL;
	struct commit_extra_header **tail = &mergetags;
	int status;

	append_merge_tag_headers(parents, &tail);
	status = commit_tree_extended(msg, msg_len, tree, parents, ret,
				      author, NULL, sign_commit, mergetags);
	free_commit_extra_headers(mergetags);
	return status;
}
/*
 * Scan the first len bytes of buf for a byte sequence that is not
 * acceptable UTF-8.
 *
 * Returns the offset of the first byte of the offending sequence, or -1
 * when the whole range checks out.
 */
static int find_invalid_utf8(const char *buf, int len)
{
	/* largest codepoint encodable with 0, 1, 2 and 3 continuation bytes */
	static const unsigned int max_codepoint[] = {
		0x7f, 0x7ff, 0xffff, 0x10ffff
	};
	int offset = 0;

	while (len) {
		unsigned char lead = *buf++;
		int extra = 0, seq_start, i;
		unsigned int codepoint;
		unsigned int lowest, highest;

		len--;
		offset++;

		/* Plain US-ASCII needs no further checks. */
		if (lead < 0x80)
			continue;

		seq_start = offset - 1;

		/*
		 * Every additional high bit that is set announces one more
		 * byte belonging to this sequence.
		 */
		for (; lead & 0x40; lead <<= 1)
			extra++;

		/*
		 * Only 1 to 3 continuation bytes are acceptable.  Anything
		 * longer would encode a codepoint beyond U+10FFFF, which can
		 * never exist.
		 */
		if (extra < 1 || extra > 3)
			return seq_start;

		/* The announced bytes must actually be present. */
		if (len < extra)
			return seq_start;

		/*
		 * Move the payload bits of the lead byte to the bottom of the
		 * value and work out the range valid for this length.
		 */
		codepoint = (lead & 0x7f) >> extra;
		lowest = max_codepoint[extra - 1] + 1;
		highest = max_codepoint[extra];

		offset += extra;
		len -= extra;

		/* Fold in the continuation bytes, checking their 10xxxxxx tag. */
		for (i = 0; i < extra; i++) {
			codepoint <<= 6;
			codepoint |= *buf & 0x3f;
			if ((*buf++ & 0xc0) != 0x80)
				return seq_start;
		}

		/* Out of range for the sequence length (e.g. overlong forms). */
		if (codepoint < lowest || codepoint > highest)
			return seq_start;
		/* Surrogates belong to UTF-16 and cannot appear in UTF-8. */
		if ((codepoint & 0x1ff800) == 0xd800)
			return seq_start;
		/* U+xxFFFE and U+xxFFFF are guaranteed non-characters. */
		if ((codepoint & 0xfffe) == 0xfffe)
			return seq_start;
		/* The same goes for the range U+FDD0..U+FDEF. */
		if (codepoint >= 0xfdd0 && codepoint <= 0xfdef)
			return seq_start;
	}
	return -1;
}
1510 * This verifies that the buffer is in proper utf8 format.
1512 * If it isn't, it assumes any non-utf8 characters are Latin1,
1513 * and does the conversion.
1515 static int verify_utf8(struct strbuf
*buf
)
1523 unsigned char replace
[2];
1525 bad
= find_invalid_utf8(buf
->buf
+ pos
, buf
->len
- pos
);
1531 strbuf_remove(buf
, pos
, 1);
1533 /* We know 'c' must be in the range 128-255 */
1534 replace
[0] = 0xc0 + (c
>> 6);
1535 replace
[1] = 0x80 + (c
& 0x3f);
1536 strbuf_insert(buf
, pos
, replace
, 2);
1541 static const char commit_utf8_warn
[] =
1542 N_("Warning: commit message did not conform to UTF-8.\n"
1543 "You may want to amend it after fixing the message, or set the config\n"
1544 "variable i18n.commitEncoding to the encoding your project uses.\n");
1546 int commit_tree_extended(const char *msg
, size_t msg_len
,
1547 const struct object_id
*tree
,
1548 struct commit_list
*parents
, struct object_id
*ret
,
1549 const char *author
, const char *committer
,
1550 const char *sign_commit
,
1551 struct commit_extra_header
*extra
)
1554 int encoding_is_utf8
;
1555 struct strbuf buffer
;
1557 assert_oid_type(tree
, OBJ_TREE
);
1559 if (memchr(msg
, '\0', msg_len
))
1560 return error("a NUL byte in commit log message not allowed.");
1562 /* Not having i18n.commitencoding is the same as having utf-8 */
1563 encoding_is_utf8
= is_encoding_utf8(git_commit_encoding
);
1565 strbuf_init(&buffer
, 8192); /* should avoid reallocs for the headers */
1566 strbuf_addf(&buffer
, "tree %s\n", oid_to_hex(tree
));
1569 * NOTE! This ordering means that the same exact tree merged with a
1570 * different order of parents will be a _different_ changeset even
1571 * if everything else stays the same.
1574 struct commit
*parent
= pop_commit(&parents
);
1575 strbuf_addf(&buffer
, "parent %s\n",
1576 oid_to_hex(&parent
->object
.oid
));
1579 /* Person/date information */
1581 author
= git_author_info(IDENT_STRICT
);
1582 strbuf_addf(&buffer
, "author %s\n", author
);
1584 committer
= git_committer_info(IDENT_STRICT
);
1585 strbuf_addf(&buffer
, "committer %s\n", committer
);
1586 if (!encoding_is_utf8
)
1587 strbuf_addf(&buffer
, "encoding %s\n", git_commit_encoding
);
1590 add_extra_header(&buffer
, extra
);
1591 extra
= extra
->next
;
1593 strbuf_addch(&buffer
, '\n');
1595 /* And add the comment */
1596 strbuf_add(&buffer
, msg
, msg_len
);
1598 /* And check the encoding */
1599 if (encoding_is_utf8
&& !verify_utf8(&buffer
))
1600 fprintf(stderr
, _(commit_utf8_warn
));
1602 if (sign_commit
&& sign_with_header(&buffer
, sign_commit
)) {
1607 result
= write_object_file(buffer
.buf
, buffer
.len
, OBJ_COMMIT
, ret
);
1609 strbuf_release(&buffer
);
1613 define_commit_slab(merge_desc_slab
, struct merge_remote_desc
*);
1614 static struct merge_desc_slab merge_desc_slab
= COMMIT_SLAB_INIT(1, merge_desc_slab
);
1616 struct merge_remote_desc
*merge_remote_util(struct commit
*commit
)
1618 return *merge_desc_slab_at(&merge_desc_slab
, commit
);
1621 void set_merge_remote_desc(struct commit
*commit
,
1622 const char *name
, struct object
*obj
)
1624 struct merge_remote_desc
*desc
;
1625 FLEX_ALLOC_STR(desc
, name
, name
);
1627 *merge_desc_slab_at(&merge_desc_slab
, commit
) = desc
;
1630 struct commit
*get_merge_parent(const char *name
)
1633 struct commit
*commit
;
1634 struct object_id oid
;
1635 if (get_oid(name
, &oid
))
1637 obj
= parse_object(the_repository
, &oid
);
1638 commit
= (struct commit
*)peel_to_type(name
, 0, obj
, OBJ_COMMIT
);
1639 if (commit
&& !merge_remote_util(commit
))
1640 set_merge_remote_desc(commit
, name
, obj
);
1645 * Append a commit to the end of the commit_list.
1647 * next starts by pointing to the variable that holds the head of an
1648 * empty commit_list, and is updated to point to the "next" field of
1649 * the last item on the list as new commits are appended.
1653 * struct commit_list *list;
1654 * struct commit_list **next = &list;
1656 * next = commit_list_append(c1, next);
1657 * next = commit_list_append(c2, next);
1658 * assert(commit_list_count(list) == 2);
1661 struct commit_list
**commit_list_append(struct commit
*commit
,
1662 struct commit_list
**next
)
1664 struct commit_list
*new_commit
= xmalloc(sizeof(struct commit_list
));
1665 new_commit
->item
= commit
;
1667 new_commit
->next
= NULL
;
1668 return &new_commit
->next
;
/*
 * Look for the header "key" in the first len bytes of msg.
 *
 * Lines are examined one at a time until an empty line or the end of the
 * range is reached.  A line matches when it starts with key followed by a
 * single space.
 *
 * On a match, returns a pointer to the first byte after that space and
 * stores in *out_len the number of bytes up to (not including) the end of
 * the line.  Returns NULL, leaving *out_len untouched, when no line
 * matches.
 *
 * The scan never looks at memory beyond msg + len: a final line that has
 * no newline inside the range ends at msg + len.
 */
const char *find_header_mem(const char *msg, size_t len,
			const char *key, size_t *out_len)
{
	size_t key_len = strlen(key);
	const char *end = msg + len;
	const char *line = msg;

	while (line < end) {
		const char *eol = memchr(line, '\n', end - line);

		/* last line without a newline: it stops at the range end */
		if (!eol)
			eol = end;

		/* an empty line terminates the header block */
		if (line == eol)
			return NULL;

		if ((size_t)(eol - line) > key_len &&
		    !strncmp(line, key, key_len) &&
		    line[key_len] == ' ') {
			*out_len = eol - line - key_len - 1;
			return line + key_len + 1;
		}

		if (eol == end)
			break;
		line = eol + 1;
	}
	return NULL;
}
/*
 * Same as find_header_mem(), for a NUL-terminated msg: the whole string
 * (as measured by strlen()) is searched for the header "key".
 */
const char *find_commit_header(const char *msg, const char *key, size_t *out_len)
{
	size_t msg_len = strlen(msg);

	return find_header_mem(msg, msg_len, key, out_len);
}
1706 * Inspect the given string and determine the true "end" of the log message, in
1707 * order to find where to put a new Signed-off-by trailer. Ignored are
1708 * trailing comment lines and blank lines. To support "git commit -s
1709 * --amend" on an existing commit, we also ignore "Conflicts:". To
1710 * support "git commit -v", we truncate at cut lines.
1712 * Returns the number of bytes from the tail to ignore, to be fed as
1713 * the second parameter to append_signoff().
1715 size_t ignore_non_trailer(const char *buf
, size_t len
)
1719 int in_old_conflicts_block
= 0;
1720 size_t cutoff
= wt_status_locate_end(buf
, len
);
1722 while (bol
< cutoff
) {
1723 const char *next_line
= memchr(buf
+ bol
, '\n', len
- bol
);
1726 next_line
= buf
+ len
;
1730 if (buf
[bol
] == comment_line_char
|| buf
[bol
] == '\n') {
1731 /* is this the first of the run of comments? */
1734 /* otherwise, it is just continuing */
1735 } else if (starts_with(buf
+ bol
, "Conflicts:\n")) {
1736 in_old_conflicts_block
= 1;
1739 } else if (in_old_conflicts_block
&& buf
[bol
] == '\t') {
1740 ; /* a pathname in the conflicts block */
1742 /* the previous was not trailing comment */
1744 in_old_conflicts_block
= 0;
1746 bol
= next_line
- buf
;
1748 return boc
? len
- boc
: len
- cutoff
;
1751 int run_commit_hook(int editor_is_used
, const char *index_file
,
1752 int *invoked_hook
, const char *name
, ...)
1754 struct run_hooks_opt opt
= RUN_HOOKS_OPT_INIT
;
1758 strvec_pushf(&opt
.env
, "GIT_INDEX_FILE=%s", index_file
);
1761 * Let the hook know that no editor will be launched.
1763 if (!editor_is_used
)
1764 strvec_push(&opt
.env
, "GIT_EDITOR=:");
1766 va_start(args
, name
);
1767 while ((arg
= va_arg(args
, const char *)))
1768 strvec_push(&opt
.args
, arg
);
1771 opt
.invoked_hook
= invoked_hook
;
1772 return run_hooks_opt(name
, &opt
);