/*
 * Copyright (c) 2018, 2019, 2020 Stefan Sperling <stsp@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
17 #include <sys/types.h>
19 #include <sys/socket.h>
22 #include <sys/resource.h>
42 #include "got_error.h"
43 #include "got_reference.h"
44 #include "got_repository.h"
46 #include "got_cancel.h"
47 #include "got_object.h"
49 #include "got_lib_delta.h"
50 #include "got_lib_inflate.h"
51 #include "got_lib_object.h"
52 #include "got_lib_object_parse.h"
53 #include "got_lib_object_create.h"
54 #include "got_lib_pack.h"
55 #include "got_lib_privsep.h"
56 #include "got_lib_sha1.h"
57 #include "got_lib_object_cache.h"
58 #include "got_lib_repository.h"
59 #include "got_lib_gotconfig.h"
62 #define nitems(_a) (sizeof(_a) / sizeof((_a)[0]))
66 got_repo_get_path(struct got_repository
*repo
)
72 got_repo_get_path_git_dir(struct got_repository
*repo
)
74 return repo
->path_git_dir
;
78 got_repo_get_fd(struct got_repository
*repo
)
80 return repo
->gitdir_fd
;
84 got_repo_get_gitconfig_author_name(struct got_repository
*repo
)
86 return repo
->gitconfig_author_name
;
90 got_repo_get_gitconfig_author_email(struct got_repository
*repo
)
92 return repo
->gitconfig_author_email
;
96 got_repo_get_global_gitconfig_author_name(struct got_repository
*repo
)
98 return repo
->global_gitconfig_author_name
;
102 got_repo_get_global_gitconfig_author_email(struct got_repository
*repo
)
104 return repo
->global_gitconfig_author_email
;
108 got_repo_get_gitconfig_owner(struct got_repository
*repo
)
110 return repo
->gitconfig_owner
;
114 got_repo_get_gitconfig_extensions(char ***extensions
, int *nextensions
,
115 struct got_repository
*repo
)
117 *extensions
= repo
->extensions
;
118 *nextensions
= repo
->nextensions
;
122 got_repo_is_bare(struct got_repository
*repo
)
124 return (strcmp(repo
->path
, repo
->path_git_dir
) == 0);
128 get_path_git_child(struct got_repository
*repo
, const char *basename
)
132 if (asprintf(&path_child
, "%s/%s", repo
->path_git_dir
,
140 got_repo_get_path_objects(struct got_repository
*repo
)
142 return get_path_git_child(repo
, GOT_OBJECTS_DIR
);
146 got_repo_get_path_objects_pack(struct got_repository
*repo
)
148 return get_path_git_child(repo
, GOT_OBJECTS_PACK_DIR
);
152 got_repo_get_path_refs(struct got_repository
*repo
)
154 return get_path_git_child(repo
, GOT_REFS_DIR
);
158 got_repo_get_path_packed_refs(struct got_repository
*repo
)
160 return get_path_git_child(repo
, GOT_PACKED_REFS_FILE
);
164 get_path_head(struct got_repository
*repo
)
166 return get_path_git_child(repo
, GOT_HEAD_FILE
);
170 got_repo_get_path_gitconfig(struct got_repository
*repo
)
172 return get_path_git_child(repo
, GOT_GITCONFIG
);
176 got_repo_get_path_gotconfig(struct got_repository
*repo
)
178 return get_path_git_child(repo
, GOT_GOTCONFIG_FILENAME
);
181 const struct got_gotconfig
*
182 got_repo_get_gotconfig(struct got_repository
*repo
)
184 return repo
->gotconfig
;
188 got_repo_get_gitconfig_remotes(int *nremotes
,
189 const struct got_remote_repo
**remotes
, struct got_repository
*repo
)
191 *nremotes
= repo
->ngitconfig_remotes
;
192 *remotes
= repo
->gitconfig_remotes
;
196 is_git_repo(struct got_repository
*repo
)
198 const char *path_git
= got_repo_get_path_git_dir(repo
);
199 char *path_objects
= got_repo_get_path_objects(repo
);
200 char *path_refs
= got_repo_get_path_refs(repo
);
201 char *path_head
= get_path_head(repo
);
204 struct got_reference
*head_ref
;
206 if (lstat(path_git
, &sb
) == -1)
208 if (!S_ISDIR(sb
.st_mode
))
211 if (lstat(path_objects
, &sb
) == -1)
213 if (!S_ISDIR(sb
.st_mode
))
216 if (lstat(path_refs
, &sb
) == -1)
218 if (!S_ISDIR(sb
.st_mode
))
221 if (lstat(path_head
, &sb
) == -1)
223 if (!S_ISREG(sb
.st_mode
))
226 /* Check if the HEAD reference can be opened. */
227 if (got_ref_open(&head_ref
, repo
, GOT_REF_HEAD
, 0) != NULL
)
229 got_ref_close(head_ref
);
240 const struct got_error
*
241 got_repo_cache_object(struct got_repository
*repo
, struct got_object_id
*id
,
242 struct got_object
*obj
)
244 #ifndef GOT_NO_OBJ_CACHE
245 const struct got_error
*err
= NULL
;
246 err
= got_object_cache_add(&repo
->objcache
, id
, obj
);
248 if (err
->code
== GOT_ERR_OBJ_EXISTS
||
249 err
->code
== GOT_ERR_OBJ_TOO_LARGE
)
259 got_repo_get_cached_object(struct got_repository
*repo
,
260 struct got_object_id
*id
)
262 return (struct got_object
*)got_object_cache_get(&repo
->objcache
, id
);
265 const struct got_error
*
266 got_repo_cache_tree(struct got_repository
*repo
, struct got_object_id
*id
,
267 struct got_tree_object
*tree
)
269 #ifndef GOT_NO_OBJ_CACHE
270 const struct got_error
*err
= NULL
;
271 err
= got_object_cache_add(&repo
->treecache
, id
, tree
);
273 if (err
->code
== GOT_ERR_OBJ_EXISTS
||
274 err
->code
== GOT_ERR_OBJ_TOO_LARGE
)
283 struct got_tree_object
*
284 got_repo_get_cached_tree(struct got_repository
*repo
,
285 struct got_object_id
*id
)
287 return (struct got_tree_object
*)got_object_cache_get(
288 &repo
->treecache
, id
);
291 const struct got_error
*
292 got_repo_cache_commit(struct got_repository
*repo
, struct got_object_id
*id
,
293 struct got_commit_object
*commit
)
295 #ifndef GOT_NO_OBJ_CACHE
296 const struct got_error
*err
= NULL
;
297 err
= got_object_cache_add(&repo
->commitcache
, id
, commit
);
299 if (err
->code
== GOT_ERR_OBJ_EXISTS
||
300 err
->code
== GOT_ERR_OBJ_TOO_LARGE
)
309 struct got_commit_object
*
310 got_repo_get_cached_commit(struct got_repository
*repo
,
311 struct got_object_id
*id
)
313 return (struct got_commit_object
*)got_object_cache_get(
314 &repo
->commitcache
, id
);
317 const struct got_error
*
318 got_repo_cache_tag(struct got_repository
*repo
, struct got_object_id
*id
,
319 struct got_tag_object
*tag
)
321 #ifndef GOT_NO_OBJ_CACHE
322 const struct got_error
*err
= NULL
;
323 err
= got_object_cache_add(&repo
->tagcache
, id
, tag
);
325 if (err
->code
== GOT_ERR_OBJ_EXISTS
||
326 err
->code
== GOT_ERR_OBJ_TOO_LARGE
)
335 struct got_tag_object
*
336 got_repo_get_cached_tag(struct got_repository
*repo
, struct got_object_id
*id
)
338 return (struct got_tag_object
*)got_object_cache_get(
339 &repo
->tagcache
, id
);
342 static const struct got_error
*
343 open_repo(struct got_repository
*repo
, const char *path
)
345 const struct got_error
*err
= NULL
;
347 repo
->gitdir_fd
= -1;
349 /* bare git repository? */
350 repo
->path_git_dir
= strdup(path
);
351 if (repo
->path_git_dir
== NULL
)
352 return got_error_from_errno("strdup");
353 if (is_git_repo(repo
)) {
354 repo
->path
= strdup(repo
->path_git_dir
);
355 if (repo
->path
== NULL
) {
356 err
= got_error_from_errno("strdup");
359 repo
->gitdir_fd
= open(repo
->path_git_dir
, O_DIRECTORY
);
360 if (repo
->gitdir_fd
== -1) {
361 err
= got_error_from_errno2("open",
368 /* git repository with working tree? */
369 free(repo
->path_git_dir
);
370 repo
->path_git_dir
= NULL
;
371 if (asprintf(&repo
->path_git_dir
, "%s/%s", path
, GOT_GIT_DIR
) == -1) {
372 err
= got_error_from_errno("asprintf");
375 if (is_git_repo(repo
)) {
376 repo
->path
= strdup(path
);
377 if (repo
->path
== NULL
) {
378 err
= got_error_from_errno("strdup");
381 repo
->gitdir_fd
= open(repo
->path_git_dir
, O_DIRECTORY
);
382 if (repo
->gitdir_fd
== -1) {
383 err
= got_error_from_errno2("open",
390 err
= got_error(GOT_ERR_NOT_GIT_REPO
);
395 free(repo
->path_git_dir
);
396 repo
->path_git_dir
= NULL
;
397 if (repo
->gitdir_fd
!= -1)
398 close(repo
->gitdir_fd
);
399 repo
->gitdir_fd
= -1;
405 static const struct got_error
*
406 parse_gitconfig_file(int *gitconfig_repository_format_version
,
407 char **gitconfig_author_name
, char **gitconfig_author_email
,
408 struct got_remote_repo
**remotes
, int *nremotes
,
409 char **gitconfig_owner
, char ***extensions
, int *nextensions
,
410 const char *gitconfig_path
)
412 const struct got_error
*err
= NULL
, *child_err
= NULL
;
414 int imsg_fds
[2] = { -1, -1 };
416 struct imsgbuf
*ibuf
;
418 *gitconfig_repository_format_version
= 0;
423 *gitconfig_author_name
= NULL
;
424 *gitconfig_author_email
= NULL
;
430 *gitconfig_owner
= NULL
;
432 fd
= open(gitconfig_path
, O_RDONLY
);
436 return got_error_from_errno2("open", gitconfig_path
);
439 ibuf
= calloc(1, sizeof(*ibuf
));
441 err
= got_error_from_errno("calloc");
445 if (socketpair(AF_UNIX
, SOCK_STREAM
, PF_UNSPEC
, imsg_fds
) == -1) {
446 err
= got_error_from_errno("socketpair");
452 err
= got_error_from_errno("fork");
454 } else if (pid
== 0) {
455 got_privsep_exec_child(imsg_fds
, GOT_PATH_PROG_READ_GITCONFIG
,
460 if (close(imsg_fds
[1]) == -1) {
461 err
= got_error_from_errno("close");
465 imsg_init(ibuf
, imsg_fds
[0]);
467 err
= got_privsep_send_gitconfig_parse_req(ibuf
, fd
);
472 err
= got_privsep_send_gitconfig_repository_format_version_req(ibuf
);
476 err
= got_privsep_recv_gitconfig_int(
477 gitconfig_repository_format_version
, ibuf
);
481 if (extensions
&& nextensions
) {
482 err
= got_privsep_send_gitconfig_repository_extensions_req(
486 err
= got_privsep_recv_gitconfig_int(nextensions
, ibuf
);
489 if (*nextensions
> 0) {
491 *extensions
= calloc(*nextensions
, sizeof(char *));
492 if (*extensions
== NULL
) {
493 err
= got_error_from_errno("calloc");
496 for (i
= 0; i
< *nextensions
; i
++) {
498 err
= got_privsep_recv_gitconfig_str(&ext
,
502 (*extensions
)[i
] = ext
;
507 err
= got_privsep_send_gitconfig_author_name_req(ibuf
);
511 err
= got_privsep_recv_gitconfig_str(gitconfig_author_name
, ibuf
);
515 err
= got_privsep_send_gitconfig_author_email_req(ibuf
);
519 err
= got_privsep_recv_gitconfig_str(gitconfig_author_email
, ibuf
);
523 if (remotes
&& nremotes
) {
524 err
= got_privsep_send_gitconfig_remotes_req(ibuf
);
528 err
= got_privsep_recv_gitconfig_remotes(remotes
,
534 if (gitconfig_owner
) {
535 err
= got_privsep_send_gitconfig_owner_req(ibuf
);
538 err
= got_privsep_recv_gitconfig_str(gitconfig_owner
, ibuf
);
544 err
= got_privsep_send_stop(imsg_fds
[0]);
545 child_err
= got_privsep_wait_for_child(pid
);
546 if (child_err
&& err
== NULL
)
549 if (imsg_fds
[0] != -1 && close(imsg_fds
[0]) == -1 && err
== NULL
)
550 err
= got_error_from_errno("close");
551 if (imsg_fds
[1] != -1 && close(imsg_fds
[1]) == -1 && err
== NULL
)
552 err
= got_error_from_errno("close");
553 if (fd
!= -1 && close(fd
) == -1 && err
== NULL
)
554 err
= got_error_from_errno2("close", gitconfig_path
);
559 static const struct got_error
*
560 read_gitconfig(struct got_repository
*repo
, const char *global_gitconfig_path
)
562 const struct got_error
*err
= NULL
;
563 char *repo_gitconfig_path
= NULL
;
565 if (global_gitconfig_path
) {
566 /* Read settings from ~/.gitconfig. */
567 int dummy_repo_version
;
568 err
= parse_gitconfig_file(&dummy_repo_version
,
569 &repo
->global_gitconfig_author_name
,
570 &repo
->global_gitconfig_author_email
,
571 NULL
, NULL
, NULL
, NULL
, NULL
, global_gitconfig_path
);
576 /* Read repository's .git/config file. */
577 repo_gitconfig_path
= got_repo_get_path_gitconfig(repo
);
578 if (repo_gitconfig_path
== NULL
)
579 return got_error_from_errno("got_repo_get_path_gitconfig");
581 err
= parse_gitconfig_file(&repo
->gitconfig_repository_format_version
,
582 &repo
->gitconfig_author_name
, &repo
->gitconfig_author_email
,
583 &repo
->gitconfig_remotes
, &repo
->ngitconfig_remotes
,
584 &repo
->gitconfig_owner
, &repo
->extensions
, &repo
->nextensions
,
585 repo_gitconfig_path
);
589 free(repo_gitconfig_path
);
593 static const struct got_error
*
594 read_gotconfig(struct got_repository
*repo
)
596 const struct got_error
*err
= NULL
;
597 char *gotconfig_path
;
599 gotconfig_path
= got_repo_get_path_gotconfig(repo
);
600 if (gotconfig_path
== NULL
)
601 return got_error_from_errno("got_repo_get_path_gotconfig");
603 err
= got_gotconfig_read(&repo
->gotconfig
, gotconfig_path
);
604 free(gotconfig_path
);
/* Supported repository format extensions. */
static const char *repo_extensions[] = {
	"noop",			/* Got supports repository format version 1. */
	"preciousObjects",	/* Supported by gotadmin cleanup. */
	"worktreeConfig",	/* Got does not care about Git work trees. */
};
615 const struct got_error
*
616 got_repo_open(struct got_repository
**repop
, const char *path
,
617 const char *global_gitconfig_path
)
619 struct got_repository
*repo
= NULL
;
620 const struct got_error
*err
= NULL
;
621 char *repo_path
= NULL
;
627 if (getrlimit(RLIMIT_NOFILE
, &rl
) == -1)
628 return got_error_from_errno("getrlimit");
630 repo
= calloc(1, sizeof(*repo
));
632 err
= got_error_from_errno("calloc");
636 STAILQ_INIT(&repo
->packidx_bloom_filters
);
638 for (i
= 0; i
< nitems(repo
->privsep_children
); i
++) {
639 memset(&repo
->privsep_children
[i
], 0,
640 sizeof(repo
->privsep_children
[0]));
641 repo
->privsep_children
[i
].imsg_fd
= -1;
644 err
= got_object_cache_init(&repo
->objcache
,
645 GOT_OBJECT_CACHE_TYPE_OBJ
);
648 err
= got_object_cache_init(&repo
->treecache
,
649 GOT_OBJECT_CACHE_TYPE_TREE
);
652 err
= got_object_cache_init(&repo
->commitcache
,
653 GOT_OBJECT_CACHE_TYPE_COMMIT
);
656 err
= got_object_cache_init(&repo
->tagcache
,
657 GOT_OBJECT_CACHE_TYPE_TAG
);
661 repo
->pack_cache_size
= GOT_PACK_CACHE_SIZE
;
662 if (repo
->pack_cache_size
> rl
.rlim_cur
/ 8)
663 repo
->pack_cache_size
= rl
.rlim_cur
/ 8;
665 repo_path
= realpath(path
, NULL
);
666 if (repo_path
== NULL
) {
667 err
= got_error_from_errno2("realpath", path
);
674 err
= open_repo(repo
, repo_path
);
677 if (err
->code
!= GOT_ERR_NOT_GIT_REPO
)
679 if (repo_path
[0] == '/' && repo_path
[1] == '\0') {
680 err
= got_error(GOT_ERR_NOT_GIT_REPO
);
683 err
= got_path_dirname(&parent_path
, repo_path
);
687 repo_path
= parent_path
;
690 err
= read_gotconfig(repo
);
694 err
= read_gitconfig(repo
, global_gitconfig_path
);
697 if (repo
->gitconfig_repository_format_version
!= 0)
698 err
= got_error_path(path
, GOT_ERR_GIT_REPO_FORMAT
);
699 for (i
= 0; i
< repo
->nextensions
; i
++) {
700 char *ext
= repo
->extensions
[i
];
701 int j
, supported
= 0;
702 for (j
= 0; j
< nitems(repo_extensions
); j
++) {
703 if (strcmp(ext
, repo_extensions
[j
]) == 0) {
709 err
= got_error_path(ext
, GOT_ERR_GIT_REPO_EXT
);
715 got_repo_close(repo
);
722 const struct got_error
*
723 got_repo_close(struct got_repository
*repo
)
725 const struct got_error
*err
= NULL
, *child_err
;
728 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
729 if (repo
->packidx_cache
[i
] == NULL
)
731 got_packidx_close(repo
->packidx_cache
[i
]);
734 while (!STAILQ_EMPTY(&repo
->packidx_bloom_filters
)) {
735 struct got_packidx_bloom_filter
*bf
;
736 bf
= STAILQ_FIRST(&repo
->packidx_bloom_filters
);
737 STAILQ_REMOVE_HEAD(&repo
->packidx_bloom_filters
, entry
);
742 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
743 if (repo
->packs
[i
].path_packfile
== NULL
)
745 got_pack_close(&repo
->packs
[i
]);
749 free(repo
->path_git_dir
);
751 got_object_cache_close(&repo
->objcache
);
752 got_object_cache_close(&repo
->treecache
);
753 got_object_cache_close(&repo
->commitcache
);
754 got_object_cache_close(&repo
->tagcache
);
756 for (i
= 0; i
< nitems(repo
->privsep_children
); i
++) {
757 if (repo
->privsep_children
[i
].imsg_fd
== -1)
759 imsg_clear(repo
->privsep_children
[i
].ibuf
);
760 free(repo
->privsep_children
[i
].ibuf
);
761 err
= got_privsep_send_stop(repo
->privsep_children
[i
].imsg_fd
);
762 child_err
= got_privsep_wait_for_child(
763 repo
->privsep_children
[i
].pid
);
764 if (child_err
&& err
== NULL
)
766 if (close(repo
->privsep_children
[i
].imsg_fd
) == -1 &&
768 err
= got_error_from_errno("close");
771 if (repo
->gitdir_fd
!= -1 && close(repo
->gitdir_fd
) == -1 &&
773 err
= got_error_from_errno("close");
776 got_gotconfig_free(repo
->gotconfig
);
777 free(repo
->gitconfig_author_name
);
778 free(repo
->gitconfig_author_email
);
779 for (i
= 0; i
< repo
->ngitconfig_remotes
; i
++)
780 got_repo_free_remote_repo_data(&repo
->gitconfig_remotes
[i
]);
781 free(repo
->gitconfig_remotes
);
782 for (i
= 0; i
< repo
->nextensions
; i
++)
783 free(repo
->extensions
[i
]);
784 free(repo
->extensions
);
791 got_repo_free_remote_repo_data(struct got_remote_repo
*repo
)
797 free(repo
->fetch_url
);
798 repo
->fetch_url
= NULL
;
799 free(repo
->send_url
);
800 repo
->send_url
= NULL
;
801 for (i
= 0; i
< repo
->nfetch_branches
; i
++)
802 free(repo
->fetch_branches
[i
]);
803 free(repo
->fetch_branches
);
804 repo
->fetch_branches
= NULL
;
805 repo
->nfetch_branches
= 0;
806 for (i
= 0; i
< repo
->nsend_branches
; i
++)
807 free(repo
->send_branches
[i
]);
808 free(repo
->send_branches
);
809 repo
->send_branches
= NULL
;
810 repo
->nsend_branches
= 0;
813 const struct got_error
*
814 got_repo_map_path(char **in_repo_path
, struct got_repository
*repo
,
815 const char *input_path
)
817 const struct got_error
*err
= NULL
;
818 const char *repo_abspath
= NULL
;
820 char *canonpath
, *path
= NULL
;
822 *in_repo_path
= NULL
;
824 canonpath
= strdup(input_path
);
825 if (canonpath
== NULL
) {
826 err
= got_error_from_errno("strdup");
829 err
= got_canonpath(input_path
, canonpath
, strlen(canonpath
) + 1);
833 repo_abspath
= got_repo_get_path(repo
);
835 if (canonpath
[0] == '\0') {
836 path
= strdup(canonpath
);
838 err
= got_error_from_errno("strdup");
842 path
= realpath(canonpath
, NULL
);
844 if (errno
!= ENOENT
) {
845 err
= got_error_from_errno2("realpath",
850 * Path is not on disk.
851 * Assume it is already relative to repository root.
853 path
= strdup(canonpath
);
855 err
= got_error_from_errno("strdup");
860 repolen
= strlen(repo_abspath
);
864 if (strcmp(path
, repo_abspath
) == 0) {
868 err
= got_error_from_errno("strdup");
871 } else if (len
> repolen
&&
872 got_path_is_child(path
, repo_abspath
, repolen
)) {
873 /* Matched an on-disk path inside repository. */
874 if (got_repo_is_bare(repo
)) {
876 * Matched an on-disk path inside repository
877 * database. Treat input as repository-relative.
884 /* Strip common prefix with repository path. */
885 err
= got_path_skip_common_ancestor(&child
,
894 * Matched unrelated on-disk path.
895 * Treat input as repository-relative.
903 /* Make in-repository path absolute */
904 if (path
[0] != '/') {
906 if (asprintf(&abspath
, "/%s", path
) == -1) {
907 err
= got_error_from_errno("asprintf");
919 *in_repo_path
= path
;
923 static const struct got_error
*
924 cache_packidx(struct got_repository
*repo
, struct got_packidx
*packidx
,
925 const char *path_packidx
)
927 const struct got_error
*err
= NULL
;
930 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
931 if (repo
->packidx_cache
[i
] == NULL
)
933 if (strcmp(repo
->packidx_cache
[i
]->path_packidx
,
934 path_packidx
) == 0) {
935 return got_error(GOT_ERR_CACHE_DUP_ENTRY
);
938 if (i
== repo
->pack_cache_size
) {
939 i
= repo
->pack_cache_size
- 1;
940 err
= got_packidx_close(repo
->packidx_cache
[i
]);
945 repo
->packidx_cache
[i
] = packidx
;
951 got_repo_is_packidx_filename(const char *name
, size_t len
)
953 if (len
!= GOT_PACKIDX_NAMELEN
)
956 if (strncmp(name
, GOT_PACK_PREFIX
, strlen(GOT_PACK_PREFIX
)) != 0)
959 if (strcmp(name
+ strlen(GOT_PACK_PREFIX
) +
960 SHA1_DIGEST_STRING_LENGTH
- 1, GOT_PACKIDX_SUFFIX
) != 0)
967 check_packidx_bloom_filter(struct got_repository
*repo
,
968 const char *path_packidx
, struct got_object_id
*id
)
970 struct got_packidx_bloom_filter
*bf
;
972 STAILQ_FOREACH(bf
, &repo
->packidx_bloom_filters
, entry
) {
973 if (got_path_cmp(bf
->path_packidx
, path_packidx
,
974 bf
->path_packidx_len
, strlen(path_packidx
)) == 0) {
975 return bloom_check(bf
->bloom
, id
->sha1
,
980 /* No bloom filter means this pack index must be searched. */
984 static const struct got_error
*
985 add_packidx_bloom_filter(struct got_repository
*repo
,
986 struct got_packidx
*packidx
, const char *path_packidx
)
988 int i
, nobjects
= be32toh(packidx
->hdr
.fanout_table
[0xff]);
989 struct got_packidx_bloom_filter
*bf
;
993 * Don't use bloom filters for very large pack index files.
994 * Large pack files will contain a relatively large fraction
995 * of our objects so we will likely need to visit them anyway.
996 * The more objects a pack file contains the higher the probability
997 * of a false-positive match from the bloom filter. And reading
998 * all object IDs from a large pack index file can be expensive.
1000 if (nobjects
> 100000) /* cut-off at about 2MB, at 20 bytes per ID */
1003 /* Do we already have a filter for this pack index? */
1004 STAILQ_FOREACH(bf
, &repo
->packidx_bloom_filters
, entry
) {
1005 if (got_path_cmp(bf
->path_packidx
, path_packidx
,
1006 bf
->path_packidx_len
, strlen(path_packidx
)) == 0)
1010 bf
= calloc(1, sizeof(*bf
));
1012 return got_error_from_errno("calloc");
1013 bf
->bloom
= calloc(1, sizeof(*bf
->bloom
));
1014 if (bf
->bloom
== NULL
) {
1016 return got_error_from_errno("calloc");
1020 len
= strlcpy(bf
->path_packidx
, path_packidx
, sizeof(bf
->path_packidx
));
1021 if (len
>= sizeof(bf
->path_packidx
)) {
1024 return got_error(GOT_ERR_NO_SPACE
);
1026 bf
->path_packidx_len
= len
;
1028 /* Minimum size supported by our bloom filter is 1000 entries. */
1029 bloom_init(bf
->bloom
, nobjects
< 1000 ? 1000 : nobjects
, 0.1);
1030 for (i
= 0; i
< nobjects
; i
++) {
1031 struct got_packidx_object_id
*id
;
1032 id
= &packidx
->hdr
.sorted_ids
[i
];
1033 bloom_add(bf
->bloom
, id
->sha1
, sizeof(id
->sha1
));
1036 STAILQ_INSERT_TAIL(&repo
->packidx_bloom_filters
, bf
, entry
);
1040 const struct got_error
*
1041 got_repo_search_packidx(struct got_packidx
**packidx
, int *idx
,
1042 struct got_repository
*repo
, struct got_object_id
*id
)
1044 const struct got_error
*err
;
1045 DIR *packdir
= NULL
;
1046 struct dirent
*dent
;
1051 /* Search pack index cache. */
1052 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
1053 if (repo
->packidx_cache
[i
] == NULL
)
1055 if (!check_packidx_bloom_filter(repo
,
1056 repo
->packidx_cache
[i
]->path_packidx
, id
))
1057 continue; /* object will not be found in this index */
1058 *idx
= got_packidx_get_object_idx(repo
->packidx_cache
[i
], id
);
1060 *packidx
= repo
->packidx_cache
[i
];
1062 * Move this cache entry to the front. Repeatedly
1063 * searching a wrong pack index can be expensive.
1066 memmove(&repo
->packidx_cache
[1],
1067 &repo
->packidx_cache
[0],
1068 i
* sizeof(repo
->packidx_cache
[0]));
1069 repo
->packidx_cache
[0] = *packidx
;
1074 /* No luck. Search the filesystem. */
1076 packdir_fd
= openat(got_repo_get_fd(repo
),
1077 GOT_OBJECTS_PACK_DIR
, O_DIRECTORY
);
1078 if (packdir_fd
== -1) {
1079 if (errno
== ENOENT
)
1080 err
= got_error_no_obj(id
);
1082 err
= got_error_from_errno_fmt("openat: %s/%s",
1083 got_repo_get_path_git_dir(repo
),
1084 GOT_OBJECTS_PACK_DIR
);
1088 packdir
= fdopendir(packdir_fd
);
1089 if (packdir
== NULL
) {
1090 err
= got_error_from_errno("fdopendir");
1094 while ((dent
= readdir(packdir
)) != NULL
) {
1097 if (!got_repo_is_packidx_filename(dent
->d_name
,
1098 strlen(dent
->d_name
)))
1101 if (asprintf(&path_packidx
, "%s/%s", GOT_OBJECTS_PACK_DIR
,
1102 dent
->d_name
) == -1) {
1103 err
= got_error_from_errno("asprintf");
1107 if (!check_packidx_bloom_filter(repo
, path_packidx
, id
)) {
1109 continue; /* object will not be found in this index */
1112 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
1113 if (repo
->packidx_cache
[i
] == NULL
)
1115 if (strcmp(repo
->packidx_cache
[i
]->path_packidx
,
1116 path_packidx
) == 0) {
1123 continue; /* already searched */
1126 err
= got_packidx_open(packidx
, got_repo_get_fd(repo
),
1133 err
= add_packidx_bloom_filter(repo
, *packidx
, path_packidx
);
1139 err
= cache_packidx(repo
, *packidx
, path_packidx
);
1144 *idx
= got_packidx_get_object_idx(*packidx
, id
);
1146 err
= NULL
; /* found the object */
1151 err
= got_error_no_obj(id
);
1153 if (packdir
&& closedir(packdir
) != 0 && err
== NULL
)
1154 err
= got_error_from_errno("closedir");
1158 static const struct got_error
*
1159 read_packfile_hdr(int fd
, struct got_packidx
*packidx
)
1161 const struct got_error
*err
= NULL
;
1162 uint32_t totobj
= be32toh(packidx
->hdr
.fanout_table
[0xff]);
1163 struct got_packfile_hdr hdr
;
1166 n
= read(fd
, &hdr
, sizeof(hdr
));
1168 return got_error_from_errno("read");
1169 if (n
!= sizeof(hdr
))
1170 return got_error(GOT_ERR_BAD_PACKFILE
);
1172 if (be32toh(hdr
.signature
) != GOT_PACKFILE_SIGNATURE
||
1173 be32toh(hdr
.version
) != GOT_PACKFILE_VERSION
||
1174 be32toh(hdr
.nobjects
) != totobj
)
1175 err
= got_error(GOT_ERR_BAD_PACKFILE
);
1180 static const struct got_error
*
1181 open_packfile(int *fd
, struct got_repository
*repo
,
1182 const char *relpath
, struct got_packidx
*packidx
)
1184 const struct got_error
*err
= NULL
;
1186 *fd
= openat(got_repo_get_fd(repo
), relpath
, O_RDONLY
| O_NOFOLLOW
);
1188 return got_error_from_errno_fmt("openat: %s/%s",
1189 got_repo_get_path_git_dir(repo
), relpath
);
1192 err
= read_packfile_hdr(*fd
, packidx
);
1202 const struct got_error
*
1203 got_repo_cache_pack(struct got_pack
**packp
, struct got_repository
*repo
,
1204 const char *path_packfile
, struct got_packidx
*packidx
)
1206 const struct got_error
*err
= NULL
;
1207 struct got_pack
*pack
= NULL
;
1214 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
1215 pack
= &repo
->packs
[i
];
1216 if (pack
->path_packfile
== NULL
)
1218 if (strcmp(pack
->path_packfile
, path_packfile
) == 0)
1219 return got_error(GOT_ERR_CACHE_DUP_ENTRY
);
1222 if (i
== repo
->pack_cache_size
) {
1223 err
= got_pack_close(&repo
->packs
[i
- 1]);
1226 memmove(&repo
->packs
[1], &repo
->packs
[0],
1227 sizeof(repo
->packs
) - sizeof(repo
->packs
[0]));
1231 pack
= &repo
->packs
[i
];
1233 pack
->path_packfile
= strdup(path_packfile
);
1234 if (pack
->path_packfile
== NULL
) {
1235 err
= got_error_from_errno("strdup");
1239 err
= open_packfile(&pack
->fd
, repo
, path_packfile
, packidx
);
1243 if (fstat(pack
->fd
, &sb
) != 0) {
1244 err
= got_error_from_errno("fstat");
1247 pack
->filesize
= sb
.st_size
;
1249 pack
->privsep_child
= NULL
;
1251 #ifndef GOT_PACK_NO_MMAP
1252 pack
->map
= mmap(NULL
, pack
->filesize
, PROT_READ
, MAP_PRIVATE
,
1254 if (pack
->map
== MAP_FAILED
) {
1255 if (errno
!= ENOMEM
) {
1256 err
= got_error_from_errno("mmap");
1259 pack
->map
= NULL
; /* fall back to read(2) */
1265 free(pack
->path_packfile
);
1266 memset(pack
, 0, sizeof(*pack
));
1274 got_repo_get_cached_pack(struct got_repository
*repo
, const char *path_packfile
)
1276 struct got_pack
*pack
= NULL
;
1279 for (i
= 0; i
< repo
->pack_cache_size
; i
++) {
1280 pack
= &repo
->packs
[i
];
1281 if (pack
->path_packfile
== NULL
)
1283 if (strcmp(pack
->path_packfile
, path_packfile
) == 0)
1290 const struct got_error
*
1291 got_repo_init(const char *repo_path
)
1293 const struct got_error
*err
= NULL
;
1294 const char *dirnames
[] = {
1296 GOT_OBJECTS_PACK_DIR
,
1299 const char *description_str
= "Unnamed repository; "
1300 "edit this file 'description' to name the repository.";
1301 const char *headref_str
= "ref: refs/heads/main";
1302 const char *gitconfig_str
= "[core]\n"
1303 "\trepositoryformatversion = 0\n"
1304 "\tfilemode = true\n"
1309 if (!got_path_dir_is_empty(repo_path
))
1310 return got_error(GOT_ERR_DIR_NOT_EMPTY
);
1312 for (i
= 0; i
< nitems(dirnames
); i
++) {
1313 if (asprintf(&path
, "%s/%s", repo_path
, dirnames
[i
]) == -1) {
1314 return got_error_from_errno("asprintf");
1316 err
= got_path_mkdir(path
);
1322 if (asprintf(&path
, "%s/%s", repo_path
, "description") == -1)
1323 return got_error_from_errno("asprintf");
1324 err
= got_path_create_file(path
, description_str
);
1329 if (asprintf(&path
, "%s/%s", repo_path
, GOT_HEAD_FILE
) == -1)
1330 return got_error_from_errno("asprintf");
1331 err
= got_path_create_file(path
, headref_str
);
1336 if (asprintf(&path
, "%s/%s", repo_path
, "config") == -1)
1337 return got_error_from_errno("asprintf");
1338 err
= got_path_create_file(path
, gitconfig_str
);
1346 static const struct got_error
*
1347 match_packed_object(struct got_object_id
**unique_id
,
1348 struct got_repository
*repo
, const char *id_str_prefix
, int obj_type
)
1350 const struct got_error
*err
= NULL
;
1351 DIR *packdir
= NULL
;
1352 struct dirent
*dent
;
1354 struct got_object_id_queue matched_ids
;
1357 STAILQ_INIT(&matched_ids
);
1359 packdir_fd
= openat(got_repo_get_fd(repo
),
1360 GOT_OBJECTS_PACK_DIR
, O_DIRECTORY
);
1361 if (packdir_fd
== -1) {
1362 if (errno
!= ENOENT
)
1363 err
= got_error_from_errno2("openat", GOT_OBJECTS_PACK_DIR
);
1367 packdir
= fdopendir(packdir_fd
);
1368 if (packdir
== NULL
) {
1369 err
= got_error_from_errno("fdopendir");
1373 while ((dent
= readdir(packdir
)) != NULL
) {
1374 struct got_packidx
*packidx
;
1375 struct got_object_qid
*qid
;
1377 if (!got_repo_is_packidx_filename(dent
->d_name
,
1378 strlen(dent
->d_name
)))
1381 if (asprintf(&path_packidx
, "%s/%s", GOT_OBJECTS_PACK_DIR
,
1382 dent
->d_name
) == -1) {
1383 err
= got_error_from_errno("strdup");
1387 err
= got_packidx_open(&packidx
, got_repo_get_fd(repo
),
1393 err
= got_packidx_match_id_str_prefix(&matched_ids
,
1394 packidx
, id_str_prefix
);
1396 got_packidx_close(packidx
);
1399 err
= got_packidx_close(packidx
);
1403 STAILQ_FOREACH(qid
, &matched_ids
, entry
) {
1404 if (obj_type
!= GOT_OBJ_TYPE_ANY
) {
1406 err
= got_object_get_type(&matched_type
, repo
,
1410 if (matched_type
!= obj_type
)
1413 if (*unique_id
== NULL
) {
1414 *unique_id
= got_object_id_dup(qid
->id
);
1415 if (*unique_id
== NULL
) {
1416 err
= got_error_from_errno("malloc");
1420 if (got_object_id_cmp(*unique_id
, qid
->id
) == 0)
1421 continue; /* packed multiple times */
1422 err
= got_error(GOT_ERR_AMBIGUOUS_ID
);
1428 got_object_id_queue_free(&matched_ids
);
1429 if (packdir
&& closedir(packdir
) != 0 && err
== NULL
)
1430 err
= got_error_from_errno("closedir");
1438 static const struct got_error
*
1439 match_loose_object(struct got_object_id
**unique_id
, const char *path_objects
,
1440 const char *object_dir
, const char *id_str_prefix
, int obj_type
,
1441 struct got_repository
*repo
)
1443 const struct got_error
*err
= NULL
;
1446 struct dirent
*dent
;
1447 struct got_object_id id
;
1449 if (asprintf(&path
, "%s/%s", path_objects
, object_dir
) == -1) {
1450 err
= got_error_from_errno("asprintf");
1454 dir
= opendir(path
);
1456 if (errno
== ENOENT
) {
1460 err
= got_error_from_errno2("opendir", path
);
1463 while ((dent
= readdir(dir
)) != NULL
) {
1467 if (strcmp(dent
->d_name
, ".") == 0 ||
1468 strcmp(dent
->d_name
, "..") == 0)
1471 if (asprintf(&id_str
, "%s%s", object_dir
, dent
->d_name
) == -1) {
1472 err
= got_error_from_errno("asprintf");
1476 if (!got_parse_sha1_digest(id
.sha1
, id_str
))
1480 * Directory entries do not necessarily appear in
1481 * sorted order, so we must iterate over all of them.
1483 cmp
= strncmp(id_str
, id_str_prefix
, strlen(id_str_prefix
));
1489 if (*unique_id
== NULL
) {
1490 if (obj_type
!= GOT_OBJ_TYPE_ANY
) {
1492 err
= got_object_get_type(&matched_type
, repo
,
1496 if (matched_type
!= obj_type
)
1499 *unique_id
= got_object_id_dup(&id
);
1500 if (*unique_id
== NULL
) {
1501 err
= got_error_from_errno("got_object_id_dup");
1506 if (got_object_id_cmp(*unique_id
, &id
) == 0)
1507 continue; /* both packed and loose */
1508 err
= got_error(GOT_ERR_AMBIGUOUS_ID
);
1514 if (dir
&& closedir(dir
) != 0 && err
== NULL
)
1515 err
= got_error_from_errno("closedir");
1524 const struct got_error
*
1525 got_repo_match_object_id_prefix(struct got_object_id
**id
,
1526 const char *id_str_prefix
, int obj_type
, struct got_repository
*repo
)
1528 const struct got_error
*err
= NULL
;
1529 char *path_objects
= got_repo_get_path_objects(repo
);
1530 char *object_dir
= NULL
;
1536 for (i
= 0; i
< strlen(id_str_prefix
); i
++) {
1537 if (isxdigit((unsigned char)id_str_prefix
[i
]))
1539 return got_error_path(id_str_prefix
, GOT_ERR_BAD_OBJ_ID_STR
);
1542 len
= strlen(id_str_prefix
);
1544 err
= match_packed_object(id
, repo
, id_str_prefix
, obj_type
);
1547 object_dir
= strndup(id_str_prefix
, 2);
1548 if (object_dir
== NULL
) {
1549 err
= got_error_from_errno("strdup");
1552 err
= match_loose_object(id
, path_objects
, object_dir
,
1553 id_str_prefix
, obj_type
, repo
);
1554 } else if (len
== 1) {
1556 for (i
= 0; i
< 0xf; i
++) {
1557 if (asprintf(&object_dir
, "%s%.1x", id_str_prefix
, i
)
1559 err
= got_error_from_errno("asprintf");
1562 err
= match_packed_object(id
, repo
, object_dir
,
1566 err
= match_loose_object(id
, path_objects
, object_dir
,
1567 id_str_prefix
, obj_type
, repo
);
1572 err
= got_error_path(id_str_prefix
, GOT_ERR_BAD_OBJ_ID_STR
);
1580 } else if (*id
== NULL
) {
1582 case GOT_OBJ_TYPE_BLOB
:
1583 err
= got_error_fmt(GOT_ERR_NO_OBJ
, "%s %s",
1584 GOT_OBJ_LABEL_BLOB
, id_str_prefix
);
1586 case GOT_OBJ_TYPE_TREE
:
1587 err
= got_error_fmt(GOT_ERR_NO_OBJ
, "%s %s",
1588 GOT_OBJ_LABEL_TREE
, id_str_prefix
);
1590 case GOT_OBJ_TYPE_COMMIT
:
1591 err
= got_error_fmt(GOT_ERR_NO_OBJ
, "%s %s",
1592 GOT_OBJ_LABEL_COMMIT
, id_str_prefix
);
1594 case GOT_OBJ_TYPE_TAG
:
1595 err
= got_error_fmt(GOT_ERR_NO_OBJ
, "%s %s",
1596 GOT_OBJ_LABEL_TAG
, id_str_prefix
);
1599 err
= got_error_path(id_str_prefix
, GOT_ERR_NO_OBJ
);
1607 const struct got_error
*
1608 got_repo_match_object_id(struct got_object_id
**id
, char **label
,
1609 const char *id_str
, int obj_type
, struct got_reflist_head
*refs
,
1610 struct got_repository
*repo
)
1612 const struct got_error
*err
;
1613 struct got_tag_object
*tag
;
1614 struct got_reference
*ref
= NULL
;
1621 err
= got_repo_object_match_tag(&tag
, id_str
, obj_type
,
1624 *id
= got_object_id_dup(
1625 got_object_tag_get_object_id(tag
));
1627 err
= got_error_from_errno("got_object_id_dup");
1628 else if (label
&& asprintf(label
, "refs/tags/%s",
1629 got_object_tag_get_name(tag
)) == -1) {
1630 err
= got_error_from_errno("asprintf");
1634 got_object_tag_close(tag
);
1636 } else if (err
->code
!= GOT_ERR_OBJ_TYPE
&&
1637 err
->code
!= GOT_ERR_NO_OBJ
)
1641 err
= got_repo_match_object_id_prefix(id
, id_str
, obj_type
, repo
);
1643 if (err
->code
!= GOT_ERR_BAD_OBJ_ID_STR
)
1645 err
= got_ref_open(&ref
, repo
, id_str
, 0);
1649 *label
= strdup(got_ref_get_name(ref
));
1650 if (*label
== NULL
) {
1651 err
= got_error_from_errno("strdup");
1655 err
= got_ref_resolve(id
, repo
, ref
);
1657 err
= got_object_id_str(label
, *id
);
1658 if (*label
== NULL
) {
1659 err
= got_error_from_errno("strdup");
1669 const struct got_error
*
1670 got_repo_object_match_tag(struct got_tag_object
**tag
, const char *name
,
1671 int obj_type
, struct got_reflist_head
*refs
, struct got_repository
*repo
)
1673 const struct got_error
*err
= NULL
;
1674 struct got_reflist_entry
*re
;
1675 struct got_object_id
*tag_id
;
1676 int name_is_absolute
= (strncmp(name
, "refs/", 5) == 0);
1680 TAILQ_FOREACH(re
, refs
, entry
) {
1681 const char *refname
;
1682 refname
= got_ref_get_name(re
->ref
);
1683 if (got_ref_is_symbolic(re
->ref
))
1685 if (strncmp(refname
, "refs/tags/", 10) != 0)
1687 if (!name_is_absolute
)
1688 refname
+= strlen("refs/tags/");
1689 if (strcmp(refname
, name
) != 0)
1691 err
= got_ref_resolve(&tag_id
, repo
, re
->ref
);
1694 err
= got_object_open_as_tag(tag
, repo
, tag_id
);
1698 if (obj_type
== GOT_OBJ_TYPE_ANY
||
1699 got_object_tag_get_object_type(*tag
) == obj_type
)
1701 got_object_tag_close(*tag
);
1705 if (err
== NULL
&& *tag
== NULL
)
1706 err
= got_error_fmt(GOT_ERR_NO_OBJ
, "%s %s",
1707 GOT_OBJ_LABEL_TAG
, name
);
1711 static const struct got_error
*
1712 alloc_added_blob_tree_entry(struct got_tree_entry
**new_te
,
1713 const char *name
, mode_t mode
, struct got_object_id
*blob_id
)
1715 const struct got_error
*err
= NULL
;
1719 *new_te
= calloc(1, sizeof(**new_te
));
1720 if (*new_te
== NULL
)
1721 return got_error_from_errno("calloc");
1723 if (strlcpy((*new_te
)->name
, name
, sizeof((*new_te
)->name
)) >=
1724 sizeof((*new_te
)->name
)) {
1725 err
= got_error(GOT_ERR_NO_SPACE
);
1729 if (S_ISLNK(mode
)) {
1730 (*new_te
)->mode
= S_IFLNK
;
1732 (*new_te
)->mode
= S_IFREG
;
1733 (*new_te
)->mode
|= (mode
& (S_IRWXU
| S_IRWXG
| S_IRWXO
));
1735 memcpy(&(*new_te
)->id
, blob_id
, sizeof((*new_te
)->id
));
1737 if (err
&& *new_te
) {
/*
 * Import the file or symbolic link named by directory entry de, located
 * in directory path, as a blob and return a new tree entry for it in
 * *new_te. An empty path means the entry name is used as-is.
 */
static const struct got_error *
import_file(struct got_tree_entry **new_te, struct dirent *de,
    const char *path, struct got_repository *repo)
{
	const struct got_error *err;
	struct got_object_id *blob_id = NULL;
	char *filepath;
	struct stat sb;

	if (asprintf(&filepath, "%s%s%s", path,
	    path[0] == '\0' ? "" : "/", de->d_name) == -1)
		return got_error_from_errno("asprintf");

	if (lstat(filepath, &sb) != 0) {
		/* Name the file which could not be examined, not its parent. */
		err = got_error_from_errno2("lstat", filepath);
		goto done;
	}

	err = got_object_blob_create(&blob_id, filepath, repo);
	if (err)
		goto done;

	err = alloc_added_blob_tree_entry(new_te, de->d_name, sb.st_mode,
	    blob_id);
done:
	free(filepath);
	/* The tree entry holds its own copy of the ID. */
	free(blob_id);
	return err;
}
1775 static const struct got_error
*
1776 insert_tree_entry(struct got_tree_entry
*new_te
,
1777 struct got_pathlist_head
*paths
)
1779 const struct got_error
*err
= NULL
;
1780 struct got_pathlist_entry
*new_pe
;
1782 err
= got_pathlist_insert(&new_pe
, paths
, new_te
->name
, new_te
);
1786 return got_error(GOT_ERR_TREE_DUP_ENTRY
);
1790 static const struct got_error
*write_tree(struct got_object_id
**,
1791 const char *, struct got_pathlist_head
*, struct got_repository
*,
1792 got_repo_import_cb progress_cb
, void *progress_arg
);
1794 static const struct got_error
*
1795 import_subdir(struct got_tree_entry
**new_te
, struct dirent
*de
,
1796 const char *path
, struct got_pathlist_head
*ignores
,
1797 struct got_repository
*repo
,
1798 got_repo_import_cb progress_cb
, void *progress_arg
)
1800 const struct got_error
*err
;
1801 struct got_object_id
*id
= NULL
;
1804 if (asprintf(&subdirpath
, "%s%s%s", path
,
1805 path
[0] == '\0' ? "" : "/", de
->d_name
) == -1)
1806 return got_error_from_errno("asprintf");
1808 (*new_te
) = calloc(1, sizeof(**new_te
));
1809 if (*new_te
== NULL
)
1810 return got_error_from_errno("calloc");
1811 (*new_te
)->mode
= S_IFDIR
;
1812 if (strlcpy((*new_te
)->name
, de
->d_name
, sizeof((*new_te
)->name
)) >=
1813 sizeof((*new_te
)->name
)) {
1814 err
= got_error(GOT_ERR_NO_SPACE
);
1817 err
= write_tree(&id
, subdirpath
, ignores
, repo
,
1818 progress_cb
, progress_arg
);
1821 memcpy(&(*new_te
)->id
, id
, sizeof((*new_te
)->id
));
1833 static const struct got_error
*
1834 write_tree(struct got_object_id
**new_tree_id
, const char *path_dir
,
1835 struct got_pathlist_head
*ignores
, struct got_repository
*repo
,
1836 got_repo_import_cb progress_cb
, void *progress_arg
)
1838 const struct got_error
*err
= NULL
;
1842 struct got_tree_entry
*new_te
= NULL
;
1843 struct got_pathlist_head paths
;
1844 struct got_pathlist_entry
*pe
;
1846 *new_tree_id
= NULL
;
1850 dir
= opendir(path_dir
);
1852 err
= got_error_from_errno2("opendir", path_dir
);
1857 while ((de
= readdir(dir
)) != NULL
) {
1861 if (strcmp(de
->d_name
, ".") == 0 ||
1862 strcmp(de
->d_name
, "..") == 0)
1865 TAILQ_FOREACH(pe
, ignores
, entry
) {
1866 if (fnmatch(pe
->path
, de
->d_name
, 0) == 0) {
1874 err
= got_path_dirent_type(&type
, path_dir
, de
);
1878 if (type
== DT_DIR
) {
1879 err
= import_subdir(&new_te
, de
, path_dir
,
1880 ignores
, repo
, progress_cb
, progress_arg
);
1882 if (err
->code
!= GOT_ERR_NO_TREE_ENTRY
)
1887 } else if (type
== DT_REG
|| type
== DT_LNK
) {
1888 err
= import_file(&new_te
, de
, path_dir
, repo
);
1894 err
= insert_tree_entry(new_te
, &paths
);
1900 if (TAILQ_EMPTY(&paths
)) {
1901 err
= got_error_msg(GOT_ERR_NO_TREE_ENTRY
,
1902 "cannot create tree without any entries");
1906 TAILQ_FOREACH(pe
, &paths
, entry
) {
1907 struct got_tree_entry
*te
= pe
->data
;
1909 if (!S_ISREG(te
->mode
) && !S_ISLNK(te
->mode
))
1911 if (asprintf(&path
, "%s/%s", path_dir
, pe
->path
) == -1) {
1912 err
= got_error_from_errno("asprintf");
1915 err
= (*progress_cb
)(progress_arg
, path
);
1921 err
= got_object_tree_create(new_tree_id
, &paths
, nentries
, repo
);
1925 got_pathlist_free(&paths
);
1929 const struct got_error
*
1930 got_repo_import(struct got_object_id
**new_commit_id
, const char *path_dir
,
1931 const char *logmsg
, const char *author
, struct got_pathlist_head
*ignores
,
1932 struct got_repository
*repo
, got_repo_import_cb progress_cb
,
1935 const struct got_error
*err
;
1936 struct got_object_id
*new_tree_id
;
1938 err
= write_tree(&new_tree_id
, path_dir
, ignores
, repo
,
1939 progress_cb
, progress_arg
);
1943 err
= got_object_commit_create(new_commit_id
, new_tree_id
, NULL
, 0,
1944 author
, time(NULL
), author
, time(NULL
), logmsg
, repo
);
1949 const struct got_error
*
1950 got_repo_get_loose_object_info(int *nobjects
, off_t
*ondisk_size
,
1951 struct got_repository
*repo
)
1953 const struct got_error
*err
= NULL
;
1954 char *path_objects
= NULL
, *path
= NULL
;
1956 struct got_object_id id
;
1962 path_objects
= got_repo_get_path_objects(repo
);
1963 if (path_objects
== NULL
)
1964 return got_error_from_errno("got_repo_get_path_objects");
1966 for (i
= 0; i
<= 0xff; i
++) {
1967 struct dirent
*dent
;
1969 if (asprintf(&path
, "%s/%.2x", path_objects
, i
) == -1) {
1970 err
= got_error_from_errno("asprintf");
1974 dir
= opendir(path
);
1976 if (errno
== ENOENT
) {
1980 err
= got_error_from_errno2("opendir", path
);
1984 while ((dent
= readdir(dir
)) != NULL
) {
1989 if (strcmp(dent
->d_name
, ".") == 0 ||
1990 strcmp(dent
->d_name
, "..") == 0)
1993 if (asprintf(&id_str
, "%.2x%s", i
, dent
->d_name
) == -1) {
1994 err
= got_error_from_errno("asprintf");
1998 if (!got_parse_sha1_digest(id
.sha1
, id_str
)) {
2004 err
= got_object_open_loose_fd(&fd
, &id
, repo
);
2008 if (fstat(fd
, &sb
) == -1) {
2009 err
= got_error_from_errno("fstat");
2014 (*ondisk_size
) += sb
.st_size
;
2016 if (close(fd
) == -1) {
2017 err
= got_error_from_errno("close");
2022 if (closedir(dir
) != 0) {
2023 err
= got_error_from_errno("closedir");
2032 if (dir
&& closedir(dir
) != 0 && err
== NULL
)
2033 err
= got_error_from_errno("closedir");
2044 const struct got_error
*
2045 got_repo_get_packfile_info(int *npackfiles
, int *nobjects
,
2046 off_t
*total_packsize
, struct got_repository
*repo
)
2048 const struct got_error
*err
= NULL
;
2049 DIR *packdir
= NULL
;
2050 struct dirent
*dent
;
2051 struct got_packidx
*packidx
= NULL
;
2053 char *path_packfile
;
2059 *total_packsize
= 0;
2061 packdir_fd
= openat(got_repo_get_fd(repo
),
2062 GOT_OBJECTS_PACK_DIR
, O_DIRECTORY
);
2063 if (packdir_fd
== -1) {
2064 return got_error_from_errno_fmt("openat: %s/%s",
2065 got_repo_get_path_git_dir(repo
),
2066 GOT_OBJECTS_PACK_DIR
);
2069 packdir
= fdopendir(packdir_fd
);
2070 if (packdir
== NULL
) {
2071 err
= got_error_from_errno("fdopendir");
2075 while ((dent
= readdir(packdir
)) != NULL
) {
2076 if (!got_repo_is_packidx_filename(dent
->d_name
,
2077 strlen(dent
->d_name
)))
2080 if (asprintf(&path_packidx
, "%s/%s", GOT_OBJECTS_PACK_DIR
,
2081 dent
->d_name
) == -1) {
2082 err
= got_error_from_errno("asprintf");
2086 err
= got_packidx_open(&packidx
, got_repo_get_fd(repo
),
2092 if (fstat(packidx
->fd
, &sb
) == -1)
2094 *total_packsize
+= sb
.st_size
;
2096 err
= got_packidx_get_packfile_path(&path_packfile
,
2097 packidx
->path_packidx
);
2101 if (fstatat(got_repo_get_fd(repo
), path_packfile
, &sb
,
2103 free(path_packfile
);
2106 free(path_packfile
);
2107 *total_packsize
+= sb
.st_size
;
2109 *nobjects
+= be32toh(packidx
->hdr
.fanout_table
[0xff]);
2113 got_packidx_close(packidx
);
2118 got_packidx_close(packidx
);
2119 if (packdir
&& closedir(packdir
) != 0 && err
== NULL
)
2120 err
= got_error_from_errno("closedir");
2124 *total_packsize
= 0;