2 * Copyright (c) 2018, 2019 Stefan Sperling <stsp@openbsd.org>
4 * Permission to use, copy, modify, and distribute this software for any
5 * purpose with or without fee is hereby granted, provided that the above
6 * copyright notice and this permission notice appear in all copies.
8 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
17 #include <sys/types.h>
19 #include <sys/queue.h>
21 #include <sys/socket.h>
22 #include <sys/syslimits.h>
38 #include "got_error.h"
39 #include "got_object.h"
40 #include "got_repository.h"
41 #include "got_opentemp.h"
44 #include "got_lib_sha1.h"
45 #include "got_lib_delta.h"
46 #include "got_lib_inflate.h"
47 #include "got_lib_object.h"
48 #include "got_lib_object_cache.h"
49 #include "got_lib_pack.h"
50 #include "got_lib_privsep.h"
51 #include "got_lib_repository.h"
/* Element count of a true array _a; not meaningful when _a is a pointer. */
54 #define nitems(_a) (sizeof(_a) / sizeof((_a)[0]))
/*
 * Compare two object IDs by their SHA1 digests.
 * The result is that of memcmp() over SHA1_DIGEST_LENGTH bytes: zero when
 * the digests are identical, non-zero otherwise.
 */
58 got_object_id_cmp(const struct got_object_id *id1,
59 const struct got_object_id *id2)
61 return memcmp(id1->sha1, id2->sha1, SHA1_DIGEST_LENGTH);
/*
 * Allocate a queue ID entry together with the object ID it points to.
 * Both allocations use malloc(), so their contents are not initialized
 * here; a caller in this file fills in the SHA1 afterwards.
 * A failed allocation is reported as an errno-based "malloc" error.
 */
64 const struct got_error *
65 got_object_qid_alloc_partial(struct got_object_qid **qid)
67 const struct got_error *err = NULL;
69 *qid = malloc(sizeof(**qid));
71 return got_error_from_errno("malloc");
73 (*qid)->id = malloc(sizeof(*((*qid)->id)));
74 if ((*qid)->id == NULL) {
75 err = got_error_from_errno("malloc");
/* The outer entry was already allocated; release it before failing. */
76 got_object_qid_free(*qid);
/*
 * Produce the string form of an object ID's SHA1 digest.
 * *outbuf receives a malloc()ed buffer of SHA1_DIGEST_STRING_LENGTH bytes
 * which got_sha1_digest_to_str() fills in.
 * Errors: errno-based "malloc" error, or GOT_ERR_BAD_OBJ_ID_STR when the
 * conversion helper returns NULL.
 * NOTE(review): the caller presumably owns and frees *outbuf on success.
 */
84 const struct got_error *
85 got_object_id_str(char **outbuf, struct got_object_id *id)
87 static const size_t len = SHA1_DIGEST_STRING_LENGTH;
89 *outbuf = malloc(len);
91 return got_error_from_errno("malloc");
93 if (got_sha1_digest_to_str(id->sha1, *outbuf, len) == NULL) {
96 return got_error(GOT_ERR_BAD_OBJ_ID_STR);
/*
 * Release an object's resources.
 * The reference count is examined first; what happens while it is still
 * positive is not visible in this excerpt.
 */
103 got_object_close(struct got_object *obj)
105 if (obj->refcnt > 0) {
/* Deltified objects own a queue of deltas; drain it entry by entry. */
111 if (obj->flags & GOT_OBJ_FLAG_DELTIFIED) {
112 struct got_delta *delta;
113 while (!SIMPLEQ_EMPTY(&obj->deltas.entries)) {
114 delta = SIMPLEQ_FIRST(&obj->deltas.entries);
115 SIMPLEQ_REMOVE_HEAD(&obj->deltas.entries, entry);
116 free(delta->delta_buf);
/* Only packed objects have a pack file path to free. */
120 if (obj->flags & GOT_OBJ_FLAG_PACKED)
121 free(obj->path_packfile);
/*
 * Dispose of a queue ID entry. The body is not visible in this excerpt;
 * other functions in this file call it on error paths and when draining
 * an ID queue.
 */
126 got_object_qid_free(struct got_object_qid *qid)
/*
 * Empty an object ID queue: repeatedly unlink the head entry and pass it
 * to got_object_qid_free() until the queue is empty.
 */
133 got_object_id_queue_free(struct got_object_id_queue *ids)
135 struct got_object_qid *qid;
137 while (!SIMPLEQ_EMPTY(ids)) {
138 qid = SIMPLEQ_FIRST(ids);
139 SIMPLEQ_REMOVE_HEAD(ids, entry);
140 got_object_qid_free(qid);
/*
 * Parse an object header held in buf (at most len bytes) and allocate a
 * zero-initialized object for it in *obj.
 * The header is matched against a table of type labels; the text after the
 * matching label is parsed as the object size.
 * Errors: GOT_ERR_BAD_OBJ_HDR for a malformed header, or an errno-based
 * "calloc" error.
 */
144 const struct got_error *
145 got_object_parse_header(struct got_object **obj, char *buf, size_t len)
/* obj_labels and obj_types appear to be parallel tables (label -> type). */
147 const char *obj_labels[] = {
148 GOT_OBJ_LABEL_COMMIT,
153 const int obj_types[] = {
160 size_t size = 0, hdrlen = 0;
/* Header length counts the terminating NUL byte. */
165 hdrlen = strnlen(buf, len) + 1 /* '\0' */;
167 return got_error(GOT_ERR_BAD_OBJ_HDR);
169 for (i = 0; i < nitems(obj_labels); i++) {
170 const char *label = obj_labels[i];
171 size_t label_len = strlen(label);
174 if (strncmp(buf, label, label_len) != 0)
/* There must be data beyond the label for a size to be present. */
178 if (len <= label_len)
179 return got_error(GOT_ERR_BAD_OBJ_HDR);
/* strtonum() accepts only a decimal number in the range [0, LONG_MAX]. */
180 size = strtonum(buf + label_len, 0, LONG_MAX, &errstr);
182 return got_error(GOT_ERR_BAD_OBJ_HDR);
187 return got_error(GOT_ERR_BAD_OBJ_HDR);
189 *obj = calloc(1, sizeof(**obj));
191 return got_error_from_errno("calloc");
193 (*obj)->hdrlen = hdrlen;
/*
 * Read and parse an object header from the compressed data available on
 * file descriptor fd.
 * Data is inflated in steps into a heap buffer that starts at zbsize bytes
 * and is grown by one zbsize-sized unit whenever the bytes just inflated
 * contain no NUL. The accumulated buffer is then handed to
 * got_object_parse_header().
 */
198 const struct got_error *
199 got_object_read_header(struct got_object **obj, int fd)
201 const struct got_error *err;
202 struct got_inflate_buf zb;
204 const size_t zbsize = 64;
205 size_t outlen, totlen;
210 buf = malloc(zbsize);
212 return got_error_from_errno("malloc");
214 err = got_inflate_init(&zb, buf, zbsize);
220 err = got_inflate_read_fd(&zb, fd, &outlen);
/* No terminator in this chunk yet: enlarge the buffer and keep going. */
226 if (memchr(zb.outbuf, '\0', outlen) == NULL) {
/* recallocarray() zero-fills the newly added unit. */
229 newbuf = recallocarray(buf, nbuf - 1, nbuf, zbsize);
230 if (newbuf == NULL) {
231 err = got_error_from_errno("recallocarray");
/* Point the inflate output at the unused tail of the grown buffer. */
235 zb.outbuf = newbuf + totlen;
236 zb.outlen = (nbuf * zbsize) - totlen;
/*
 * NOTE(review): after a grow, zb.outbuf refers to the newly added region,
 * so this condition examines that region rather than the bytes that were
 * just inflated -- confirm this is the intended termination test.
 */
238 } while (memchr(zb.outbuf, '\0', outlen) == NULL);
240 err = got_object_parse_header(obj, buf, totlen);
243 got_inflate_end(&zb);
/*
 * Allocate a commit object: the structure itself is zero-initialized by
 * calloc(), tree_id is a separate malloc()ed (uninitialized) object ID,
 * and the parent ID queue is initialized empty.
 * NOTE(review): presumably returns NULL on allocation failure; the failure
 * branches are not visible in this excerpt.
 */
247 struct got_commit_object *
248 got_object_commit_alloc_partial(void)
250 struct got_commit_object *commit;
252 commit = calloc(1, sizeof(*commit));
255 commit->tree_id = malloc(sizeof(*commit->tree_id));
256 if (commit->tree_id == NULL) {
261 SIMPLEQ_INIT(&commit->parent_ids);
/*
 * Append a parent to a commit's parent ID queue.
 * A new queue entry is allocated, id_str is parsed into its SHA1, and the
 * entry is inserted at the tail of commit->parent_ids.
 * Errors: allocation errors from got_object_qid_alloc_partial(), or
 * GOT_ERR_BAD_OBJ_DATA when id_str does not parse as a SHA1 digest.
 */
266 const struct got_error *
267 got_object_commit_add_parent(struct got_commit_object *commit,
270 const struct got_error *err = NULL;
271 struct got_object_qid *qid;
273 err = got_object_qid_alloc_partial(&qid);
277 if (!got_parse_sha1_digest(qid->id->sha1, id_str)) {
278 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* The entry was never queued, so it must be released here. */
279 got_object_qid_free(qid);
283 SIMPLEQ_INSERT_TAIL(&commit->parent_ids, qid, entry);
/*
 * Convert a timezone string into an offset in seconds, stored in *gmtoff.
 * Two digits are read as hours and two further digits as minutes; the
 * result is (hours * 3600 + minutes * 60) multiplied by sign.
 * Malformed input yields GOT_ERR_BAD_OBJ_DATA.
 */
289 static const struct got_error *
290 parse_gmtoff(time_t *gmtoff, const char *tzstr)
293 const char *p = tzstr;
301 return got_error(GOT_ERR_BAD_OBJ_DATA);
/*
 * NOTE(review): with '&&' this rejects only when BOTH characters are
 * non-digits, so a single non-digit slips through; '||' looks intended.
 * isdigit() is also passed a plain char; a cast to unsigned char would
 * avoid undefined behavior for negative values.
 */
303 if (!isdigit(*p) && !isdigit(*(p + 1)))
304 return got_error(GOT_ERR_BAD_OBJ_DATA);
305 h = (((*p - '0') * 10) + (*(p + 1) - '0'));
/* NOTE(review): same '&&' versus '||' concern for the minutes digits. */
308 if (!isdigit(*p) && !isdigit(*(p + 1)))
309 return got_error(GOT_ERR_BAD_OBJ_DATA);
310 m = ((*p - '0') * 10) + (*(p + 1) - '0');
312 *gmtoff = (h * 60 * 60 + m * 60) * sign;
/*
 * Extract the timestamp and timezone offset found at the end of a
 * "name <email> timestamp timezone" string.
 * The string is processed from the right: the last space-separated field
 * is the timezone (parsed by parse_gmtoff()), the field before it is the
 * UNIX timestamp. Per the comments below, the parsed fields are stripped
 * so that committer is left holding only the name and email.
 * Errors: GOT_ERR_BAD_OBJ_DATA for missing or invalid fields, or an
 * errno-based "strdup" error.
 */
316 static const struct got_error *
317 parse_commit_time(time_t *time, time_t *gmtoff, char *committer)
319 const struct got_error *err = NULL;
323 /* Parse and strip off trailing timezone indicator string. */
324 space = strrchr(committer, ' ');
326 return got_error(GOT_ERR_BAD_OBJ_DATA);
327 tzstr = strdup(space + 1);
329 return got_error_from_errno("strdup");
330 err = parse_gmtoff(gmtoff, tzstr);
336 /* Timestamp is separated from committer name + email by space. */
337 space = strrchr(committer, ' ');
339 return got_error(GOT_ERR_BAD_OBJ_DATA);
341 /* Timestamp parsed here is expressed as UNIX timestamp (UTC). */
342 *time = strtonum(space + 1, 0, INT64_MAX, &errstr);
344 return got_error(GOT_ERR_BAD_OBJ_DATA);
346 /* Strip off parsed time information, leaving just author and email. */
/*
 * Release a commit object. The reference count is checked twice before
 * the parent ID queue, tree ID, author, committer and log message are
 * freed.
 * NOTE(review): presumably the count is decremented between the two checks
 * and the function returns early while references remain -- those lines
 * are not visible here.
 */
353 got_object_commit_close(struct got_commit_object *commit)
355 if (commit->refcnt > 0) {
357 if (commit->refcnt > 0)
361 got_object_id_queue_free(&commit->parent_ids);
362 free(commit->tree_id);
363 free(commit->author);
364 free(commit->committer);
365 free(commit->logmsg);
/* Return the commit's tree ID pointer; the commit keeps ownership. */
369 struct got_object_id *
370 got_object_commit_get_tree_id(struct got_commit_object *commit)
372 return commit->tree_id;
/* Return the commit's stored parent count (the nparents field). */
376 got_object_commit_get_nparents(struct got_commit_object *commit)
378 return commit->nparents;
/* Return a read-only pointer to the parent ID queue embedded in commit. */
381 const struct got_object_id_queue *
382 got_object_commit_get_parent_ids(struct got_commit_object *commit)
384 return &commit->parent_ids;
/* Return the commit's author string; the commit keeps ownership. */
388 got_object_commit_get_author(struct got_commit_object *commit)
390 return commit->author;
/* Return the author timestamp stored in the commit. */
394 got_object_commit_get_author_time(struct got_commit_object *commit)
396 return commit->author_time;
/* Return the author's timezone offset stored in the commit. */
399 time_t got_object_commit_get_author_gmtoff(struct got_commit_object *commit)
401 return commit->author_gmtoff;
/* Return the commit's committer string; the commit keeps ownership. */
405 got_object_commit_get_committer(struct got_commit_object *commit)
407 return commit->committer;
/* Return the committer timestamp stored in the commit. */
411 got_object_commit_get_committer_time(struct got_commit_object *commit)
413 return commit->committer_time;
/* Return the committer's timezone offset stored in the commit. */
417 got_object_commit_get_committer_gmtoff(struct got_commit_object *commit)
419 return commit->committer_gmtoff;
/*
 * Build a cleaned-up copy of the commit's log message in *logmsg.
 * The stored message is duplicated and walked line by line with strsep().
 * Each line is tested against the tree/author/parent/committer labels, and
 * lines are appended to *logmsg with a trailing newline via asprintf().
 * Finally, redundant trailing whitespace is trimmed.
 * Errors: errno-based "strdup" or "asprintf" errors.
 * NOTE(review): how a line that fails the label test is handled is not
 * visible in this excerpt.
 */
422 const struct got_error *
423 got_object_commit_get_logmsg(char **logmsg, struct got_commit_object *commit)
425 const struct got_error *err = NULL;
426 char *msg0, *msg, *line, *s;
/* Work on a private copy because strsep() modifies the string it scans. */
432 msg0 = strdup(commit->logmsg);
434 return got_error_from_errno("strdup");
436 /* Copy log message line by line to strip out unusual headers... */
439 if ((line = strsep(&msg, "\n")) == NULL)
/* True for a non-empty line that begins with none of the known labels. */
443 if (line[0] != '\0' &&
444 strncmp(line, GOT_COMMIT_LABEL_TREE,
445 strlen(GOT_COMMIT_LABEL_TREE)) != 0 &&
446 strncmp(line, GOT_COMMIT_LABEL_AUTHOR,
447 strlen(GOT_COMMIT_LABEL_AUTHOR)) != 0 &&
448 strncmp(line, GOT_COMMIT_LABEL_PARENT,
449 strlen(GOT_COMMIT_LABEL_PARENT)) != 0 &&
450 strncmp(line, GOT_COMMIT_LABEL_COMMITTER,
451 strlen(GOT_COMMIT_LABEL_COMMITTER)) != 0)
/* Append the line to what has been accumulated so far (if anything). */
458 if (asprintf(&s, "%s%s\n",
459 *logmsg ? *logmsg : "", line) == -1) {
460 err = got_error_from_errno("asprintf");
468 /* Trim redundant trailing whitespace. */
469 len = strlen(*logmsg);
/* Drop the last character while the final two are both whitespace. */
470 while (len > 1 && isspace((unsigned char)(*logmsg)[len - 2]) &&
471 isspace((unsigned char)(*logmsg)[len - 1])) {
472 (*logmsg)[len - 1] = '\0';
/* Return the commit's stored log message pointer without any filtering. */
485 got_object_commit_get_logmsg_raw(struct got_commit_object *commit)
487 return commit->logmsg;
/*
 * Parse the textual body of a commit object into a newly allocated commit.
 * Fields are consumed in order: the tree ID, any number of parent IDs, the
 * author line, the committer line, and finally the remaining bytes as the
 * log message. A signed running count of unconsumed bytes (remain) guards
 * each step.
 * Errors: GOT_ERR_BAD_OBJ_DATA for malformed input, or errno-based
 * allocation errors.
 */
490 const struct got_error *
491 got_object_parse_commit(struct got_commit_object **commit, char *buf,
494 const struct got_error *err = NULL;
497 ssize_t remain = (ssize_t)len;
500 return got_error(GOT_ERR_BAD_OBJ_DATA);
502 *commit = got_object_commit_alloc_partial();
504 return got_error_from_errno("got_object_commit_alloc_partial");
/* Tree ID. */
506 label_len = strlen(GOT_COMMIT_LABEL_TREE);
507 if (strncmp(s, GOT_COMMIT_LABEL_TREE, label_len) == 0) {
/* A full digest string must still fit in the remaining input. */
509 if (remain < SHA1_DIGEST_STRING_LENGTH) {
510 err = got_error(GOT_ERR_BAD_OBJ_DATA);
514 if (!got_parse_sha1_digest((*commit)->tree_id->sha1, s)) {
515 err = got_error(GOT_ERR_BAD_OBJ_DATA);
518 remain -= SHA1_DIGEST_STRING_LENGTH;
519 s += SHA1_DIGEST_STRING_LENGTH;
521 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* Zero or more parent IDs. */
525 label_len = strlen(GOT_COMMIT_LABEL_PARENT);
526 while (strncmp(s, GOT_COMMIT_LABEL_PARENT, label_len) == 0) {
528 if (remain < SHA1_DIGEST_STRING_LENGTH) {
529 err = got_error(GOT_ERR_BAD_OBJ_DATA);
533 err = got_object_commit_add_parent(*commit, s);
537 remain -= SHA1_DIGEST_STRING_LENGTH;
538 s += SHA1_DIGEST_STRING_LENGTH;
/* Author line: located by its newline, then split into time and name. */
541 label_len = strlen(GOT_COMMIT_LABEL_AUTHOR);
542 if (strncmp(s, GOT_COMMIT_LABEL_AUTHOR, label_len) == 0) {
548 err = got_error(GOT_ERR_BAD_OBJ_DATA);
552 p = memchr(s, '\n', remain);
554 err = got_error(GOT_ERR_BAD_OBJ_DATA);
559 err = parse_commit_time(&(*commit)->author_time,
560 &(*commit)->author_gmtoff, s);
563 (*commit)->author = strdup(s);
564 if ((*commit)->author == NULL) {
565 err = got_error_from_errno("strdup");
/* Committer line: handled the same way as the author line. */
572 label_len = strlen(GOT_COMMIT_LABEL_COMMITTER);
573 if (strncmp(s, GOT_COMMIT_LABEL_COMMITTER, label_len) == 0) {
579 err = got_error(GOT_ERR_BAD_OBJ_DATA);
583 p = memchr(s, '\n', remain);
585 err = got_error(GOT_ERR_BAD_OBJ_DATA);
590 err = parse_commit_time(&(*commit)->committer_time,
591 &(*commit)->committer_gmtoff, s);
594 (*commit)->committer = strdup(s);
595 if ((*commit)->committer == NULL) {
596 err = got_error_from_errno("strdup");
/* Everything left over is the log message. */
603 (*commit)->logmsg = strndup(s, remain);
604 if ((*commit)->logmsg == NULL) {
605 err = got_error_from_errno("strndup");
/* NOTE(review): presumably reached only on error, to discard the commit. */
610 got_object_commit_close(*commit);
/*
 * Dispose of a single tree entry. The body is not visible in this excerpt;
 * other functions in this file call it when draining an entry list and
 * from parse_tree_entry().
 */
617 got_object_tree_entry_close(struct got_tree_entry *te)
/*
 * Empty a tree entry list: repeatedly unlink the head entry and hand it to
 * got_object_tree_entry_close() until the list is empty.
 */
625 got_object_tree_entries_close(struct got_tree_entries *entries)
627 struct got_tree_entry *te;
629 while (!SIMPLEQ_EMPTY(&entries->head)) {
630 te = SIMPLEQ_FIRST(&entries->head);
631 SIMPLEQ_REMOVE_HEAD(&entries->head, entry);
632 got_object_tree_entry_close(te);
/*
 * Release a tree object. The reference count is checked twice before the
 * tree's entries are closed.
 * NOTE(review): presumably the count is decremented between the checks and
 * the function returns early while references remain -- not visible here.
 */
637 got_object_tree_close(struct got_tree_object *tree)
639 if (tree->refcnt > 0) {
641 if (tree->refcnt > 0)
645 got_object_tree_entries_close(&tree->entries);
/*
 * Allocate a tree entry and the object ID it points to. Both come from
 * malloc(), so their contents are not initialized by these calls.
 * NOTE(review): presumably returns NULL on allocation failure; the failure
 * branches are not visible in this excerpt.
 */
649 struct got_tree_entry *
650 got_alloc_tree_entry_partial(void)
652 struct got_tree_entry *te;
654 te = malloc(sizeof(*te));
658 te->id = malloc(sizeof(*te->id));
659 if (te->id == NULL) {
/*
 * Parse one tree entry from buf, which holds at most maxlen bytes.
 * The entry is a NUL-terminated text part (octal mode digits, a space,
 * then the name), with SHA1_DIGEST_LENGTH bytes of digest also required.
 * *elen receives the number of bytes consumed, digest included.
 * Errors: GOT_ERR_BAD_OBJ_DATA for malformed input, or an errno-based
 * allocation error.
 */
666 static const struct got_error *
667 parse_tree_entry(struct got_tree_entry **te, size_t *elen, char *buf,
671 const struct got_error *err = NULL;
675 *te = got_alloc_tree_entry_partial();
677 return got_error_from_errno("got_alloc_tree_entry_partial");
/* Length of the text part including its NUL terminator. */
679 *elen = strnlen(buf, maxlen) + 1;
680 if (*elen > maxlen) {
683 return got_error(GOT_ERR_BAD_OBJ_DATA);
/* The mode must be non-empty, so the space may not be the first byte. */
686 space = memchr(buf, ' ', *elen);
687 if (space == NULL || space <= buf) {
688 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/*
 * NOTE(review): no character is both below '0' and above '7', so this
 * condition is never true and non-octal digits are not rejected; '||'
 * looks intended.
 */
696 if (*p < '0' && *p > '7') {
697 err = got_error(GOT_ERR_BAD_OBJ_DATA);
701 (*te)->mode |= *p - '0';
/* NOTE(review): no NULL check is visible after this strdup(). */
705 (*te)->name = strdup(space + 1);
/* The binary digest must fit in what is left of the input. */
706 if (*elen > maxlen || maxlen - *elen < SHA1_DIGEST_LENGTH) {
707 err = got_error(GOT_ERR_BAD_OBJ_DATA);
711 memcpy((*te)->id->sha1, buf, SHA1_DIGEST_LENGTH);
712 *elen += SHA1_DIGEST_LENGTH;
715 got_object_tree_entry_close(*te);
/*
 * Parse a raw tree object of len bytes into a newly allocated tree.
 * Entries are parsed one at a time and first inserted into a path list
 * keyed by entry name; afterwards the path list is walked and each entry
 * is appended to the tree's entry queue, counting entries as it goes.
 * An empty tree yields an allocated tree with no entries.
 * Errors: GOT_ERR_TREE_DUP_ENTRY, GOT_ERR_BAD_OBJ_DATA, parse errors from
 * parse_tree_entry(), or an errno-based "calloc" error.
 */
721 const struct got_error *
722 got_object_parse_tree(struct got_tree_object **tree, uint8_t *buf, size_t len)
724 const struct got_error *err;
726 struct got_pathlist_head pathlist;
727 struct got_pathlist_entry *pe;
729 TAILQ_INIT(&pathlist);
731 *tree = calloc(1, sizeof(**tree));
733 return got_error_from_errno("calloc");
735 SIMPLEQ_INIT(&(*tree)->entries.head);
738 return NULL; /* tree is empty */
741 struct got_tree_entry *te;
742 struct got_pathlist_entry *new = NULL;
745 err = parse_tree_entry(&te, &elen, buf, remain);
/* NOTE(review): presumably 'new' stays NULL when the name already exists. */
748 err = got_pathlist_insert(&new, &pathlist, te->name, te);
752 err = got_error(GOT_ERR_TREE_DUP_ENTRY);
760 got_object_tree_close(*tree);
762 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* Move the entries into the tree in path-list order. */
766 TAILQ_FOREACH(pe, &pathlist, entry) {
767 struct got_tree_entry *te = pe->data;
768 (*tree)->entries.nentries++;
769 SIMPLEQ_INSERT_TAIL(&(*tree)->entries.head, te, entry);
772 got_pathlist_free(&pathlist);
/*
 * Release a tag object. Only the reference count check is visible in this
 * excerpt; the remainder of the body is not shown.
 */
777 got_object_tag_close(struct got_tag_object *tag)
779 if (tag->refcnt > 0) {
/*
 * Parse the textual body of a tag object into a newly allocated,
 * zero-initialized tag.
 * Fields are consumed in order: the tagged object's ID, the tagged
 * object's type, the tag name, an optional tagger line, and the remaining
 * bytes as the tag message.
 * Errors: GOT_ERR_BAD_OBJ_DATA for malformed input, or errno-based
 * allocation errors.
 */
791 const struct got_error *
792 got_object_parse_tag(struct got_tag_object **tag, uint8_t *buf, size_t len)
794 const struct got_error *err = NULL;
800 return got_error(GOT_ERR_BAD_OBJ_DATA);
802 *tag = calloc(1, sizeof(**tag));
804 return got_error_from_errno("calloc");
/* ID of the tagged object. */
806 label_len = strlen(GOT_TAG_LABEL_OBJECT);
807 if (strncmp(s, GOT_TAG_LABEL_OBJECT, label_len) == 0) {
/* A full digest string must still fit in the remaining input. */
809 if (remain < SHA1_DIGEST_STRING_LENGTH) {
810 err = got_error(GOT_ERR_BAD_OBJ_DATA);
814 if (!got_parse_sha1_digest((*tag)->id.sha1, s)) {
815 err = got_error(GOT_ERR_BAD_OBJ_DATA);
818 remain -= SHA1_DIGEST_STRING_LENGTH;
819 s += SHA1_DIGEST_STRING_LENGTH;
821 err = got_error(GOT_ERR_BAD_OBJ_DATA);
826 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* Type of the tagged object: commit, tree, blob or tag. */
830 label_len = strlen(GOT_TAG_LABEL_TYPE);
831 if (strncmp(s, GOT_TAG_LABEL_TYPE, label_len) == 0) {
834 err = got_error(GOT_ERR_BAD_OBJ_DATA);
838 if (strncmp(s, GOT_OBJ_LABEL_COMMIT,
839 strlen(GOT_OBJ_LABEL_COMMIT)) == 0) {
840 (*tag)->obj_type = GOT_OBJ_TYPE_COMMIT;
841 label_len = strlen(GOT_OBJ_LABEL_COMMIT);
844 } else if (strncmp(s, GOT_OBJ_LABEL_TREE,
845 strlen(GOT_OBJ_LABEL_TREE)) == 0) {
846 (*tag)->obj_type = GOT_OBJ_TYPE_TREE;
847 label_len = strlen(GOT_OBJ_LABEL_TREE);
850 } else if (strncmp(s, GOT_OBJ_LABEL_BLOB,
851 strlen(GOT_OBJ_LABEL_BLOB)) == 0) {
852 (*tag)->obj_type = GOT_OBJ_TYPE_BLOB;
853 label_len = strlen(GOT_OBJ_LABEL_BLOB);
856 } else if (strncmp(s, GOT_OBJ_LABEL_TAG,
857 strlen(GOT_OBJ_LABEL_TAG)) == 0) {
858 (*tag)->obj_type = GOT_OBJ_TYPE_TAG;
859 label_len = strlen(GOT_OBJ_LABEL_TAG);
863 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* The type label must be followed by a newline. */
867 if (remain <= 0 || *s != '\n') {
868 err = got_error(GOT_ERR_BAD_OBJ_DATA);
874 err = got_error(GOT_ERR_BAD_OBJ_DATA);
878 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* Tag name: copied as its own string, located via the line's newline. */
882 label_len = strlen(GOT_TAG_LABEL_TAG);
883 if (strncmp(s, GOT_TAG_LABEL_TAG, label_len) == 0) {
888 err = got_error(GOT_ERR_BAD_OBJ_DATA);
892 p = memchr(s, '\n', remain);
894 err = got_error(GOT_ERR_BAD_OBJ_DATA);
899 (*tag)->tag = strndup(s, slen);
900 if ((*tag)->tag == NULL) {
901 err = got_error_from_errno("strndup");
907 err = got_error(GOT_ERR_BAD_OBJ_DATA);
911 err = got_error(GOT_ERR_BAD_OBJ_DATA);
/* Tagger line: split into time information and name like a committer. */
915 label_len = strlen(GOT_TAG_LABEL_TAGGER);
916 if (strncmp(s, GOT_TAG_LABEL_TAGGER, label_len) == 0) {
922 err = got_error(GOT_ERR_BAD_OBJ_DATA);
926 p = memchr(s, '\n', remain);
928 err = got_error(GOT_ERR_BAD_OBJ_DATA);
933 err = parse_commit_time(&(*tag)->tagger_time,
934 &(*tag)->tagger_gmtoff, s);
937 (*tag)->tagger = strdup(s);
938 if ((*tag)->tagger == NULL) {
939 err = got_error_from_errno("strdup");
945 err = got_error(GOT_ERR_BAD_OBJ_DATA);
949 /* Some old tags in the Linux git repo have no tagger. */
/* In that case the tagger is stored as an empty string, not NULL. */
950 (*tag)->tagger = strdup("");
951 if ((*tag)->tagger == NULL) {
952 err = got_error_from_errno("strdup");
/* Everything left over is the tag message. */
957 (*tag)->tagmsg = strndup(s, remain);
958 if ((*tag)->tagmsg == NULL) {
959 err = got_error_from_errno("strndup");
/* NOTE(review): presumably reached only on error, to discard the tag. */
964 got_object_tag_close(*tag);
970 const struct got_error *
971 got_read_file_to_mem(uint8_t **outbuf, size_t *outlen, FILE *f)
973 const struct got_error *err = NULL;
974 static const size_t blocksize = 512;
975 size_t n, total, remain;
981 buf = malloc(blocksize);
983 return got_error_from_errno("malloc");
990 newbuf = reallocarray(buf, 1, total + blocksize);
991 if (newbuf == NULL) {
992 err = got_error_from_errno("reallocarray");
998 n = fread(buf + total, 1, remain, f);
1001 err = got_ferror(f, GOT_ERR_IO);