2 5d56da81 2019-01-13 stsp * Copyright (c) 2018, 2019 Stefan Sperling <stsp@openbsd.org>
4 d71d75ad 2017-11-05 stsp * Permission to use, copy, modify, and distribute this software for any
5 d71d75ad 2017-11-05 stsp * purpose with or without fee is hereby granted, provided that the above
6 d71d75ad 2017-11-05 stsp * copyright notice and this permission notice appear in all copies.
8 d71d75ad 2017-11-05 stsp * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 d71d75ad 2017-11-05 stsp * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 d71d75ad 2017-11-05 stsp * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 d71d75ad 2017-11-05 stsp * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 d71d75ad 2017-11-05 stsp * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 d71d75ad 2017-11-05 stsp * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 d71d75ad 2017-11-05 stsp * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
17 2178c42e 2018-04-22 stsp #include <sys/types.h>
18 0ffeb3c2 2017-11-26 stsp #include <sys/stat.h>
19 d1cda826 2017-11-06 stsp #include <sys/queue.h>
20 f8b19efd 2021-10-13 stsp #include <sys/tree.h>
21 2178c42e 2018-04-22 stsp #include <sys/uio.h>
22 64a8571e 2022-01-07 stsp #include <sys/mman.h>
24 a1fd68d8 2018-01-12 stsp #include <errno.h>
25 2178c42e 2018-04-22 stsp #include <fcntl.h>
26 d71d75ad 2017-11-05 stsp #include <stdio.h>
27 ab9a70b2 2017-11-06 stsp #include <stdlib.h>
28 ab9a70b2 2017-11-06 stsp #include <string.h>
29 d71d75ad 2017-11-05 stsp #include <sha1.h>
30 81a12da5 2020-09-09 naddy #include <unistd.h>
31 ab9a70b2 2017-11-06 stsp #include <zlib.h>
32 e40622f4 2020-07-23 stsp #include <libgen.h>
33 ab9a70b2 2017-11-06 stsp #include <limits.h>
34 2178c42e 2018-04-22 stsp #include <imsg.h>
36 ab9a70b2 2017-11-06 stsp #include "got_error.h"
37 d71d75ad 2017-11-05 stsp #include "got_object.h"
38 ab9a70b2 2017-11-06 stsp #include "got_repository.h"
39 511a516b 2018-05-19 stsp #include "got_opentemp.h"
40 324d37e7 2019-05-11 stsp #include "got_path.h"
42 718b3ab0 2018-03-17 stsp #include "got_lib_sha1.h"
43 718b3ab0 2018-03-17 stsp #include "got_lib_delta.h"
44 63581804 2018-07-09 stsp #include "got_lib_inflate.h"
45 718b3ab0 2018-03-17 stsp #include "got_lib_object.h"
46 6bef87be 2018-09-11 stsp #include "got_lib_object_idcache.h"
47 6bef87be 2018-09-11 stsp #include "got_lib_object_cache.h"
48 ad242220 2018-09-08 stsp #include "got_lib_object_parse.h"
49 15a94983 2018-12-23 stsp #include "got_lib_pack.h"
50 7bb0daa1 2018-06-21 stsp #include "got_lib_repository.h"
53 ab9a70b2 2017-11-06 stsp #define MIN(_a,_b) ((_a) < (_b) ? (_a) : (_b))
56 0ab4c957 2022-06-13 stsp #ifndef nitems
57 0ab4c957 2022-06-13 stsp #define nitems(_a) (sizeof((_a)) / sizeof((_a)[0]))
60 3235492e 2018-04-01 stsp struct got_object_id *
61 3235492e 2018-04-01 stsp got_object_get_id(struct got_object *obj)
63 6402fb3c 2018-09-15 stsp return &obj->id;
66 bacc9935 2018-05-20 stsp const struct got_error *
67 bacc9935 2018-05-20 stsp got_object_get_id_str(char **outbuf, struct got_object *obj)
69 bacc9935 2018-05-20 stsp return got_object_id_str(outbuf, &obj->id);
72 15a94983 2018-12-23 stsp const struct got_error *
73 15a94983 2018-12-23 stsp got_object_get_type(int *type, struct got_repository *repo,
74 15a94983 2018-12-23 stsp struct got_object_id *id)
76 15a94983 2018-12-23 stsp const struct got_error *err = NULL;
77 15a94983 2018-12-23 stsp struct got_object *obj;
79 15a94983 2018-12-23 stsp err = got_object_open(&obj, repo, id);
83 b107e67f 2018-01-19 stsp switch (obj->type) {
84 a1fd68d8 2018-01-12 stsp case GOT_OBJ_TYPE_COMMIT:
85 a1fd68d8 2018-01-12 stsp case GOT_OBJ_TYPE_TREE:
86 a1fd68d8 2018-01-12 stsp case GOT_OBJ_TYPE_BLOB:
87 b107e67f 2018-01-19 stsp case GOT_OBJ_TYPE_TAG:
88 15a94983 2018-12-23 stsp *type = obj->type;
91 15a94983 2018-12-23 stsp err = got_error(GOT_ERR_OBJ_TYPE);
95 15a94983 2018-12-23 stsp got_object_close(obj);
99 90bdb554 2019-04-11 stsp const struct got_error *
100 90bdb554 2019-04-11 stsp got_object_get_path(char **path, struct got_object_id *id,
101 90bdb554 2019-04-11 stsp struct got_repository *repo)
103 ab9a70b2 2017-11-06 stsp const struct got_error *err = NULL;
104 7a132809 2018-07-23 stsp char *hex = NULL;
105 41d2888b 2019-08-11 stsp char *path_objects;
107 e6b1056e 2018-04-22 stsp *path = NULL;
109 41d2888b 2019-08-11 stsp path_objects = got_repo_get_path_objects(repo);
110 ab9a70b2 2017-11-06 stsp if (path_objects == NULL)
111 638f9024 2019-05-13 stsp return got_error_from_errno("got_repo_get_path_objects");
113 ef0981d5 2018-02-12 stsp err = got_object_id_str(&hex, id);
117 d1cda826 2017-11-06 stsp if (asprintf(path, "%s/%.2x/%s", path_objects,
118 d1cda826 2017-11-06 stsp id->sha1[0], hex + 2) == -1)
119 638f9024 2019-05-13 stsp err = got_error_from_errno("asprintf");
123 d1cda826 2017-11-06 stsp free(path_objects);
124 d1cda826 2017-11-06 stsp return err;
127 762d73f4 2021-04-10 stsp const struct got_error *
128 762d73f4 2021-04-10 stsp got_object_open_loose_fd(int *fd, struct got_object_id *id,
129 4796fb13 2018-12-23 stsp struct got_repository *repo)
131 d1cda826 2017-11-06 stsp const struct got_error *err = NULL;
132 a1fd68d8 2018-01-12 stsp char *path;
134 90bdb554 2019-04-11 stsp err = got_object_get_path(&path, id, repo);
136 d1cda826 2017-11-06 stsp return err;
137 8bd0cdad 2021-12-31 stsp *fd = open(path, O_RDONLY | O_NOFOLLOW | O_CLOEXEC);
138 d5003b79 2018-04-22 stsp if (*fd == -1) {
139 e82b1d81 2019-07-27 stsp err = got_error_from_errno2("open", path);
143 4558fcd4 2018-01-14 stsp free(path);
144 59d1e4a0 2021-03-10 stsp return err;
147 59d1e4a0 2021-03-10 stsp const struct got_error *
148 6dfa2fd3 2018-02-12 stsp got_object_open_by_id_str(struct got_object **obj, struct got_repository *repo,
149 6dfa2fd3 2018-02-12 stsp const char *id_str)
151 6dfa2fd3 2018-02-12 stsp struct got_object_id id;
153 6dfa2fd3 2018-02-12 stsp if (!got_parse_sha1_digest(id.sha1, id_str))
154 6dd1ece6 2019-11-10 stsp return got_error_path(id_str, GOT_ERR_BAD_OBJ_ID_STR);
156 6dfa2fd3 2018-02-12 stsp return got_object_open(obj, repo, &id);
159 15a94983 2018-12-23 stsp const struct got_error *
160 15a94983 2018-12-23 stsp got_object_resolve_id_str(struct got_object_id **id,
161 15a94983 2018-12-23 stsp struct got_repository *repo, const char *id_str)
163 15a94983 2018-12-23 stsp const struct got_error *err = NULL;
164 15a94983 2018-12-23 stsp struct got_object *obj;
166 15a94983 2018-12-23 stsp err = got_object_open_by_id_str(&obj, repo, id_str);
168 15a94983 2018-12-23 stsp return err;
170 15a94983 2018-12-23 stsp *id = got_object_id_dup(got_object_get_id(obj));
171 15a94983 2018-12-23 stsp got_object_close(obj);
172 15a94983 2018-12-23 stsp if (*id == NULL)
173 638f9024 2019-05-13 stsp return got_error_from_errno("got_object_id_dup");
175 15a94983 2018-12-23 stsp return NULL;
178 e32baab7 2018-11-05 stsp const struct got_error *
179 dbc6a6b6 2018-07-12 stsp got_object_qid_alloc(struct got_object_qid **qid, struct got_object_id *id)
181 dbc6a6b6 2018-07-12 stsp *qid = calloc(1, sizeof(**qid));
182 dbc6a6b6 2018-07-12 stsp if (*qid == NULL)
183 638f9024 2019-05-13 stsp return got_error_from_errno("calloc");
185 d7b5a0e8 2022-04-20 stsp memcpy(&(*qid)->id, id, sizeof((*qid)->id));
186 9ca9aafb 2021-06-18 stsp return NULL;
189 9ca9aafb 2021-06-18 stsp const struct got_error *
190 9ca9aafb 2021-06-18 stsp got_object_id_queue_copy(const struct got_object_id_queue *src,
191 9ca9aafb 2021-06-18 stsp struct got_object_id_queue *dest)
193 9ca9aafb 2021-06-18 stsp const struct got_error *err;
194 9ca9aafb 2021-06-18 stsp struct got_object_qid *qid;
196 dbdddfee 2021-06-23 naddy STAILQ_FOREACH(qid, src, entry) {
197 9ca9aafb 2021-06-18 stsp struct got_object_qid *new;
199 9ca9aafb 2021-06-18 stsp * Deep-copy the object ID only. Let the caller deal
200 9ca9aafb 2021-06-18 stsp * with setting up the new->data pointer if needed.
202 5e91dae4 2022-08-30 stsp err = got_object_qid_alloc(&new, &qid->id);
204 9ca9aafb 2021-06-18 stsp got_object_id_queue_free(dest);
205 9ca9aafb 2021-06-18 stsp return err;
207 dbdddfee 2021-06-23 naddy STAILQ_INSERT_TAIL(dest, new, entry);
210 dbc6a6b6 2018-07-12 stsp return NULL;
214 56e0773d 2019-11-28 stsp got_object_tree_get_nentries(struct got_tree_object *tree)
216 56e0773d 2019-11-28 stsp return tree->nentries;
219 56e0773d 2019-11-28 stsp struct got_tree_entry *
220 56e0773d 2019-11-28 stsp got_object_tree_get_first_entry(struct got_tree_object *tree)
222 56e0773d 2019-11-28 stsp return got_object_tree_get_entry(tree, 0);
225 56e0773d 2019-11-28 stsp struct got_tree_entry *
226 56e0773d 2019-11-28 stsp got_object_tree_get_last_entry(struct got_tree_object *tree)
228 56e0773d 2019-11-28 stsp return got_object_tree_get_entry(tree, tree->nentries - 1);
231 56e0773d 2019-11-28 stsp struct got_tree_entry *
232 56e0773d 2019-11-28 stsp got_object_tree_get_entry(struct got_tree_object *tree, int i)
234 56e0773d 2019-11-28 stsp if (i < 0 || i >= tree->nentries)
235 56e0773d 2019-11-28 stsp return NULL;
236 56e0773d 2019-11-28 stsp return &tree->entries[i];
240 56e0773d 2019-11-28 stsp got_tree_entry_get_mode(struct got_tree_entry *te)
242 56e0773d 2019-11-28 stsp return te->mode;
245 56e0773d 2019-11-28 stsp const char *
246 56e0773d 2019-11-28 stsp got_tree_entry_get_name(struct got_tree_entry *te)
248 56e0773d 2019-11-28 stsp return &te->name[0];
251 56e0773d 2019-11-28 stsp struct got_object_id *
252 56e0773d 2019-11-28 stsp got_tree_entry_get_id(struct got_tree_entry *te)
254 56e0773d 2019-11-28 stsp return &te->id;
257 0d6c6ee3 2020-05-20 stsp const struct got_error *
258 af57b12a 2020-07-23 stsp got_object_blob_read_to_str(char **s, struct got_blob_object *blob)
260 0d6c6ee3 2020-05-20 stsp const struct got_error *err = NULL;
261 32596e16 2020-07-23 stsp size_t len, totlen, hdrlen, offset;
265 659dc16e 2020-07-23 stsp hdrlen = got_object_blob_get_hdrlen(blob);
266 659dc16e 2020-07-23 stsp totlen = 0;
267 32596e16 2020-07-23 stsp offset = 0;
271 659dc16e 2020-07-23 stsp err = got_object_blob_read_block(&len, blob);
273 af57b12a 2020-07-23 stsp return err;
275 659dc16e 2020-07-23 stsp if (len == 0)
278 659dc16e 2020-07-23 stsp totlen += len - hdrlen;
279 af57b12a 2020-07-23 stsp p = realloc(*s, totlen + 1);
280 659dc16e 2020-07-23 stsp if (p == NULL) {
281 659dc16e 2020-07-23 stsp err = got_error_from_errno("realloc");
284 af57b12a 2020-07-23 stsp return err;
287 659dc16e 2020-07-23 stsp /* Skip blob object header first time around. */
288 af57b12a 2020-07-23 stsp memcpy(*s + offset,
289 f8f7c882 2020-07-23 stsp got_object_blob_get_read_buf(blob) + hdrlen, len - hdrlen);
290 659dc16e 2020-07-23 stsp hdrlen = 0;
291 32596e16 2020-07-23 stsp offset = totlen;
292 659dc16e 2020-07-23 stsp } while (len > 0);
294 af57b12a 2020-07-23 stsp (*s)[totlen] = '\0';
295 af57b12a 2020-07-23 stsp return NULL;
298 af57b12a 2020-07-23 stsp const struct got_error *
299 af57b12a 2020-07-23 stsp got_tree_entry_get_symlink_target(char **link_target, struct got_tree_entry *te,
300 af57b12a 2020-07-23 stsp struct got_repository *repo)
302 af57b12a 2020-07-23 stsp const struct got_error *err = NULL;
303 af57b12a 2020-07-23 stsp struct got_blob_object *blob = NULL;
304 eb81bc23 2022-06-28 tracey int fd = -1;
306 af57b12a 2020-07-23 stsp *link_target = NULL;
308 af57b12a 2020-07-23 stsp if (!got_object_tree_entry_is_symlink(te))
309 af57b12a 2020-07-23 stsp return got_error(GOT_ERR_TREE_ENTRY_TYPE);
311 eb81bc23 2022-06-28 tracey fd = got_opentempfd();
312 eb81bc23 2022-06-28 tracey if (fd == -1) {
313 eb81bc23 2022-06-28 tracey err = got_error_from_errno("got_opentempfd");
314 eb81bc23 2022-06-28 tracey goto done;
317 eb81bc23 2022-06-28 tracey err = got_object_open_as_blob(&blob, repo,
318 eb81bc23 2022-06-28 tracey got_tree_entry_get_id(te), PATH_MAX, fd);
320 eb81bc23 2022-06-28 tracey goto done;
322 af57b12a 2020-07-23 stsp err = got_object_blob_read_to_str(link_target, blob);
324 eb81bc23 2022-06-28 tracey if (fd != -1 && close(fd) == -1 && err == NULL)
325 eb81bc23 2022-06-28 tracey err = got_error_from_errno("close");
326 eb81bc23 2022-06-28 tracey if (blob)
327 eb81bc23 2022-06-28 tracey got_object_blob_close(blob);
329 659dc16e 2020-07-23 stsp free(*link_target);
330 659dc16e 2020-07-23 stsp *link_target = NULL;
332 0d6c6ee3 2020-05-20 stsp return err;
336 56e0773d 2019-11-28 stsp got_tree_entry_get_index(struct got_tree_entry *te)
338 56e0773d 2019-11-28 stsp return te->idx;
341 56e0773d 2019-11-28 stsp struct got_tree_entry *
342 56e0773d 2019-11-28 stsp got_tree_entry_get_next(struct got_tree_object *tree,
343 56e0773d 2019-11-28 stsp struct got_tree_entry *te)
345 56e0773d 2019-11-28 stsp return got_object_tree_get_entry(tree, te->idx + 1);
348 56e0773d 2019-11-28 stsp struct got_tree_entry *
349 56e0773d 2019-11-28 stsp got_tree_entry_get_prev(struct got_tree_object *tree,
350 56e0773d 2019-11-28 stsp struct got_tree_entry *te)
352 56e0773d 2019-11-28 stsp return got_object_tree_get_entry(tree, te->idx - 1);
355 a19581a2 2018-06-21 stsp const struct got_error *
356 68482ea3 2017-11-27 stsp got_object_blob_close(struct got_blob_object *blob)
358 fb43ecf1 2019-02-11 stsp const struct got_error *err = NULL;
359 15c8b0e6 2018-04-24 stsp free(blob->read_buf);
360 56b63ca4 2021-01-22 stsp if (blob->f && fclose(blob->f) == EOF)
361 638f9024 2019-05-13 stsp err = got_error_from_errno("fclose");
362 ac544f8c 2019-01-13 stsp free(blob->data);
363 68482ea3 2017-11-27 stsp free(blob);
364 fb43ecf1 2019-02-11 stsp return err;
368 8ba819a3 2020-07-23 stsp got_object_blob_rewind(struct got_blob_object *blob)
370 8ba819a3 2020-07-23 stsp if (blob->f)
371 8ba819a3 2020-07-23 stsp rewind(blob->f);
375 f934cf2c 2018-02-12 stsp got_object_blob_id_str(struct got_blob_object *blob, char *buf, size_t size)
377 f934cf2c 2018-02-12 stsp return got_sha1_digest_to_str(blob->id.sha1, buf, size);
381 f934cf2c 2018-02-12 stsp got_object_blob_get_hdrlen(struct got_blob_object *blob)
383 f934cf2c 2018-02-12 stsp return blob->hdrlen;
386 f934cf2c 2018-02-12 stsp const uint8_t *
387 f934cf2c 2018-02-12 stsp got_object_blob_get_read_buf(struct got_blob_object *blob)
389 f934cf2c 2018-02-12 stsp return blob->read_buf;
392 68482ea3 2017-11-27 stsp const struct got_error *
393 eb651edf 2018-02-11 stsp got_object_blob_read_block(size_t *outlenp, struct got_blob_object *blob)
397 eb651edf 2018-02-11 stsp n = fread(blob->read_buf, 1, blob->blocksize, blob->f);
398 eb651edf 2018-02-11 stsp if (n == 0 && ferror(blob->f))
399 eb651edf 2018-02-11 stsp return got_ferror(blob->f, GOT_ERR_IO);
400 eb651edf 2018-02-11 stsp *outlenp = n;
401 35e9ba5d 2018-06-21 stsp return NULL;
404 35e9ba5d 2018-06-21 stsp const struct got_error *
405 0d569390 2023-01-04 op got_object_blob_is_binary(int *binary, struct got_blob_object *blob)
407 0d569390 2023-01-04 op const struct got_error *err;
408 0d569390 2023-01-04 op size_t hdrlen, len;
411 0d569390 2023-01-04 op hdrlen = got_object_blob_get_hdrlen(blob);
413 0d569390 2023-01-04 op if (fseeko(blob->f, hdrlen, SEEK_SET) == -1)
414 0d569390 2023-01-04 op return got_error_from_errno("fseeko");
416 0d569390 2023-01-04 op err = got_object_blob_read_block(&len, blob);
420 0d569390 2023-01-04 op *binary = memchr(blob->read_buf, '\0', len) != NULL;
422 0d569390 2023-01-04 op if (fseeko(blob->f, hdrlen, SEEK_SET) == -1)
423 0d569390 2023-01-04 op return got_error_from_errno("fseeko");
427 389a68d8 2023-01-05 op const struct got_error *
428 389a68d8 2023-01-05 op got_object_blob_getline(char **line, ssize_t *linelen, size_t *linesize,
429 389a68d8 2023-01-05 op struct got_blob_object *blob)
431 389a68d8 2023-01-05 op *linelen = getline(line, linesize, blob->f);
432 389a68d8 2023-01-05 op if (*linelen == -1 && !feof(blob->f))
433 389a68d8 2023-01-05 op return got_error_from_errno("getline");
437 0d569390 2023-01-04 op const struct got_error *
438 be659d10 2020-11-18 stsp got_object_blob_dump_to_file(off_t *filesize, int *nlines,
439 6c4c42e0 2019-06-24 stsp off_t **line_offsets, FILE *outfile, struct got_blob_object *blob)
441 35e9ba5d 2018-06-21 stsp const struct got_error *err = NULL;
442 b6752625 2018-12-24 stsp size_t n, len, hdrlen;
443 84451b3e 2018-07-10 stsp const uint8_t *buf;
445 c33ebc60 2020-11-18 stsp const int alloc_chunksz = 512;
446 c33ebc60 2020-11-18 stsp size_t nalloc = 0;
447 f595d9bd 2019-08-14 stsp off_t off = 0, total_len = 0;
449 6c4c42e0 2019-06-24 stsp if (line_offsets)
450 6c4c42e0 2019-06-24 stsp *line_offsets = NULL;
451 f595d9bd 2019-08-14 stsp if (filesize)
452 f595d9bd 2019-08-14 stsp *filesize = 0;
453 84451b3e 2018-07-10 stsp if (nlines)
454 84451b3e 2018-07-10 stsp *nlines = 0;
456 35e9ba5d 2018-06-21 stsp hdrlen = got_object_blob_get_hdrlen(blob);
458 35e9ba5d 2018-06-21 stsp err = got_object_blob_read_block(&len, blob);
460 35e9ba5d 2018-06-21 stsp return err;
461 35e9ba5d 2018-06-21 stsp if (len == 0)
463 84451b3e 2018-07-10 stsp buf = got_object_blob_get_read_buf(blob);
464 b02560ec 2019-08-19 stsp i = hdrlen;
465 f1cbc3bc 2020-11-18 stsp if (nlines) {
466 f1cbc3bc 2020-11-18 stsp if (line_offsets && *line_offsets == NULL) {
467 78695fb7 2019-08-12 stsp /* Have some data but perhaps no '\n'. */
468 78695fb7 2019-08-12 stsp *nlines = 1;
469 c33ebc60 2020-11-18 stsp nalloc = alloc_chunksz;
470 c33ebc60 2020-11-18 stsp *line_offsets = calloc(nalloc,
471 c33ebc60 2020-11-18 stsp sizeof(**line_offsets));
472 78695fb7 2019-08-12 stsp if (*line_offsets == NULL)
473 845785d4 2020-02-02 tracey return got_error_from_errno("calloc");
475 b02560ec 2019-08-19 stsp /* Skip forward over end of first line. */
476 b02560ec 2019-08-19 stsp while (i < len) {
477 b02560ec 2019-08-19 stsp if (buf[i] == '\n')
482 b02560ec 2019-08-19 stsp /* Scan '\n' offsets in remaining chunk of data. */
483 b02560ec 2019-08-19 stsp while (i < len) {
484 b02560ec 2019-08-19 stsp if (buf[i] != '\n') {
488 f595d9bd 2019-08-14 stsp (*nlines)++;
489 c33ebc60 2020-11-18 stsp if (line_offsets && nalloc < *nlines) {
490 c33ebc60 2020-11-18 stsp size_t n = *nlines + alloc_chunksz;
491 78695fb7 2019-08-12 stsp off_t *o = recallocarray(*line_offsets,
492 c33ebc60 2020-11-18 stsp nalloc, n, sizeof(**line_offsets));
493 78695fb7 2019-08-12 stsp if (o == NULL) {
494 78695fb7 2019-08-12 stsp free(*line_offsets);
495 78695fb7 2019-08-12 stsp *line_offsets = NULL;
496 78695fb7 2019-08-12 stsp return got_error_from_errno(
497 78695fb7 2019-08-12 stsp "recallocarray");
499 78695fb7 2019-08-12 stsp *line_offsets = o;
500 c33ebc60 2020-11-18 stsp nalloc = n;
502 f1cbc3bc 2020-11-18 stsp if (line_offsets) {
503 f1cbc3bc 2020-11-18 stsp off = total_len + i - hdrlen + 1;
504 f1cbc3bc 2020-11-18 stsp (*line_offsets)[*nlines - 1] = off;
509 35e9ba5d 2018-06-21 stsp /* Skip blob object header first time around. */
510 454a6b59 2018-12-24 stsp n = fwrite(buf + hdrlen, 1, len - hdrlen, outfile);
511 b6752625 2018-12-24 stsp if (n != len - hdrlen)
512 b6752625 2018-12-24 stsp return got_ferror(outfile, GOT_ERR_IO);
513 f595d9bd 2019-08-14 stsp total_len += len - hdrlen;
514 35e9ba5d 2018-06-21 stsp hdrlen = 0;
515 35e9ba5d 2018-06-21 stsp } while (len != 0);
517 cbe7f848 2019-02-11 stsp if (fflush(outfile) != 0)
518 638f9024 2019-05-13 stsp return got_error_from_errno("fflush");
519 35e9ba5d 2018-06-21 stsp rewind(outfile);
521 f595d9bd 2019-08-14 stsp if (filesize)
522 f595d9bd 2019-08-14 stsp *filesize = total_len;
524 776d4d29 2018-06-17 stsp return NULL;
527 d24820bf 2019-08-11 stsp const char *
528 d24820bf 2019-08-11 stsp got_object_tag_get_name(struct got_tag_object *tag)
530 d24820bf 2019-08-11 stsp return tag->tag;
534 0bd18d37 2019-02-01 stsp got_object_tag_get_object_type(struct got_tag_object *tag)
536 0bd18d37 2019-02-01 stsp return tag->obj_type;
539 0bd18d37 2019-02-01 stsp struct got_object_id *
540 0bd18d37 2019-02-01 stsp got_object_tag_get_object_id(struct got_tag_object *tag)
542 0bd18d37 2019-02-01 stsp return &tag->id;
546 01073a5d 2019-08-22 stsp got_object_tag_get_tagger_time(struct got_tag_object *tag)
548 01073a5d 2019-08-22 stsp return tag->tagger_time;
552 01073a5d 2019-08-22 stsp got_object_tag_get_tagger_gmtoff(struct got_tag_object *tag)
554 01073a5d 2019-08-22 stsp return tag->tagger_gmtoff;
557 01073a5d 2019-08-22 stsp const char *
558 01073a5d 2019-08-22 stsp got_object_tag_get_tagger(struct got_tag_object *tag)
560 01073a5d 2019-08-22 stsp return tag->tagger;
563 01073a5d 2019-08-22 stsp const char *
564 01073a5d 2019-08-22 stsp got_object_tag_get_message(struct got_tag_object *tag)
566 01073a5d 2019-08-22 stsp return tag->tagmsg;
569 776d4d29 2018-06-17 stsp static struct got_tree_entry *
570 65a9bbe9 2018-09-15 stsp find_entry_by_name(struct got_tree_object *tree, const char *name, size_t len)
574 63da309a 2018-11-07 stsp /* Note that tree entries are sorted in strncmp() order. */
575 56e0773d 2019-11-28 stsp for (i = 0; i < tree->nentries; i++) {
576 56e0773d 2019-11-28 stsp struct got_tree_entry *te = &tree->entries[i];
577 63da309a 2018-11-07 stsp int cmp = strncmp(te->name, name, len);
578 63da309a 2018-11-07 stsp if (cmp < 0)
580 63da309a 2018-11-07 stsp if (cmp > 0)
582 63da309a 2018-11-07 stsp if (te->name[len] == '\0')
585 eb651edf 2018-02-11 stsp return NULL;
588 56e0773d 2019-11-28 stsp struct got_tree_entry *
589 a129376b 2019-03-28 stsp got_object_tree_find_entry(struct got_tree_object *tree, const char *name)
591 a129376b 2019-03-28 stsp return find_entry_by_name(tree, name, strlen(name));
594 776d4d29 2018-06-17 stsp const struct got_error *
595 67b631c9 2021-10-10 stsp got_object_tree_find_path(struct got_object_id **id, mode_t *mode,
596 67b631c9 2021-10-10 stsp struct got_repository *repo, struct got_tree_object *tree,
597 67b631c9 2021-10-10 stsp const char *path)
599 776d4d29 2018-06-17 stsp const struct got_error *err = NULL;
600 67b631c9 2021-10-10 stsp struct got_tree_object *subtree = NULL;
601 db37e2c0 2018-06-21 stsp struct got_tree_entry *te = NULL;
602 65a9bbe9 2018-09-15 stsp const char *seg, *s;
603 b7cd37e5 2018-11-18 stsp size_t seglen;
605 27d434c2 2018-09-15 stsp *id = NULL;
608 5e54fb30 2019-05-31 stsp while (s[0] == '/')
611 65a9bbe9 2018-09-15 stsp seglen = 0;
612 67b631c9 2021-10-10 stsp subtree = tree;
613 b7cd37e5 2018-11-18 stsp while (*s) {
614 776d4d29 2018-06-17 stsp struct got_tree_object *next_tree;
616 776d4d29 2018-06-17 stsp if (*s != '/') {
623 67b631c9 2021-10-10 stsp te = find_entry_by_name(subtree, seg, seglen);
624 db37e2c0 2018-06-21 stsp if (te == NULL) {
625 b66cd6f3 2020-07-31 stsp err = got_error_path(path, GOT_ERR_NO_TREE_ENTRY);
629 b7cd37e5 2018-11-18 stsp if (*s == '\0')
632 776d4d29 2018-06-17 stsp seg = s + 1;
633 65a9bbe9 2018-09-15 stsp seglen = 0;
636 776d4d29 2018-06-17 stsp err = got_object_open_as_tree(&next_tree, repo,
641 67b631c9 2021-10-10 stsp if (subtree != tree)
642 67b631c9 2021-10-10 stsp got_object_tree_close(subtree);
643 67b631c9 2021-10-10 stsp subtree = next_tree;
648 56e0773d 2019-11-28 stsp *id = got_object_id_dup(&te->id);
649 27d434c2 2018-09-15 stsp if (*id == NULL)
650 638f9024 2019-05-13 stsp return got_error_from_errno("got_object_id_dup");
652 67b631c9 2021-10-10 stsp *mode = te->mode;
654 b66cd6f3 2020-07-31 stsp err = got_error_path(path, GOT_ERR_NO_TREE_ENTRY);
656 67b631c9 2021-10-10 stsp if (subtree && subtree != tree)
657 67b631c9 2021-10-10 stsp got_object_tree_close(subtree);
658 67b631c9 2021-10-10 stsp return err;
661 67b631c9 2021-10-10 stsp const struct got_error *
662 67b631c9 2021-10-10 stsp got_object_id_by_path(struct got_object_id **id, struct got_repository *repo,
663 a44927cc 2022-04-07 stsp struct got_commit_object *commit, const char *path)
665 67b631c9 2021-10-10 stsp const struct got_error *err = NULL;
666 67b631c9 2021-10-10 stsp struct got_tree_object *tree = NULL;
668 67b631c9 2021-10-10 stsp *id = NULL;
670 67b631c9 2021-10-10 stsp /* Handle opening of root of commit's tree. */
671 67b631c9 2021-10-10 stsp if (got_path_is_root_dir(path)) {
672 67b631c9 2021-10-10 stsp *id = got_object_id_dup(commit->tree_id);
673 67b631c9 2021-10-10 stsp if (*id == NULL)
674 67b631c9 2021-10-10 stsp err = got_error_from_errno("got_object_id_dup");
676 67b631c9 2021-10-10 stsp err = got_object_open_as_tree(&tree, repo, commit->tree_id);
679 67b631c9 2021-10-10 stsp err = got_object_tree_find_path(id, NULL, repo, tree, path);
683 776d4d29 2018-06-17 stsp got_object_tree_close(tree);
684 776d4d29 2018-06-17 stsp return err;
688 ac5f2b26 2020-05-05 stsp * Normalize file mode bits to avoid false positive tree entry differences
689 ac5f2b26 2020-05-05 stsp * in case tree entries have unexpected mode bits set.
691 ac5f2b26 2020-05-05 stsp static mode_t
692 ac5f2b26 2020-05-05 stsp normalize_mode_for_comparison(mode_t mode)
695 ac5f2b26 2020-05-05 stsp * For directories, the only relevant bit is the IFDIR bit.
696 ac5f2b26 2020-05-05 stsp * This allows us to detect paths changing from a directory
697 ac5f2b26 2020-05-05 stsp * to a file and vice versa.
699 ac5f2b26 2020-05-05 stsp if (S_ISDIR(mode))
700 ac5f2b26 2020-05-05 stsp return mode & S_IFDIR;
703 40dde666 2020-07-23 stsp * For symlinks, the only relevant bit is the IFLNK bit.
704 40dde666 2020-07-23 stsp * This allows us to detect paths changing from a symlink
705 40dde666 2020-07-23 stsp * to a file or directory and vice versa.
707 40dde666 2020-07-23 stsp if (S_ISLNK(mode))
708 40dde666 2020-07-23 stsp return mode & S_IFLNK;
710 ac5f2b26 2020-05-05 stsp /* For files, the only change we care about is the executable bit. */
711 ac5f2b26 2020-05-05 stsp return mode & S_IXUSR;
714 07862c20 2018-09-15 stsp const struct got_error *
715 07862c20 2018-09-15 stsp got_object_tree_path_changed(int *changed,
716 07862c20 2018-09-15 stsp struct got_tree_object *tree01, struct got_tree_object *tree02,
717 07862c20 2018-09-15 stsp const char *path, struct got_repository *repo)
719 07862c20 2018-09-15 stsp const struct got_error *err = NULL;
720 07862c20 2018-09-15 stsp struct got_tree_object *tree1 = NULL, *tree2 = NULL;
721 07862c20 2018-09-15 stsp struct got_tree_entry *te1 = NULL, *te2 = NULL;
722 65a9bbe9 2018-09-15 stsp const char *seg, *s;
723 3b7f9878 2018-11-18 stsp size_t seglen;
725 07862c20 2018-09-15 stsp *changed = 0;
727 07862c20 2018-09-15 stsp /* We do not support comparing the root path. */
728 61a7d79f 2020-02-29 stsp if (got_path_is_root_dir(path))
729 63f810e6 2020-02-29 stsp return got_error_path(path, GOT_ERR_BAD_PATH);
731 07862c20 2018-09-15 stsp tree1 = tree01;
732 07862c20 2018-09-15 stsp tree2 = tree02;
734 61a7d79f 2020-02-29 stsp while (*s == '/')
737 65a9bbe9 2018-09-15 stsp seglen = 0;
738 3b7f9878 2018-11-18 stsp while (*s) {
739 07862c20 2018-09-15 stsp struct got_tree_object *next_tree1, *next_tree2;
740 ac5f2b26 2020-05-05 stsp mode_t mode1, mode2;
742 07862c20 2018-09-15 stsp if (*s != '/') {
749 65a9bbe9 2018-09-15 stsp te1 = find_entry_by_name(tree1, seg, seglen);
750 07862c20 2018-09-15 stsp if (te1 == NULL) {
751 07862c20 2018-09-15 stsp err = got_error(GOT_ERR_NO_OBJ);
756 e8bfb8f3 2020-12-18 stsp te2 = find_entry_by_name(tree2, seg, seglen);
759 e8bfb8f3 2020-12-18 stsp mode1 = normalize_mode_for_comparison(te1->mode);
760 e8bfb8f3 2020-12-18 stsp mode2 = normalize_mode_for_comparison(te2->mode);
761 e8bfb8f3 2020-12-18 stsp if (mode1 != mode2) {
762 e8bfb8f3 2020-12-18 stsp *changed = 1;
766 e8bfb8f3 2020-12-18 stsp if (got_object_id_cmp(&te1->id, &te2->id) == 0) {
767 e8bfb8f3 2020-12-18 stsp *changed = 0;
772 3b7f9878 2018-11-18 stsp if (*s == '\0') { /* final path element */
773 07862c20 2018-09-15 stsp *changed = 1;
777 07862c20 2018-09-15 stsp seg = s + 1;
779 65a9bbe9 2018-09-15 stsp seglen = 0;
781 07862c20 2018-09-15 stsp err = got_object_open_as_tree(&next_tree1, repo,
783 07862c20 2018-09-15 stsp te1 = NULL;
786 a31cea73 2018-09-15 stsp if (tree1 != tree01)
787 a31cea73 2018-09-15 stsp got_object_tree_close(tree1);
788 07862c20 2018-09-15 stsp tree1 = next_tree1;
791 e8bfb8f3 2020-12-18 stsp err = got_object_open_as_tree(&next_tree2, repo,
793 e8bfb8f3 2020-12-18 stsp te2 = NULL;
796 e8bfb8f3 2020-12-18 stsp if (tree2 != tree02)
797 e8bfb8f3 2020-12-18 stsp got_object_tree_close(tree2);
798 e8bfb8f3 2020-12-18 stsp tree2 = next_tree2;
799 e8bfb8f3 2020-12-18 stsp } else if (tree2) {
800 e8bfb8f3 2020-12-18 stsp if (tree2 != tree02)
801 e8bfb8f3 2020-12-18 stsp got_object_tree_close(tree2);
802 e8bfb8f3 2020-12-18 stsp tree2 = NULL;
807 a31cea73 2018-09-15 stsp if (tree1 && tree1 != tree01)
808 07862c20 2018-09-15 stsp got_object_tree_close(tree1);
809 a31cea73 2018-09-15 stsp if (tree2 && tree2 != tree02)
810 07862c20 2018-09-15 stsp got_object_tree_close(tree2);
811 77880158 2018-11-04 stsp return err;
814 ed175427 2019-05-09 stsp const struct got_error *
815 ed175427 2019-05-09 stsp got_object_tree_entry_dup(struct got_tree_entry **new_te,
816 ed175427 2019-05-09 stsp struct got_tree_entry *te)
818 ed175427 2019-05-09 stsp const struct got_error *err = NULL;
820 ed175427 2019-05-09 stsp *new_te = calloc(1, sizeof(**new_te));
821 ed175427 2019-05-09 stsp if (*new_te == NULL)
822 638f9024 2019-05-13 stsp return got_error_from_errno("calloc");
824 ed175427 2019-05-09 stsp (*new_te)->mode = te->mode;
825 56e0773d 2019-11-28 stsp memcpy((*new_te)->name, te->name, sizeof((*new_te)->name));
826 56e0773d 2019-11-28 stsp memcpy(&(*new_te)->id, &te->id, sizeof((*new_te)->id));
827 8c4eabf2 2019-05-10 stsp return err;
831 56e0773d 2019-11-28 stsp got_object_tree_entry_is_submodule(struct got_tree_entry *te)
833 63c5ca5d 2019-08-24 stsp return (te->mode & S_IFMT) == (S_IFDIR | S_IFLNK);
837 e40622f4 2020-07-23 stsp got_object_tree_entry_is_symlink(struct got_tree_entry *te)
839 e40622f4 2020-07-23 stsp /* S_IFDIR check avoids confusing symlinks with submodules. */
840 e40622f4 2020-07-23 stsp return ((te->mode & (S_IFDIR | S_IFLNK)) == S_IFLNK);
843 e40622f4 2020-07-23 stsp static const struct got_error *
844 e40622f4 2020-07-23 stsp resolve_symlink(char **link_target, const char *path,
845 a44927cc 2022-04-07 stsp struct got_commit_object *commit, struct got_repository *repo)
847 e40622f4 2020-07-23 stsp const struct got_error *err = NULL;
848 dbdd6209 2020-10-19 stsp char buf[PATH_MAX];
849 e40622f4 2020-07-23 stsp char *name, *parent_path = NULL;
850 e40622f4 2020-07-23 stsp struct got_object_id *tree_obj_id = NULL;
851 e40622f4 2020-07-23 stsp struct got_tree_object *tree = NULL;
852 e40622f4 2020-07-23 stsp struct got_tree_entry *te = NULL;
854 e40622f4 2020-07-23 stsp *link_target = NULL;
856 dbdd6209 2020-10-19 stsp if (strlcpy(buf, path, sizeof(buf)) >= sizeof(buf))
857 dbdd6209 2020-10-19 stsp return got_error(GOT_ERR_NO_SPACE);
859 dbdd6209 2020-10-19 stsp name = basename(buf);
860 e40622f4 2020-07-23 stsp if (name == NULL)
861 e40622f4 2020-07-23 stsp return got_error_from_errno2("basename", path);
863 e40622f4 2020-07-23 stsp err = got_path_dirname(&parent_path, path);
865 e40622f4 2020-07-23 stsp return err;
867 a44927cc 2022-04-07 stsp err = got_object_id_by_path(&tree_obj_id, repo, commit,
868 e40622f4 2020-07-23 stsp parent_path);
870 e40622f4 2020-07-23 stsp if (err->code == GOT_ERR_NO_TREE_ENTRY) {
871 e40622f4 2020-07-23 stsp /* Display the complete path in error message. */
872 e40622f4 2020-07-23 stsp err = got_error_path(path, err->code);
877 e40622f4 2020-07-23 stsp err = got_object_open_as_tree(&tree, repo, tree_obj_id);
881 e40622f4 2020-07-23 stsp te = got_object_tree_find_entry(tree, name);
882 e40622f4 2020-07-23 stsp if (te == NULL) {
883 e40622f4 2020-07-23 stsp err = got_error_path(path, GOT_ERR_NO_TREE_ENTRY);
887 e40622f4 2020-07-23 stsp if (got_object_tree_entry_is_symlink(te)) {
888 e40622f4 2020-07-23 stsp err = got_tree_entry_get_symlink_target(link_target, te, repo);
891 e40622f4 2020-07-23 stsp if (!got_path_is_absolute(*link_target)) {
892 e40622f4 2020-07-23 stsp char *abspath;
893 e40622f4 2020-07-23 stsp if (asprintf(&abspath, "%s/%s", parent_path,
894 e40622f4 2020-07-23 stsp *link_target) == -1) {
895 e40622f4 2020-07-23 stsp err = got_error_from_errno("asprintf");
898 e40622f4 2020-07-23 stsp free(*link_target);
899 e40622f4 2020-07-23 stsp *link_target = malloc(PATH_MAX);
900 e40622f4 2020-07-23 stsp if (*link_target == NULL) {
901 e40622f4 2020-07-23 stsp err = got_error_from_errno("malloc");
904 e40622f4 2020-07-23 stsp err = got_canonpath(abspath, *link_target, PATH_MAX);
905 e40622f4 2020-07-23 stsp free(abspath);
911 b68bd9d2 2022-09-03 op free(parent_path);
912 e40622f4 2020-07-23 stsp free(tree_obj_id);
914 e40622f4 2020-07-23 stsp got_object_tree_close(tree);
916 e40622f4 2020-07-23 stsp free(*link_target);
917 e40622f4 2020-07-23 stsp *link_target = NULL;
919 e40622f4 2020-07-23 stsp return err;
922 ca6e02ac 2020-01-07 stsp const struct got_error *
923 e40622f4 2020-07-23 stsp got_object_resolve_symlinks(char **link_target, const char *path,
924 a44927cc 2022-04-07 stsp struct got_commit_object *commit, struct got_repository *repo)
926 e40622f4 2020-07-23 stsp const struct got_error *err = NULL;
927 e40622f4 2020-07-23 stsp char *next_target = NULL;
928 e40622f4 2020-07-23 stsp int max_recursion = 40; /* matches Git */
930 e40622f4 2020-07-23 stsp *link_target = NULL;
933 e40622f4 2020-07-23 stsp err = resolve_symlink(&next_target,
934 a44927cc 2022-04-07 stsp *link_target ? *link_target : path, commit, repo);
937 e40622f4 2020-07-23 stsp if (next_target) {
938 e40622f4 2020-07-23 stsp free(*link_target);
939 e40622f4 2020-07-23 stsp if (--max_recursion == 0) {
940 e40622f4 2020-07-23 stsp err = got_error_path(path, GOT_ERR_RECURSION);
941 e40622f4 2020-07-23 stsp *link_target = NULL;
944 e40622f4 2020-07-23 stsp *link_target = next_target;
946 e40622f4 2020-07-23 stsp } while (next_target);
948 e40622f4 2020-07-23 stsp return err;
952 34a842a4 2022-09-18 mark got_object_commit_retain(struct got_commit_object *commit)
954 568eae95 2022-09-11 mark commit->refcnt++;
957 13b2bc37 2022-10-23 stsp const struct got_error *
958 13b2bc37 2022-10-23 stsp got_object_raw_alloc(struct got_raw_object **obj, uint8_t *outbuf, int *outfd,
959 60c140ae 2023-01-09 stsp size_t max_in_mem_size, size_t hdrlen, off_t size)
961 13b2bc37 2022-10-23 stsp const struct got_error *err = NULL;
964 1c28a361 2022-10-25 op tot = hdrlen + size;
966 13b2bc37 2022-10-23 stsp *obj = calloc(1, sizeof(**obj));
967 13b2bc37 2022-10-23 stsp if (*obj == NULL) {
968 13b2bc37 2022-10-23 stsp err = got_error_from_errno("calloc");
971 13b2bc37 2022-10-23 stsp (*obj)->fd = -1;
972 13b2bc37 2022-10-23 stsp (*obj)->tempfile_idx = -1;
974 13b2bc37 2022-10-23 stsp if (outbuf) {
975 13b2bc37 2022-10-23 stsp (*obj)->data = outbuf;
977 13b2bc37 2022-10-23 stsp struct stat sb;
978 13b2bc37 2022-10-23 stsp if (fstat(*outfd, &sb) == -1) {
979 13b2bc37 2022-10-23 stsp err = got_error_from_errno("fstat");
983 1c28a361 2022-10-25 op if (sb.st_size != tot) {
984 e98a81e6 2023-01-09 stsp err = got_error_msg(GOT_ERR_BAD_OBJ_HDR,
985 e98a81e6 2023-01-09 stsp "raw object has unexpected size");
988 13b2bc37 2022-10-23 stsp #ifndef GOT_PACK_NO_MMAP
989 60c140ae 2023-01-09 stsp if (tot > 0 && tot <= max_in_mem_size) {
990 1c28a361 2022-10-25 op (*obj)->data = mmap(NULL, tot, PROT_READ,
991 13b2bc37 2022-10-23 stsp MAP_PRIVATE, *outfd, 0);
992 13b2bc37 2022-10-23 stsp if ((*obj)->data == MAP_FAILED) {
993 13b2bc37 2022-10-23 stsp if (errno != ENOMEM) {
994 13b2bc37 2022-10-23 stsp err = got_error_from_errno("mmap");
997 13b2bc37 2022-10-23 stsp (*obj)->data = NULL;
999 13b2bc37 2022-10-23 stsp (*obj)->fd = *outfd;
1000 13b2bc37 2022-10-23 stsp *outfd = -1;
1004 13b2bc37 2022-10-23 stsp if (*outfd != -1) {
1005 13b2bc37 2022-10-23 stsp (*obj)->f = fdopen(*outfd, "r");
1006 13b2bc37 2022-10-23 stsp if ((*obj)->f == NULL) {
1007 13b2bc37 2022-10-23 stsp err = got_error_from_errno("fdopen");
1008 13b2bc37 2022-10-23 stsp goto done;
1010 13b2bc37 2022-10-23 stsp *outfd = -1;
1013 13b2bc37 2022-10-23 stsp (*obj)->hdrlen = hdrlen;
1014 13b2bc37 2022-10-23 stsp (*obj)->size = size;
1016 13b2bc37 2022-10-23 stsp if (err) {
1017 13b2bc37 2022-10-23 stsp if (*obj) {
1018 13b2bc37 2022-10-23 stsp got_object_raw_close(*obj);
1019 13b2bc37 2022-10-23 stsp *obj = NULL;
1022 13b2bc37 2022-10-23 stsp (*obj)->refcnt++;
1023 13b2bc37 2022-10-23 stsp return err;