Edit

thodg/got/lib/object.c

Branch :

  • Show log

    Commit

  • Author : Stefan Sperling
    Date : 2018-09-08 16:40:28
    Hash : ad242220
    Message : implement fork+exec (and by the way, fix the build...)

  • lib/object.c
  • /*
     * Copyright (c) 2018 Stefan Sperling <stsp@openbsd.org>
     *
     * Permission to use, copy, modify, and distribute this software for any
     * purpose with or without fee is hereby granted, provided that the above
     * copyright notice and this permission notice appear in all copies.
     *
     * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
     * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
     * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
     * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
     * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
     * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
     * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
     */
    
    #include <sys/types.h>
    #include <sys/stat.h>
    #include <sys/queue.h>
    #include <sys/uio.h>
    #include <sys/socket.h>
    #include <sys/wait.h>
    
    #include <errno.h>
    #include <fcntl.h>
    #include <stdio.h>
    #include <stdlib.h>
    #include <string.h>
    #include <stdint.h>
    #include <sha1.h>
    #include <zlib.h>
    #include <ctype.h>
    #include <limits.h>
    #include <imsg.h>
    #include <time.h>
    
    #include "got_error.h"
    #include "got_object.h"
    #include "got_repository.h"
    #include "got_opentemp.h"
    
    #include "got_lib_sha1.h"
    #include "got_lib_delta.h"
    #include "got_lib_pack.h"
    #include "got_lib_path.h"
    #include "got_lib_inflate.h"
    #include "got_lib_object.h"
    #include "got_lib_privsep.h"
    #include "got_lib_object_parse.h"
    #include "got_lib_repository.h"
    
    #ifndef MIN
    #define	MIN(_a,_b) ((_a) < (_b) ? (_a) : (_b))
    #endif
    
    const struct got_error *
    got_object_id_str(char **outbuf, struct got_object_id *id)
    {
    	static const size_t len = SHA1_DIGEST_STRING_LENGTH;
    
    	*outbuf = malloc(len);
    	if (*outbuf == NULL)
    		return got_error_from_errno();
    
    	if (got_sha1_digest_to_str(id->sha1, *outbuf, len) == NULL) {
    		free(*outbuf);
    		*outbuf = NULL;
    		return got_error(GOT_ERR_BAD_OBJ_ID_STR);
    	}
    
    	return NULL;
    }
    
    int
    got_object_id_cmp(struct got_object_id *id1, struct got_object_id *id2)
    {
    	return memcmp(id1->sha1, id2->sha1, SHA1_DIGEST_LENGTH);
    }
    
    struct got_object_id *
    got_object_id_dup(struct got_object_id *id1)
    {
    	struct got_object_id *id2;
    
    	id2 = malloc(sizeof(*id2));
    	if (id2 == NULL)
    		return NULL;
    	memcpy(id2, id1, sizeof(*id2));
    	return id2;
    }
    
    struct got_object_id *
    got_object_get_id(struct got_object *obj)
    {
    	return got_object_id_dup(&obj->id);
    }
    
    const struct got_error *
    got_object_get_id_str(char **outbuf, struct got_object *obj)
    {
    	return got_object_id_str(outbuf, &obj->id);
    }
    
    int
    got_object_get_type(struct got_object *obj)
    {
    	switch (obj->type) {
    	case GOT_OBJ_TYPE_COMMIT:
    	case GOT_OBJ_TYPE_TREE:
    	case GOT_OBJ_TYPE_BLOB:
    	case GOT_OBJ_TYPE_TAG:
    		return obj->type;
    	default:
    		abort();
    		break;
    	}
    
    	/* not reached */
    	return 0;
    }
    
    static const struct got_error *
    object_path(char **path, struct got_object_id *id, struct got_repository *repo)
    {
    	const struct got_error *err = NULL;
    	char *hex = NULL;
    	char *path_objects = got_repo_get_path_objects(repo);
    
    	*path = NULL;
    
    	if (path_objects == NULL)
    		return got_error_from_errno();
    
    	err = got_object_id_str(&hex, id);
    	if (err)
    		goto done;
    
    	if (asprintf(path, "%s/%.2x/%s", path_objects,
    	    id->sha1[0], hex + 2) == -1)
    		err = got_error_from_errno();
    
    done:
    	free(hex);
    	free(path_objects);
    	return err;
    }
    
    static const struct got_error *
    open_loose_object(int *fd, struct got_object *obj, struct got_repository *repo)
    {
    	const struct got_error *err = NULL;
    	char *path;
    
    	err = object_path(&path, &obj->id, repo);
    	if (err)
    		return err;
    	*fd = open(path, O_RDONLY | O_NOFOLLOW, GOT_DEFAULT_FILE_MODE);
    	if (*fd == -1) {
    		err = got_error_from_errno();
    		goto done;
    	}
    done:
    	free(path);
    	return err;
    }
    
    const struct got_error *
    got_object_open(struct got_object **obj, struct got_repository *repo,
        struct got_object_id *id)
    {
    	const struct got_error *err = NULL;
    	char *path;
    	int fd;
    
    	*obj = got_repo_get_cached_object(repo, id);
    	if (*obj != NULL) {
    		(*obj)->refcnt++;
    		return NULL;
    	}
    
    	err = object_path(&path, id, repo);
    	if (err)
    		return err;
    
    	fd = open(path, O_RDONLY | O_NOFOLLOW, GOT_DEFAULT_FILE_MODE);
    	if (fd == -1) {
    		if (errno != ENOENT) {
    			err = got_error_from_errno();
    			goto done;
    		}
    		err = got_packfile_open_object(obj, id, repo);
    		if (err)
    			goto done;
    		if (*obj == NULL)
    			err = got_error(GOT_ERR_NO_OBJ);
    	} else {
    		err = got_object_read_header_privsep(obj, repo, fd);
    		if (err)
    			goto done;
    		memcpy((*obj)->id.sha1, id->sha1, SHA1_DIGEST_LENGTH);
    	}
    
    	if (err == NULL) {
    		(*obj)->refcnt++;
    		err = got_repo_cache_object(repo, id, *obj);
    	}
    done:
    	free(path);
    	if (fd != -1)
    		close(fd);
    	return err;
    
    }
    
    const struct got_error *
    got_object_open_by_id_str(struct got_object **obj, struct got_repository *repo,
        const char *id_str)
    {
    	struct got_object_id id;
    
    	if (!got_parse_sha1_digest(id.sha1, id_str))
    		return got_error(GOT_ERR_BAD_OBJ_ID_STR);
    
    	return got_object_open(obj, repo, &id);
    }
    
    const struct got_error *
    got_object_open_as_commit(struct got_commit_object **commit,
        struct got_repository *repo, struct got_object_id *id)
    {
    	const struct got_error *err;
    	struct got_object *obj;
    
    	*commit = NULL;
    
    	err = got_object_open(&obj, repo, id);
    	if (err)
    		return err;
    	if (got_object_get_type(obj) != GOT_OBJ_TYPE_COMMIT) {
    		err = got_error(GOT_ERR_OBJ_TYPE);
    		goto done;
    	}
    
    	err = got_object_commit_open(commit, repo, obj);
    done:
    	got_object_close(obj);
    	return err;
    }
    
    const struct got_error *
    got_object_qid_alloc(struct got_object_qid **qid, struct got_object_id *id)
    {
    	const struct got_error *err = NULL;
    
    	*qid = calloc(1, sizeof(**qid));
    	if (*qid == NULL)
    		return got_error_from_errno();
    
    	(*qid)->id = got_object_id_dup(id);
    	if ((*qid)->id == NULL) {
    		err = got_error_from_errno();
    		got_object_qid_free(*qid);
    		*qid = NULL;
    		return err;
    	}
    
    	return NULL;
    }
    
    const struct got_error *
    got_object_commit_open(struct got_commit_object **commit,
        struct got_repository *repo, struct got_object *obj)
    {
    	const struct got_error *err = NULL;
    
    	*commit = got_repo_get_cached_commit(repo, &obj->id);
    	if (*commit != NULL) {
    		(*commit)->refcnt++;
    		return NULL;
    	}
    
    	if (obj->type != GOT_OBJ_TYPE_COMMIT)
    		return got_error(GOT_ERR_OBJ_TYPE);
    
    	if (obj->flags & GOT_OBJ_FLAG_PACKED) {
    		uint8_t *buf;
    		size_t len;
    		err = got_packfile_extract_object_to_mem(&buf, &len, obj, repo);
    		if (err)
    			return err;
    		obj->size = len;
    		err = got_object_parse_commit(commit, buf, len);
    		free(buf);
    	} else {
    		int fd;
    		err = open_loose_object(&fd, obj, repo);
    		if (err)
    			return err;
    		err = got_object_read_commit_privsep(commit, obj, fd, repo);
    		close(fd);
    	}
    
    	if (err == NULL) {
    		(*commit)->refcnt++;
    		err = got_repo_cache_commit(repo, &obj->id, *commit);
    	}
    
    	return err;
    }
    
    const struct got_error *
    got_object_tree_open(struct got_tree_object **tree,
        struct got_repository *repo, struct got_object *obj)
    {
    	const struct got_error *err = NULL;
    
    	*tree = got_repo_get_cached_tree(repo, &obj->id);
    	if (*tree != NULL) {
    		(*tree)->refcnt++;
    		return NULL;
    	}
    
    	if (obj->type != GOT_OBJ_TYPE_TREE)
    		return got_error(GOT_ERR_OBJ_TYPE);
    
    	if (obj->flags & GOT_OBJ_FLAG_PACKED) {
    		uint8_t *buf;
    		size_t len;
    		err = got_packfile_extract_object_to_mem(&buf, &len, obj, repo);
    		if (err)
    			return err;
    		obj->size = len;
    		err = got_object_parse_tree(tree, buf, len);
    		free(buf);
    	} else {
    		int fd;
    		err = open_loose_object(&fd, obj, repo);
    		if (err)
    			return err;
    		err = got_object_read_tree_privsep(tree, obj, fd, repo);
    		close(fd);
    	}
    
    	if (err == NULL) {
    		(*tree)->refcnt++;
    		err = got_repo_cache_tree(repo, &obj->id, *tree);
    	}
    
    	return err;
    }
    
    const struct got_error *
    got_object_open_as_tree(struct got_tree_object **tree,
        struct got_repository *repo, struct got_object_id *id)
    {
    	const struct got_error *err;
    	struct got_object *obj;
    
    	*tree = NULL;
    
    	err = got_object_open(&obj, repo, id);
    	if (err)
    		return err;
    	if (got_object_get_type(obj) != GOT_OBJ_TYPE_TREE) {
    		err = got_error(GOT_ERR_OBJ_TYPE);
    		goto done;
    	}
    
    	err = got_object_tree_open(tree, repo, obj);
    done:
    	got_object_close(obj);
    	return err;
    }
    
    const struct got_tree_entries *
    got_object_tree_get_entries(struct got_tree_object *tree)
    {
    	return &tree->entries;
    }
    
    const struct got_error *
    got_object_blob_open(struct got_blob_object **blob,
        struct got_repository *repo, struct got_object *obj, size_t blocksize)
    {
    	const struct got_error *err = NULL;
    
    	if (obj->type != GOT_OBJ_TYPE_BLOB)
    		return got_error(GOT_ERR_OBJ_TYPE);
    
    	if (blocksize < obj->hdrlen)
    		return got_error(GOT_ERR_NO_SPACE);
    
    	*blob = calloc(1, sizeof(**blob));
    	if (*blob == NULL)
    		return got_error_from_errno();
    
    	(*blob)->read_buf = malloc(blocksize);
    	if ((*blob)->read_buf == NULL) {
    		err = got_error_from_errno();
    		goto done;
    	}
    	if (obj->flags & GOT_OBJ_FLAG_PACKED) {
    		err = got_packfile_extract_object(&((*blob)->f), obj, repo);
    		if (err)
    			goto done;
    	} else {
    		int infd, outfd;
    		size_t size;
    		struct stat sb;
    
    		err = open_loose_object(&infd, obj, repo);
    		if (err)
    			goto done;
    
    
    		outfd = got_opentempfd();
    		if (outfd == -1) {
    			err = got_error_from_errno();
    			close(infd);
    			goto done;
    		}
    
    		err = got_object_read_blob_privsep(&size, outfd, infd, repo);
    		close(infd);
    		if (err)
    			goto done;
    
    		if (size != obj->hdrlen + obj->size) {
    			err = got_error(GOT_ERR_PRIVSEP_LEN);
    			close(outfd);
    			goto done;
    		}
    
    		if (fstat(outfd, &sb) == -1) {
    			err = got_error_from_errno();
    			close(outfd);
    			goto done;
    		}
    
    		if (sb.st_size != size) {
    			err = got_error(GOT_ERR_PRIVSEP_LEN);
    			close(outfd);
    			goto done;
    		}
    
    		(*blob)->f = fdopen(outfd, "rb");
    		if ((*blob)->f == NULL) {
    			err = got_error_from_errno();
    			close(outfd);
    			goto done;
    		}
    	}
    
    	(*blob)->hdrlen = obj->hdrlen;
    	(*blob)->blocksize = blocksize;
    	memcpy(&(*blob)->id.sha1, obj->id.sha1, SHA1_DIGEST_LENGTH);
    
    done:
    	if (err && *blob) {
    		if ((*blob)->f)
    			fclose((*blob)->f);
    		free((*blob)->read_buf);
    		free(*blob);
    		*blob = NULL;
    	}
    	return err;
    }
    
    const struct got_error *
    got_object_open_as_blob(struct got_blob_object **blob,
        struct got_repository *repo, struct got_object_id *id,
        size_t blocksize)
    {
    	const struct got_error *err;
    	struct got_object *obj;
    
    	*blob = NULL;
    
    	err = got_object_open(&obj, repo, id);
    	if (err)
    		return err;
    	if (got_object_get_type(obj) != GOT_OBJ_TYPE_BLOB) {
    		err = got_error(GOT_ERR_OBJ_TYPE);
    		goto done;
    	}
    
    	err = got_object_blob_open(blob, repo, obj, blocksize);
    done:
    	got_object_close(obj);
    	return err;
    }
    
    void
    got_object_blob_close(struct got_blob_object *blob)
    {
    	free(blob->read_buf);
    	fclose(blob->f);
    	free(blob);
    }
    
    char *
    got_object_blob_id_str(struct got_blob_object *blob, char *buf, size_t size)
    {
    	return got_sha1_digest_to_str(blob->id.sha1, buf, size);
    }
    
    size_t
    got_object_blob_get_hdrlen(struct got_blob_object *blob)
    {
    	return blob->hdrlen;
    }
    
    const uint8_t *
    got_object_blob_get_read_buf(struct got_blob_object *blob)
    {
    	return blob->read_buf;
    }
    
    const struct got_error *
    got_object_blob_read_block(size_t *outlenp, struct got_blob_object *blob)
    {
    	size_t n;
    
    	n = fread(blob->read_buf, 1, blob->blocksize, blob->f);
    	if (n == 0 && ferror(blob->f))
    		return got_ferror(blob->f, GOT_ERR_IO);
    	*outlenp = n;
    	return NULL;
    }
    
    const struct got_error *
    got_object_blob_dump_to_file(size_t *total_len, size_t *nlines,
        FILE *outfile, struct got_blob_object *blob)
    {
    	const struct got_error *err = NULL;
    	size_t len, hdrlen;
    	const uint8_t *buf;
    	int i;
    
    	if (total_len)
    		*total_len = 0;
    	if (nlines)
    		*nlines = 0;
    
    	hdrlen = got_object_blob_get_hdrlen(blob);
    	do {
    		err = got_object_blob_read_block(&len, blob);
    		if (err)
    			return err;
    		if (len == 0)
    			break;
    		if (total_len)
    			*total_len += len;
    		buf = got_object_blob_get_read_buf(blob);
    		if (nlines) {
    			for (i = 0; i < len; i++) {
    				if (buf[i] == '\n')
    					(*nlines)++;
    			}
    		}
    		/* Skip blob object header first time around. */
    		fwrite(buf + hdrlen, len - hdrlen, 1, outfile);
    		hdrlen = 0;
    	} while (len != 0);
    
    	fflush(outfile);
    	rewind(outfile);
    
    	return NULL;
    }
    
    static struct got_tree_entry *
    find_entry_by_name(struct got_tree_object *tree, const char *name)
    {
    	struct got_tree_entry *te;
    
    	SIMPLEQ_FOREACH(te, &tree->entries.head, entry) {
    		if (strcmp(te->name, name) == 0)
    			return te;
    	}
    	return NULL;
    }
    
    const struct got_error *
    got_object_open_by_path(struct got_object **obj, struct got_repository *repo,
        struct got_object_id *commit_id, const char *path)
    {
    	const struct got_error *err = NULL;
    	struct got_commit_object *commit = NULL;
    	struct got_tree_object *tree = NULL;
    	struct got_tree_entry *te = NULL;
    	char *seg, *s, *s0 = NULL;
    	size_t len = strlen(path);
    
    	*obj = NULL;
    
    	/* We are expecting an absolute in-repository path. */
    	if (path[0] != '/')
    		return got_error(GOT_ERR_NOT_ABSPATH);
    
    	err = got_object_open_as_commit(&commit, repo, commit_id);
    	if (err)
    		goto done;
    
    	/* Handle opening of root of commit's tree. */
    	if (path[1] == '\0') {
    		err = got_object_open(obj, repo, commit->tree_id);
    		goto done;
    	}
    
    	err = got_object_open_as_tree(&tree, repo, commit->tree_id);
    	if (err)
    		goto done;
    
    	s0 = strdup(path);
    	if (s0 == NULL) {
    		err = got_error_from_errno();
    		goto done;
    	}
    	err = got_canonpath(path, s0, len + 1);
    	if (err)
    		goto done;
    
    	s = s0;
    	s++; /* skip leading '/' */
    	len--;
    	seg = s;
    	while (len > 0) {
    		struct got_tree_object *next_tree;
    
    		if (*s != '/') {
    			s++;
    			len--;
    			if (*s)
    				continue;
    		}
    
    		/* end of path segment */
    		*s = '\0';
    
    		te = find_entry_by_name(tree, seg);
    		if (te == NULL) {
    			err = got_error(GOT_ERR_NO_OBJ);
    			goto done;
    		}
    
    		if (len == 0)
    			break;
    
    		seg = s + 1;
    		s++;
    		len--;
    		if (*s) {
    			err = got_object_open_as_tree(&next_tree, repo,
    			    te->id);
    			te = NULL;
    			if (err)
    				goto done;
    			got_object_tree_close(tree);
    			tree = next_tree;
    		}
    	}
    
    	if (te)
    		err = got_object_open(obj, repo, te->id);
    	else
    		err = got_error(GOT_ERR_NO_OBJ);
    done:
    	free(s0);
    	if (commit)
    		got_object_commit_close(commit);
    	if (tree)
    		got_object_tree_close(tree);
    	return err;
    }