Hash :
ab525a74
Author :
Date :
2011-07-07T19:20:13
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
/*
* This file is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License, version 2,
* as published by the Free Software Foundation.
*
* In addition to the permissions in the GNU General Public License,
* the authors give you unlimited permission to link the compiled
* version of this file into combinations with other programs,
* and to distribute those combinations without any restriction
* coming from the use of this file. (The General Public License
* restrictions do apply in other respects; for example, they cover
* modification of the file, and distribution when not linked into
* a combined executable.)
*
* This file is distributed in the hope that it will be useful, but
* WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; see the file COPYING. If not, write to
* the Free Software Foundation, 51 Franklin Street, Fifth Floor,
* Boston, MA 02110-1301, USA.
*/
#include "git2/indexer.h"
#include "git2/zlib.h"
#include "common.h"
#include "pack.h"
#include "mwindow.h"
#include "posix.h"
/*
 * State carried by an indexer for the one pack file it works on.
 */
typedef struct git_indexer {
/* Pack file being indexed; git_indexer_new() stores its name and open fd here */
struct pack_file *pack;
/* Both vectors are initialised in parse_header() from the header's entry count */
git_vector objects;
git_vector deltas;
/* Filled in by the p_stat() call on the pack file path in git_indexer_new() */
struct stat st;
/* Progress counters; a pointer to these is handed to the git_indexer_run() callback */
git_indexer_stats stats;
} git_indexer;
/*
 * Read the pack header from the pack file descriptor, check its
 * signature and version, and initialise the `objects` and `deltas`
 * vectors and `stats.total` from the number of entries it announces.
 *
 * Returns GIT_SUCCESS on success. On any failure both vectors are
 * freed and the error code is returned.
 */
static int parse_header(git_indexer *idx)
{
	struct pack_header hdr;
	unsigned int nr_entries;
	int error;

	/*
	 * Verify we recognize this pack file format.
	 *
	 * NOTE(review): only a negative p_read() result is treated as a
	 * failure; whether a short read is reported that way is not
	 * visible from here -- confirm.
	 */
	if ((error = p_read(idx->pack->pack_fd, &hdr, sizeof(hdr))) < GIT_SUCCESS)
		goto cleanup;

	if (hdr.hdr_signature != htonl(PACK_SIGNATURE)) {
		error = git__throw(GIT_EOBJCORRUPTED, "Wrong pack signature");
		goto cleanup;
	}

	if (!pack_version_ok(hdr.hdr_version)) {
		error = git__throw(GIT_EOBJCORRUPTED, "Wrong pack version");
		goto cleanup;
	}

	/*
	 * The header was read straight from disk and is in network byte
	 * order (the signature above is compared against htonl()), so the
	 * entry count has to be converted before it is used as a number.
	 */
	nr_entries = ntohl(hdr.hdr_entries);

	/*
	 * FIXME: At this point we have no idea how many of the entries
	 * are deltas, so assume all objects are both until we get a
	 * better idea
	 */
	error = git_vector_init(&idx->objects, nr_entries, NULL /* FIXME: probably need something */);
	if (error < GIT_SUCCESS)
		goto cleanup;

	error = git_vector_init(&idx->deltas, nr_entries, NULL /* FIXME: probably need something */);
	if (error < GIT_SUCCESS)
		goto cleanup;

	idx->stats.total = nr_entries;

	return GIT_SUCCESS;

cleanup:
	git_vector_free(&idx->objects);
	git_vector_free(&idx->deltas);

	return error;
}
/*
 * Allocate an indexer for the pack file at `packname`, stat and open
 * the file read-only, and parse its header.
 *
 * On success the new indexer is stored in `*out` and GIT_SUCCESS is
 * returned. On failure everything acquired so far is released, `*out`
 * is left untouched and an error code is returned: GIT_ENOMEM when an
 * allocation fails, GIT_ENOTFOUND / GIT_EOSERR when the file cannot be
 * stat'ed or opened, or whatever parse_header() reported.
 */
int git_indexer_new(git_indexer **out, const char *packname)
{
	git_indexer *idx;
	size_t namelen;
	int ret, error;

	idx = git__malloc(sizeof(git_indexer));
	if (idx == NULL)
		return GIT_ENOMEM;

	memset(idx, 0x0, sizeof(*idx));

	namelen = strlen(packname);
	idx->pack = git__malloc(sizeof(struct pack_file) + namelen + 1);
	if (idx->pack == NULL) {
		/* without this the cleanup path returns an uninitialised value */
		error = GIT_ENOMEM;
		goto cleanup;
	}

	memset(idx->pack, 0x0, sizeof(struct pack_file));
	/*
	 * Copy the terminator as well: only the fixed-size part of the
	 * allocation was zeroed above, so the byte after the name is not
	 * guaranteed to be NUL otherwise.
	 */
	memcpy(idx->pack->pack_name, packname, namelen + 1);

	ret = p_stat(packname, &idx->st);
	if (ret < 0) {
		if (errno == ENOENT)
			error = git__throw(GIT_ENOTFOUND, "Failed to stat packfile. File not found");
		else
			error = git__throw(GIT_EOSERR, "Failed to stat packfile.");

		goto cleanup;
	}

	ret = p_open(idx->pack->pack_name, O_RDONLY);
	if (ret < 0) {
		error = git__throw(GIT_EOSERR, "Failed to open packfile");
		goto cleanup;
	}

	idx->pack->pack_fd = ret;

	error = parse_header(idx);
	if (error < GIT_SUCCESS) {
		error = git__rethrow(error, "Failed to parse packfile header");
		/* the descriptor is open by now; don't leak it on the way out */
		p_close(idx->pack->pack_fd);
		goto cleanup;
	}

	*out = idx;

	return GIT_SUCCESS;

cleanup:
	free(idx->pack);
	free(idx);

	return error;
}
/*
 * Parse the variable-width length and return it. Assumes that the
 * whole number exists inside the buffer. As this is the git format,
 * the first byte only contains length information in the lower nibble
 * because the higher one is used for type and continuation; every
 * following byte contributes its lower seven bits, least significant
 * group first, for as long as the previous byte had its MSB set.
 *
 * The output parameter is necessary because we don't know how long the
 * entry is actually going to be. `*bufout` is set to the last byte that
 * was consumed (not one past it).
 *
 * Length bits that would land at or beyond the width of the return
 * type are dropped instead of being shifted, since shifting by that
 * much is undefined; the continuation bytes are still consumed.
 */
static unsigned long entry_len(const char **bufout, const char *buf)
{
	/* number of value bits we can shift into; 8 bits per byte assumed */
	const unsigned int width = sizeof(unsigned long) * 8;
	const char *p = buf;
	unsigned long size, c;
	unsigned int shift = 4;

	/* read bytes as unsigned so a set MSB never sign-extends */
	c = (unsigned char)*p;
	size = c & 0xf;

	/* As long as the MSB is set, we need to continue */
	while (c & 0x80) {
		p++;
		c = (unsigned char)*p;

		if (shift < width) {
			size += (c & 0x7f) << shift;
			shift += 7;
		}
	}

	*bufout = p;

	return size;
}
/*
 * Pull the object type out of the first byte of an entry header: it
 * lives in the three bits directly below the continuation (top) bit.
 */
static git_otype entry_type(const char *buf)
{
	const int first = *buf;

	/* isolate bits 4-6, then move them down to the low end */
	return (first & 0x70) >> 4;
}
/*
 * Create the index. Every time something interesting happens
 * (something has been parsed or resolved), the callback gets called
 * with some stats so it can tell the user how hard we're working.
 *
 * `cb` may be NULL. When it is set it is called once before the first
 * entry and once after every processed entry, always with `data`
 * passed through untouched; its return value is ignored.
 *
 * Returns a negative error code if the mwindow file cannot be
 * registered, a window cannot be opened, or an entry has an
 * unrecognised type. Otherwise the (non-negative) result of the
 * registration call is returned.
 */
int git_indexer_run(git_indexer *idx, int (*cb)(const git_indexer_stats *, void *), void *data)
{
	git_mwindow_file *mwf = &idx->pack->mwf;
	git_mwindow *w = NULL;
	off_t off = 0;
	int error;
	const char *ptr;

	error = git_mwindow_file_register(mwf);
	if (error < GIT_SUCCESS)
		return git__rethrow(error, "Failed to register mwindow file");

	/* Notify before the first one */
	if (cb)
		cb(&idx->stats, data);

	while (idx->stats.processed < idx->stats.total) {
		const char *hdr_last;
		unsigned long size;
		git_otype type;

		/*
		 * 4k is a bit magic for the moment.
		 *
		 * NOTE(review): `off` is never advanced in this loop, so every
		 * iteration opens the window at offset 0 again.
		 */
		ptr = git_mwindow_open(mwf, &w, idx->pack->pack_fd, 4096, off, 0, NULL);
		if (ptr == NULL) {
			error = GIT_ENOMEM;
			goto cleanup;
		}

		/*
		 * The size is when expanded, so we need to inflate the object
		 * so we know where the next one is.
		 *
		 * The end-of-header pointer goes into a local: it must not be
		 * written through `data`, which belongs to the caller and is
		 * handed back to the callback below.
		 */
		type = entry_type(ptr);
		size = entry_len(&hdr_last, ptr);

		switch (type) {
		case GIT_OBJ_COMMIT:
		case GIT_OBJ_TREE:
		case GIT_OBJ_BLOB:
		case GIT_OBJ_TAG:
			break;
		default:
			error = git__throw(GIT_EOBJCORRUPTED, "Invalid object type");
			goto cleanup;
		}

		/*
		 * Do we need to uncompress everything if we're not running in
		 * strict mode? Or at least can't we free the data?
		 */

		/*
		 * TODO: get a window for the compressed data that follows the
		 * header. `size` and `hdr_last` are parsed for that step but
		 * are not consumed yet.
		 */
		(void)size;
		(void)hdr_last;

		idx->stats.processed++;

		if (cb)
			cb(&idx->stats, data);
	}

cleanup:
	git_mwindow_free_all(mwf);

	return error;
}
/*
 * Tear down an indexer: close the pack file descriptor, free both
 * vectors, then release the pack structure and the indexer itself.
 * Passing NULL is a no-op.
 */
void git_indexer_free(git_indexer *idx)
{
	if (idx == NULL)
		return;

	p_close(idx->pack->pack_fd);
	git_vector_free(&idx->objects);
	git_vector_free(&idx->deltas);
	free(idx->pack);
	free(idx);
}