/*
 * Copyright (C) the libgit2 contributors. All rights reserved.
 *
 * This file is part of libgit2, distributed under the GNU GPL v2 with
 * a Linking Exception. For full terms see the included COPYING file.
 */

#ifndef INCLUDE_pack_h__
#define INCLUDE_pack_h__

11 12
#include "common.h"

13 14
#include "git2/oid.h"

15
#include "array.h"
16 17
#include "map.h"
#include "mwindow.h"
18
#include "odb.h"
19
#include "offmap.h"
20
#include "oidmap.h"
21
#include "zstream.h"
22

23 24
/*
 * Octal permission bits: read-only for owner, group and others.
 * NOTE(review): presumably the mode applied to pack files on disk;
 * confirm against the callers.
 */
#define GIT_PACK_FILE_MODE 0444

#define PACK_SIGNATURE 0x5041434b	/* "PACK" */
#define PACK_VERSION 2

/*
 * True when `v` is pack version 2 or 3. The comparison is made against
 * htonl()-converted constants, so `v` must be in network byte order.
 * `v` is evaluated twice; do not pass an expression with side effects.
 */
#define pack_version_ok(v) ((v) == htonl(2) || (v) == htonl(3))
28
/*
 * Packfile header: three consecutive 32-bit words.
 * NOTE(review): pack_version_ok() compares against htonl() values, so
 * these fields presumably hold the raw network-byte-order words as read
 * from the file; confirm against the reader in pack.c.
 */
struct git_pack_header {
	uint32_t hdr_signature; /* expected to match PACK_SIGNATURE */
	uint32_t hdr_version;
	uint32_t hdr_entries;
};

/*
 * The first four bytes of index formats later than version 1 should
 * start with this signature, as all older git binaries would find this
 * value illegal and abort reading the file.
 *
 * This is the case because the number of objects in a packfile
 * cannot exceed 1,431,660,000 as every object would need at least
 * 3 bytes of data and the overall packfile cannot exceed 4 GiB with
 * version 1 of the index file due to the offsets limited to 32 bits.
 * Clearly the signature exceeds this maximum.
 *
 * Very old git binaries will also compare the first 4 bytes to the
 * next 4 bytes in the index and abort with a "non-monotonic index"
 * error if the second 4 byte word is smaller than the first 4
 * byte word. This would be true in the proposed future index
 * format as idx_signature would be greater than idx_version.
 */

#define PACK_IDX_SIGNATURE 0xff744f63	/* "\377tOc" */

54
/*
 * Leading two 32-bit words of a pack index file in a format later than
 * version 1: the signature followed by the index version.
 */
struct git_pack_idx_header {
	uint32_t idx_signature; /* expected to match PACK_IDX_SIGNATURE */
	uint32_t idx_version;
};

59
typedef struct git_pack_cache_entry {
60
	size_t last_usage; /* enough? */
61
	git_atomic refcount;
62 63 64
	git_rawobj raw;
} git_pack_cache_entry;

65
struct pack_chain_elem {
66 67
	off64_t base_key;
	off64_t offset;
68
	size_t size;
69
	git_object_t type;
70 71 72 73
};

typedef git_array_t(struct pack_chain_elem) git_dependency_chain;

74 75
/*
 * Pack cache limits, in bytes. The expansions are parenthesized so the
 * macros behave as single values inside larger expressions (e.g. as the
 * right-hand operand of `/` or `%`).
 */
#define GIT_PACK_CACHE_MEMORY_LIMIT (16 * 1024 * 1024)
#define GIT_PACK_CACHE_SIZE_LIMIT (1024 * 1024) /* don't bother caching anything over 1MB */
76 77 78 79

typedef struct {
	size_t memory_used;
	size_t memory_limit;
80
	size_t use_ctr;
81 82 83 84
	git_mutex lock;
	git_offmap *entries;
} git_pack_cache;

85
struct git_pack_file {
86 87
	git_mwindow_file mwf;
	git_map index_map;
Russell Belfer committed
88
	git_mutex lock; /* protect updates to mwf and index_map */
89
	git_atomic refcount;
90 91 92 93 94 95 96

	uint32_t num_objects;
	uint32_t num_bad_objects;
	git_oid *bad_object_sha1; /* array of git_oid */

	int index_version;
	git_time_t mtime;
97
	unsigned pack_local:1, pack_keep:1, has_cache:1;
98
	git_oidmap *idx_cache;
99
	git_oid **oids;
100

101
	git_pack_cache bases; /* delta base cache */
102

103 104
	time_t last_freshen; /* last time the packfile was freshened */

105 106 107 108
	/* something like ".git/objects/pack/xxxxx.pack" */
	char pack_name[GIT_FLEX_ARRAY]; /* more */
};

109 110 111 112 113 114 115 116 117 118 119 120 121
/**
 * Binary-search the OID Lookup Table of an .idx file, restricted to the
 * indices between lo and hi, and return the position at which the given
 * OID (or OID prefix) would be inserted.
 *
 * The caller supplies the stride because the table layout depends on the
 * index version: version 1 files interleave each OID with the 4-byte
 * offset of the object within the .pack file (stride = 24), while
 * version 2 files keep the OIDs in one contiguous flat array
 * (stride = 20).
 */
int git_pack__lookup_sha1(
		const void *oid_lookup_table,
		size_t stride,
		unsigned lo,
		unsigned hi,
		const unsigned char *oid_prefix);

122
struct git_pack_entry {
123
	off64_t offset;
124
	git_oid sha1;
125
	struct git_pack_file *p;
126 127
};

128
typedef struct git_packfile_stream {
129
	off64_t curpos;
130
	int done;
131
	git_zstream zstream;
132 133 134 135
	struct git_pack_file *p;
	git_mwindow *mw;
} git_packfile_stream;

136
/*
 * Takes a byte buffer plus an object size and type, and returns a size_t.
 * NOTE(review): presumably encodes the pack object header for
 * (size, type) into hdr and returns the number of bytes written; the
 * definition is not visible in this header, so confirm in pack.c.
 */
size_t git_packfile__object_header(
		unsigned char *hdr,
		size_t size,
		git_object_t type);
137

138 139
/*
 * Produces a string through `out` from the given path and returns an int
 * status.
 * NOTE(review): ownership of *out and the exact name derivation are
 * defined in pack.c, not visible here; confirm before relying on them.
 */
int git_packfile__name(
		char **out,
		const char *path);

140 141
int git_packfile_unpack_header(
		size_t *size_p,
142
		git_object_t *type_p,
143 144
		git_mwindow_file *mwf,
		git_mwindow **w_curs,
145
		off64_t *curpos);
146

147 148
int git_packfile_resolve_header(
		size_t *size_p,
149
		git_object_t *type_p,
150
		struct git_pack_file *p,
151
		off64_t offset);
152

153
/*
 * Fills `obj` from pack `p`, starting at the offset passed by pointer in
 * obj_offset.
 * NOTE(review): *obj_offset is presumably updated by the call, and the
 * caller presumably owns the data placed in obj; confirm in pack.c.
 */
int git_packfile_unpack(
		git_rawobj *obj,
		struct git_pack_file *p,
		off64_t *obj_offset);
154

155
/*
 * Streaming interface over a git_packfile_stream: open it on pack `p` at
 * position `curpos`, read up to `len` bytes into `buffer`, then dispose
 * of it.
 * NOTE(review): the meaning of the ssize_t return (bytes read versus a
 * negative error) is defined in pack.c; confirm there.
 */
int git_packfile_stream_open(git_packfile_stream *obj, struct git_pack_file *p, off64_t curpos);
ssize_t git_packfile_stream_read(git_packfile_stream *obj, void *buffer, size_t len);
void git_packfile_stream_dispose(git_packfile_stream *obj);
158

159 160 161 162 163 164
/*
 * Reports a delta base offset through delta_base_out for the delta object
 * of the given type located at delta_obj_offset in pack `p`, using the
 * window cursor and the position passed by pointer.
 * NOTE(review): unlike its neighbours this function has no git_ prefix;
 * renaming it would break existing callers, so it is left as is.
 */
int get_delta_base(
		off64_t *delta_base_out,
		struct git_pack_file *p,
		git_mwindow **w_curs,
		off64_t *curpos,
		git_object_t type,
		off64_t delta_obj_offset);
166

167
/*
 * Packfile lifecycle: git_packfile_alloc() hands back a new
 * git_pack_file for `path` through pack_out, git_packfile_close() closes
 * one (with a flag named unlink_packfile), and git_packfile_free()
 * releases it.
 * NOTE(review): whether free implies close, and what exactly is unlinked,
 * is defined in pack.c; confirm there.
 */
void git_packfile_close(struct git_pack_file *p, bool unlink_packfile);
void git_packfile_free(struct git_pack_file *p);
int git_packfile_alloc(struct git_pack_file **pack_out, const char *path);

171 172 173 174
/*
 * Looks up an object in pack `p` by a (possibly abbreviated) OID and
 * fills in `e`.
 * NOTE(review): `len` is presumably the number of significant hex digits
 * of short_oid; confirm in pack.c.
 */
int git_pack_entry_find(
		struct git_pack_entry *e,
		struct git_pack_file *p,
		const git_oid *short_oid,
		size_t len);
176 177
int git_pack_foreach_entry(
		struct git_pack_file *p,
178
		git_odb_foreach_cb cb,
179
		void *data);
180

181
#endif