zstream.c 4.68 KB
Newer Older
1 2 3 4 5 6 7 8 9 10
#include "clar_libgit2.h"
#include "zstream.h"

/*
 * Sample input for the small round-trip tests. Callers pass
 * strlen(data) + 1 as the length, so the NUL terminator is compressed too.
 */
static const char *data = "This is a test test test of This is a test";

/*
 * Extra bytes allocated past the expected length in assert_zlib_equal_().
 * After inflating, exactly this many bytes must remain unused in the output
 * buffer; anything else means the inflated size was not an exact match.
 */
#define INFLATE_EXTRA 2

static void assert_zlib_equal_(
	const void *expected, size_t e_len,
	const void *compressed, size_t c_len,
11
	const char *msg, const char *file, const char *func, int line)
12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
{
	z_stream stream;
	char *expanded = git__calloc(1, e_len + INFLATE_EXTRA);
	cl_assert(expanded);

	memset(&stream, 0, sizeof(stream));
	stream.next_out  = (Bytef *)expanded;
	stream.avail_out = (uInt)(e_len + INFLATE_EXTRA);
	stream.next_in   = (Bytef *)compressed;
	stream.avail_in  = (uInt)c_len;

	cl_assert(inflateInit(&stream) == Z_OK);
	cl_assert(inflate(&stream, Z_FINISH));
	inflateEnd(&stream);

	clar__assert_equal(
28
		file, func, line, msg, 1,
29 30
		"%d", (int)stream.total_out, (int)e_len);
	clar__assert_equal(
31
		file, func, line, "Buffer len was not exact match", 1,
32 33 34 35
		"%d", (int)stream.avail_out, (int)INFLATE_EXTRA);

	clar__assert(
		memcmp(expanded, expected, e_len) == 0,
36
		file, func, line, "uncompressed data did not match", NULL, 1);
37 38 39 40 41

	git__free(expanded);
}

/*
 * Convenience wrapper around assert_zlib_equal_(): forwards the expected
 * data (E, EL) and compressed data (C, CL), supplies the call site
 * (__FILE__, __func__, __LINE__), and builds the failure message from the
 * stringified length arguments.
 */
#define assert_zlib_equal(E,EL,C,CL) \
	assert_zlib_equal_(E, EL, C, CL, #EL " != " #CL, __FILE__, __func__, (int)__LINE__)
43

44
void test_zstream__basic(void)
45 46 47 48 49
{
	git_zstream z = GIT_ZSTREAM_INIT;
	char out[128];
	size_t outlen = sizeof(out);

50
	cl_git_pass(git_zstream_init(&z, GIT_ZSTREAM_DEFLATE));
51 52 53 54 55 56 57 58 59
	cl_git_pass(git_zstream_set_input(&z, data, strlen(data) + 1));
	cl_git_pass(git_zstream_get_output(out, &outlen, &z));
	cl_assert(git_zstream_done(&z));
	cl_assert(outlen > 0);
	git_zstream_free(&z);

	assert_zlib_equal(data, strlen(data) + 1, out, outlen);
}

60
void test_zstream__fails_on_trailing_garbage(void)
61
{
62
	git_str deflated = GIT_STR_INIT, inflated = GIT_STR_INIT;
63
	char i = 0;
64 65 66 67 68 69

	/* compress a simple string */
	git_zstream_deflatebuf(&deflated, "foobar!!", 8);

	/* append some garbage */
	for (i = 0; i < 10; i++) {
70
		git_str_putc(&deflated, i);
71 72 73 74
	}

	cl_git_fail(git_zstream_inflatebuf(&inflated, deflated.ptr, deflated.size));

75 76
	git_str_dispose(&deflated);
	git_str_dispose(&inflated);
77 78
}

79
void test_zstream__buffer(void)
80
{
81
	git_str out = GIT_STR_INIT;
82 83
	cl_git_pass(git_zstream_deflatebuf(&out, data, strlen(data) + 1));
	assert_zlib_equal(data, strlen(data) + 1, out.ptr, out.size);
84
	git_str_dispose(&out);
85 86 87 88
}

/*
 * Text fragment that test_zstream__big_data() appends repeatedly to build
 * its large input.
 */
#define BIG_STRING_PART "Big Data IS Big - Long Data IS Long - We need a buffer larger than 1024 x 1024 to make sure we trigger chunked compression - Big Big Data IS Bigger than Big - Long Long Data IS Longer than Long"

89
/*
 * Round-trip `input` through each compression path and check they agree:
 *
 *  1. one-shot git_zstream_deflatebuf(), verified with zlib;
 *  2. streaming deflate into a fixed-size scratch buffer, repeated with
 *     three chunk sizes (256, fixed_size / 2, fixed_size), each verified
 *     with zlib and compared byte-for-byte against the one-shot output;
 *  3. git_zstream_inflatebuf() on the one-shot output, compared against
 *     the original input.
 */
static void compress_and_decompress_input_various_ways(git_str *input)
{
	git_str out1 = GIT_STR_INIT, out2 = GIT_STR_INIT;
	git_str inflated = GIT_STR_INIT;
	size_t i, fixed_size = max(input->size / 2, 256);
	char *fixed = git__malloc(fixed_size);
	cl_assert(fixed);

	/* compress with deflatebuf */

	cl_git_pass(git_zstream_deflatebuf(&out1, input->ptr, input->size));
	assert_zlib_equal(input->ptr, input->size, out1.ptr, out1.size);

	/* compress with various fixed size buffer (accumulating the output) */

	for (i = 0; i < 3; ++i) {
		git_zstream zs = GIT_ZSTREAM_INIT;
		size_t use_fixed_size;

		/*
		 * The last size doubles as the default so that
		 * use_fixed_size is assigned on every path.
		 */
		switch (i) {
		case 0: use_fixed_size = 256; break;
		case 1: use_fixed_size = fixed_size / 2; break;
		default: use_fixed_size = fixed_size; break;
		}
		cl_assert(use_fixed_size <= fixed_size);

		cl_git_pass(git_zstream_init(&zs, GIT_ZSTREAM_DEFLATE));
		cl_git_pass(git_zstream_set_input(&zs, input->ptr, input->size));

		/* drain the stream one chunk at a time, accumulating in out2 */
		while (!git_zstream_done(&zs)) {
			size_t written = use_fixed_size;
			cl_git_pass(git_zstream_get_output(fixed, &written, &zs));
			cl_git_pass(git_str_put(&out2, fixed, written));
		}

		git_zstream_free(&zs);
		assert_zlib_equal(input->ptr, input->size, out2.ptr, out2.size);

		/* did both approaches give the same data? */
		cl_assert_equal_sz(out1.size, out2.size);
		cl_assert(!memcmp(out1.ptr, out2.ptr, out1.size));

		git_str_dispose(&out2);
	}

	/* inflate the one-shot output and compare it with the input */
	cl_git_pass(git_zstream_inflatebuf(&inflated, out1.ptr, out1.size));
	/* sizes are size_t: use the _sz comparison, as in the loop above */
	cl_assert_equal_sz(input->size, inflated.size);
	cl_assert(memcmp(input->ptr, inflated.ptr, inflated.size) == 0);

	git_str_dispose(&out1);
	git_str_dispose(&inflated);
	git__free(fixed);
}

143
void test_zstream__big_data(void)
144
{
145
	git_str in = GIT_STR_INIT;
146 147 148 149 150
	size_t scan, target;

	for (target = 1024; target <= 1024 * 1024 * 4; target *= 8) {

		/* make a big string that's easy to compress */
151
		git_str_clear(&in);
152 153
		while (in.size < target)
			cl_git_pass(
154
				git_str_put(&in, BIG_STRING_PART, strlen(BIG_STRING_PART)));
155

156
		compress_and_decompress_input_various_ways(&in);
157 158 159 160 161 162

		/* make a big string that's hard to compress */
		srand(0xabad1dea);
		for (scan = 0; scan < in.size; ++scan)
			in.ptr[scan] = (char)rand();

163
		compress_and_decompress_input_various_ways(&in);
164
	}
165

166
	git_str_dispose(&in);
167
}