1 // (C) Copyright 2008 CodeRage, LLC (turkanis at coderage dot com)
2 // (C) Copyright 2004-2007 Jonathan Turkanis
3 // Distributed under the Boost Software License, Version 1.0. (See accompanying
4 // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt.)
5
6 // See http://www.boost.org/libs/iostreams for documentation.
7
8 #include <cstddef>
9 #include <string>
10 #include <boost/iostreams/copy.hpp>
11 #include <boost/iostreams/device/array.hpp>
12 #include <boost/iostreams/device/back_inserter.hpp>
13 #include <boost/iostreams/filter/gzip.hpp>
14 #include <boost/iostreams/filter/test.hpp>
15 #include <boost/iostreams/filtering_stream.hpp>
16 #include <boost/ref.hpp>
17 #include <boost/range/iterator_range.hpp>
18 #include <boost/test/test_tools.hpp>
19 #include <boost/test/unit_test.hpp>
20 #include "detail/sequence.hpp"
21 #include "detail/verification.hpp"
22
23 using namespace boost;
24 using namespace boost::iostreams;
25 using namespace boost::iostreams::test;
26 namespace io = boost::iostreams;
27 using boost::unit_test::test_suite;
28
29 struct gzip_alloc : std::allocator<char> {
gzip_allocgzip_alloc30 gzip_alloc() { }
gzip_allocgzip_alloc31 gzip_alloc(const gzip_alloc& other) { }
32 template<typename T>
gzip_allocgzip_alloc33 gzip_alloc(const std::allocator<T>& other) { }
34 };
35
compression_test()36 void compression_test()
37 {
38 text_sequence data;
39
40 // Test compression and decompression with metadata
41 for (int i = 0; i < 4; ++i) {
42 gzip_params params;
43 if (i & 1) {
44 params.file_name = "original file name";
45 }
46 if (i & 2) {
47 params.comment = "detailed file description";
48 }
49 gzip_compressor out(params);
50 gzip_decompressor in;
51 BOOST_CHECK(
52 test_filter_pair( boost::ref(out),
53 boost::ref(in),
54 std::string(data.begin(), data.end()) )
55 );
56 BOOST_CHECK(in.file_name() == params.file_name);
57 BOOST_CHECK(in.comment() == params.comment);
58 }
59
60 // Test compression and decompression with custom allocator
61 BOOST_CHECK(
62 test_filter_pair( basic_gzip_compressor<gzip_alloc>(),
63 basic_gzip_decompressor<gzip_alloc>(),
64 std::string(data.begin(), data.end()) )
65 );
66 }
67
multiple_member_test()68 void multiple_member_test()
69 {
70 text_sequence data;
71 std::vector<char> temp, dest;
72
73 // Write compressed data to temp, twice in succession
74 filtering_ostream out;
75 out.push(gzip_compressor());
76 out.push(io::back_inserter(temp));
77 io::copy(make_iterator_range(data), out);
78 out.push(io::back_inserter(temp));
79 io::copy(make_iterator_range(data), out);
80
81 // Read compressed data from temp into dest
82 filtering_istream in;
83 in.push(gzip_decompressor());
84 in.push(array_source(&temp[0], temp.size()));
85 io::copy(in, io::back_inserter(dest));
86
87 // Check that dest consists of two copies of data
88 BOOST_REQUIRE_EQUAL(data.size() * 2, dest.size());
89 BOOST_CHECK(std::equal(data.begin(), data.end(), dest.begin()));
90 BOOST_CHECK(std::equal(data.begin(), data.end(), dest.begin() + dest.size() / 2));
91
92 dest.clear();
93 io::copy(
94 array_source(&temp[0], temp.size()),
95 io::compose(gzip_decompressor(), io::back_inserter(dest)));
96
97 // Check that dest consists of two copies of data
98 BOOST_REQUIRE_EQUAL(data.size() * 2, dest.size());
99 BOOST_CHECK(std::equal(data.begin(), data.end(), dest.begin()));
100 BOOST_CHECK(std::equal(data.begin(), data.end(), dest.begin() + dest.size() / 2));
101 }
102
array_source_test()103 void array_source_test()
104 {
105 std::string data = "simple test string.";
106 std::string encoded;
107
108 filtering_ostream out;
109 out.push(gzip_compressor());
110 out.push(io::back_inserter(encoded));
111 io::copy(make_iterator_range(data), out);
112
113 std::string res;
114 io::array_source src(encoded.data(),encoded.length());
115 io::copy(io::compose(io::gzip_decompressor(), src), io::back_inserter(res));
116
117 BOOST_CHECK_EQUAL(data, res);
118 }
119
120 #if defined(BOOST_MSVC)
121 # pragma warning(push)
122 # pragma warning(disable:4309) // Truncation of constant value
123 #endif
124
header_test()125 void header_test()
126 {
127 // This test is in response to https://svn.boost.org/trac/boost/ticket/5908
128 // which describes a problem parsing gzip headers with extra fields as
129 // defined in RFC 1952 (http://www.ietf.org/rfc/rfc1952.txt).
130 // The extra field data used here is characteristic of the tabix file
131 // format (http://samtools.sourceforge.net/tabix.shtml).
132 const char header_bytes[] = {
133 static_cast<char>(gzip::magic::id1),
134 static_cast<char>(gzip::magic::id2),
135 gzip::method::deflate, // Compression Method: deflate
136 gzip::flags::extra | gzip::flags::name | gzip::flags::comment, // flags
137 '\x22', '\x9c', '\xf3', '\x4e', // 4 byte modification time (little endian)
138 gzip::extra_flags::best_compression, // XFL
139 gzip::os_unix, // OS
140 6, 0, // 2 byte length of extra field (little endian, 6 bytes)
141 'B', 'C', 2, 0, 0, 0, // 6 bytes worth of extra field data
142 'a', 'b', 'c', 0, // original filename, null terminated
143 'n', 'o', ' ', 'c', 'o', 'm', 'm', 'e', 'n', 't', 0, // comment
144 };
145 size_t sz = sizeof(header_bytes)/sizeof(header_bytes[0]);
146
147 boost::iostreams::detail::gzip_header hdr;
148 for (size_t i = 0; i < sz; ++i) {
149 hdr.process(header_bytes[i]);
150
151 // Require that we are done at the last byte, not before.
152 if (i == sz-1)
153 BOOST_REQUIRE(hdr.done());
154 else
155 BOOST_REQUIRE(!hdr.done());
156 }
157
158 BOOST_CHECK_EQUAL("abc", hdr.file_name());
159 BOOST_CHECK_EQUAL("no comment", hdr.comment());
160 BOOST_CHECK_EQUAL(0x4ef39c22, hdr.mtime());
161 BOOST_CHECK_EQUAL(gzip::os_unix, hdr.os());
162 }
163
164 #if defined(BOOST_MSVC)
165 # pragma warning(pop)
166 #endif
167
empty_file_test()168 void empty_file_test()
169 {
170 // This test is in response to https://svn.boost.org/trac/boost/ticket/5237
171 // The previous implementation of gzip_compressor only wrote the gzip file
172 // header when the first bytes of uncompressed input were processed, causing
173 // incorrect behavior for empty files
174 BOOST_CHECK(
175 test_filter_pair( gzip_compressor(),
176 gzip_decompressor(),
177 std::string() )
178 );
179 }
180
multipart_test()181 void multipart_test()
182 {
183 // This test verifies that the gzip_decompressor properly handles a file
184 // that was written in multiple parts using Z_FULL_FLUSH, and in particular
185 // handles the CRC properly when one of those parts is empty.
186 const char multipart_file[] = {
187 '\x1f', '\x8b', '\x08', '\x00', '\x00', '\x00', '\x00', '\x00', '\x02', '\xff', '\xf2', '\xc9',
188 '\xcc', '\x4b', '\x55', '\x30', '\xe4', '\xf2', '\x01', '\x51', '\x46', '\x10', '\xca', '\x98',
189 '\x0b', '\x00', '\x00', '\x00', '\xff', '\xff', '\x03', '\x00', '\xdb', '\xa7', '\x83', '\xc9',
190 '\x15', '\x00', '\x00', '\x00', '\x1f', '\x8b', '\x08', '\x00', '\x00', '\x00', '\x00', '\x00',
191 '\x02', '\xff', '\xf2', '\xc9', '\xcc', '\x4b', '\x55', '\x30', '\xe1', '\xf2', '\x01', '\x51',
192 '\xa6', '\x10', '\xca', '\x8c', '\x0b', '\x00', '\x00', '\x00', '\xff', '\xff', '\x03', '\x00',
193 '\x41', '\xe3', '\xcc', '\xaa', '\x15', '\x00', '\x00', '\x00', '\x1f', '\x8b', '\x08', '\x00',
194 '\x00', '\x00', '\x00', '\x00', '\x02', '\xff', '\x02', '\x00', '\x00', '\x00', '\xff', '\xff',
195 '\x03', '\x00', '\x00', '\x00', '\x00', '\x00', '\x00', '\x00', '\x00', '\x00', '\x1f', '\x8b',
196 '\x08', '\x00', '\x00', '\x00', '\x00', '\x00', '\x02', '\xff', '\xf2', '\xc9', '\xcc', '\x4b',
197 '\x55', '\x30', '\xe7', '\xf2', '\x01', '\x51', '\x16', '\x10', '\xca', '\x92', '\x0b', '\x00',
198 '\x00', '\x00', '\xff', '\xff', '\x03', '\x00', '\x2b', '\xac', '\xd3', '\xf5', '\x15', '\x00',
199 '\x00', '\x00'
200 };
201
202 filtering_istream in;
203 std::string line;
204
205 in.push(gzip_decompressor());
206 in.push(io::array_source(multipart_file, sizeof(multipart_file)));
207
208 // First part
209 std::getline(in, line);
210 BOOST_CHECK_EQUAL("Line 1", line);
211 std::getline(in, line);
212 BOOST_CHECK_EQUAL("Line 2", line);
213 std::getline(in, line);
214 BOOST_CHECK_EQUAL("Line 3", line);
215
216 // Second part immediately follows
217 std::getline(in, line);
218 BOOST_CHECK_EQUAL("Line 4", line);
219 std::getline(in, line);
220 BOOST_CHECK_EQUAL("Line 5", line);
221 std::getline(in, line);
222 BOOST_CHECK_EQUAL("Line 6", line);
223
224 // Then an empty part, followed by one last 3-line part.
225 std::getline(in, line);
226 BOOST_CHECK_EQUAL("Line 7", line);
227 std::getline(in, line);
228 BOOST_CHECK_EQUAL("Line 8", line);
229 std::getline(in, line);
230 BOOST_CHECK_EQUAL("Line 9", line);
231
232 // Check for gzip errors too.
233 BOOST_CHECK(!in.bad());
234 }
235
init_unit_test_suite(int,char * [])236 test_suite* init_unit_test_suite(int, char* [])
237 {
238 test_suite* test = BOOST_TEST_SUITE("gzip test");
239 test->add(BOOST_TEST_CASE(&compression_test));
240 test->add(BOOST_TEST_CASE(&multiple_member_test));
241 test->add(BOOST_TEST_CASE(&array_source_test));
242 test->add(BOOST_TEST_CASE(&header_test));
243 test->add(BOOST_TEST_CASE(&empty_file_test));
244 test->add(BOOST_TEST_CASE(&multipart_test));
245 return test;
246 }
247