1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "ui/base/resource/data_pack.h"
6
7 #include <errno.h>
8
9 #include "base/files/file_util.h"
10 #include "base/files/memory_mapped_file.h"
11 #include "base/logging.h"
12 #include "base/memory/ref_counted_memory.h"
13 #include "base/metrics/histogram.h"
14 #include "base/strings/string_piece.h"
15
16 // For details of the file layout, see
17 // http://dev.chromium.org/developers/design-documents/linuxresourcesandlocalizedstrings
18
19 namespace {
20
21 static const uint32 kFileFormatVersion = 4;
22 // Length of file header: version, entry count and text encoding type.
23 static const size_t kHeaderLength = 2 * sizeof(uint32) + sizeof(uint8);
24
25 #pragma pack(push,2)
26 struct DataPackEntry {
27 uint16 resource_id;
28 uint32 file_offset;
29
CompareById__anon3561815c0111::DataPackEntry30 static int CompareById(const void* void_key, const void* void_entry) {
31 uint16 key = *reinterpret_cast<const uint16*>(void_key);
32 const DataPackEntry* entry =
33 reinterpret_cast<const DataPackEntry*>(void_entry);
34 if (key < entry->resource_id) {
35 return -1;
36 } else if (key > entry->resource_id) {
37 return 1;
38 } else {
39 return 0;
40 }
41 }
42 };
43 #pragma pack(pop)
44
45 COMPILE_ASSERT(sizeof(DataPackEntry) == 6, size_of_entry_must_be_six);
46
47 // We're crashing when trying to load a pak file on Windows. Add some error
48 // codes for logging.
49 // http://crbug.com/58056
50 enum LoadErrors {
51 INIT_FAILED = 1,
52 BAD_VERSION,
53 INDEX_TRUNCATED,
54 ENTRY_NOT_FOUND,
55 HEADER_TRUNCATED,
56 WRONG_ENCODING,
57 INIT_FAILED_FROM_FILE,
58
59 LOAD_ERRORS_COUNT,
60 };
61
62 } // namespace
63
64 namespace ui {
65
DataPack(ui::ScaleFactor scale_factor)66 DataPack::DataPack(ui::ScaleFactor scale_factor)
67 : resource_count_(0),
68 text_encoding_type_(BINARY),
69 scale_factor_(scale_factor) {
70 }
71
~DataPack()72 DataPack::~DataPack() {
73 }
74
LoadFromPath(const base::FilePath & path)75 bool DataPack::LoadFromPath(const base::FilePath& path) {
76 mmap_.reset(new base::MemoryMappedFile);
77 if (!mmap_->Initialize(path)) {
78 DLOG(ERROR) << "Failed to mmap datapack";
79 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", INIT_FAILED,
80 LOAD_ERRORS_COUNT);
81 mmap_.reset();
82 return false;
83 }
84 return LoadImpl();
85 }
86
LoadFromFile(base::File file)87 bool DataPack::LoadFromFile(base::File file) {
88 return LoadFromFileRegion(file.Pass(),
89 base::MemoryMappedFile::Region::kWholeFile);
90 }
91
LoadFromFileRegion(base::File file,const base::MemoryMappedFile::Region & region)92 bool DataPack::LoadFromFileRegion(
93 base::File file,
94 const base::MemoryMappedFile::Region& region) {
95 mmap_.reset(new base::MemoryMappedFile);
96 if (!mmap_->Initialize(file.Pass(), region)) {
97 DLOG(ERROR) << "Failed to mmap datapack";
98 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", INIT_FAILED_FROM_FILE,
99 LOAD_ERRORS_COUNT);
100 mmap_.reset();
101 return false;
102 }
103 return LoadImpl();
104 }
105
LoadImpl()106 bool DataPack::LoadImpl() {
107 // Sanity check the header of the file.
108 if (kHeaderLength > mmap_->length()) {
109 DLOG(ERROR) << "Data pack file corruption: incomplete file header.";
110 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", HEADER_TRUNCATED,
111 LOAD_ERRORS_COUNT);
112 mmap_.reset();
113 return false;
114 }
115
116 // Parse the header of the file.
117 // First uint32: version; second: resource count;
118 const uint32* ptr = reinterpret_cast<const uint32*>(mmap_->data());
119 uint32 version = ptr[0];
120 if (version != kFileFormatVersion) {
121 LOG(ERROR) << "Bad data pack version: got " << version << ", expected "
122 << kFileFormatVersion;
123 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", BAD_VERSION,
124 LOAD_ERRORS_COUNT);
125 mmap_.reset();
126 return false;
127 }
128 resource_count_ = ptr[1];
129
130 // third: text encoding.
131 const uint8* ptr_encoding = reinterpret_cast<const uint8*>(ptr + 2);
132 text_encoding_type_ = static_cast<TextEncodingType>(*ptr_encoding);
133 if (text_encoding_type_ != UTF8 && text_encoding_type_ != UTF16 &&
134 text_encoding_type_ != BINARY) {
135 LOG(ERROR) << "Bad data pack text encoding: got " << text_encoding_type_
136 << ", expected between " << BINARY << " and " << UTF16;
137 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", WRONG_ENCODING,
138 LOAD_ERRORS_COUNT);
139 mmap_.reset();
140 return false;
141 }
142
143 // Sanity check the file.
144 // 1) Check we have enough entries. There's an extra entry after the last item
145 // which gives the length of the last item.
146 if (kHeaderLength + (resource_count_ + 1) * sizeof(DataPackEntry) >
147 mmap_->length()) {
148 LOG(ERROR) << "Data pack file corruption: too short for number of "
149 "entries specified.";
150 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", INDEX_TRUNCATED,
151 LOAD_ERRORS_COUNT);
152 mmap_.reset();
153 return false;
154 }
155 // 2) Verify the entries are within the appropriate bounds. There's an extra
156 // entry after the last item which gives us the length of the last item.
157 for (size_t i = 0; i < resource_count_ + 1; ++i) {
158 const DataPackEntry* entry = reinterpret_cast<const DataPackEntry*>(
159 mmap_->data() + kHeaderLength + (i * sizeof(DataPackEntry)));
160 if (entry->file_offset > mmap_->length()) {
161 LOG(ERROR) << "Entry #" << i << " in data pack points off end of file. "
162 << "Was the file corrupted?";
163 UMA_HISTOGRAM_ENUMERATION("DataPack.Load", ENTRY_NOT_FOUND,
164 LOAD_ERRORS_COUNT);
165 mmap_.reset();
166 return false;
167 }
168 }
169
170 return true;
171 }
172
HasResource(uint16 resource_id) const173 bool DataPack::HasResource(uint16 resource_id) const {
174 return !!bsearch(&resource_id, mmap_->data() + kHeaderLength, resource_count_,
175 sizeof(DataPackEntry), DataPackEntry::CompareById);
176 }
177
GetStringPiece(uint16 resource_id,base::StringPiece * data) const178 bool DataPack::GetStringPiece(uint16 resource_id,
179 base::StringPiece* data) const {
180 // It won't be hard to make this endian-agnostic, but it's not worth
181 // bothering to do right now.
182 #if defined(__BYTE_ORDER)
183 // Linux check
184 COMPILE_ASSERT(__BYTE_ORDER == __LITTLE_ENDIAN,
185 datapack_assumes_little_endian);
186 #elif defined(__BIG_ENDIAN__)
187 // Mac check
188 #error DataPack assumes little endian
189 #endif
190
191 const DataPackEntry* target = reinterpret_cast<const DataPackEntry*>(
192 bsearch(&resource_id, mmap_->data() + kHeaderLength, resource_count_,
193 sizeof(DataPackEntry), DataPackEntry::CompareById));
194 if (!target) {
195 return false;
196 }
197
198 const DataPackEntry* next_entry = target + 1;
199 // If the next entry points beyond the end of the file this data pack's entry
200 // table is corrupt. Log an error and return false. See
201 // http://crbug.com/371301.
202 if (next_entry->file_offset > mmap_->length()) {
203 size_t entry_index = target -
204 reinterpret_cast<const DataPackEntry*>(mmap_->data() + kHeaderLength);
205 LOG(ERROR) << "Entry #" << entry_index << " in data pack points off end "
206 << "of file. This should have been caught when loading. Was the "
207 << "file modified?";
208 return false;
209 }
210
211 size_t length = next_entry->file_offset - target->file_offset;
212 data->set(reinterpret_cast<const char*>(mmap_->data() + target->file_offset),
213 length);
214 return true;
215 }
216
GetStaticMemory(uint16 resource_id) const217 base::RefCountedStaticMemory* DataPack::GetStaticMemory(
218 uint16 resource_id) const {
219 base::StringPiece piece;
220 if (!GetStringPiece(resource_id, &piece))
221 return NULL;
222
223 return new base::RefCountedStaticMemory(piece.data(), piece.length());
224 }
225
GetTextEncodingType() const226 ResourceHandle::TextEncodingType DataPack::GetTextEncodingType() const {
227 return text_encoding_type_;
228 }
229
GetScaleFactor() const230 ui::ScaleFactor DataPack::GetScaleFactor() const {
231 return scale_factor_;
232 }
233
234 // static
WritePack(const base::FilePath & path,const std::map<uint16,base::StringPiece> & resources,TextEncodingType textEncodingType)235 bool DataPack::WritePack(const base::FilePath& path,
236 const std::map<uint16, base::StringPiece>& resources,
237 TextEncodingType textEncodingType) {
238 FILE* file = base::OpenFile(path, "wb");
239 if (!file)
240 return false;
241
242 if (fwrite(&kFileFormatVersion, sizeof(kFileFormatVersion), 1, file) != 1) {
243 LOG(ERROR) << "Failed to write file version";
244 base::CloseFile(file);
245 return false;
246 }
247
248 // Note: the python version of this function explicitly sorted keys, but
249 // std::map is a sorted associative container, we shouldn't have to do that.
250 uint32 entry_count = resources.size();
251 if (fwrite(&entry_count, sizeof(entry_count), 1, file) != 1) {
252 LOG(ERROR) << "Failed to write entry count";
253 base::CloseFile(file);
254 return false;
255 }
256
257 if (textEncodingType != UTF8 && textEncodingType != UTF16 &&
258 textEncodingType != BINARY) {
259 LOG(ERROR) << "Invalid text encoding type, got " << textEncodingType
260 << ", expected between " << BINARY << " and " << UTF16;
261 base::CloseFile(file);
262 return false;
263 }
264
265 uint8 write_buffer = textEncodingType;
266 if (fwrite(&write_buffer, sizeof(uint8), 1, file) != 1) {
267 LOG(ERROR) << "Failed to write file text resources encoding";
268 base::CloseFile(file);
269 return false;
270 }
271
272 // Each entry is a uint16 + a uint32. We have an extra entry after the last
273 // item so we can compute the size of the list item.
274 uint32 index_length = (entry_count + 1) * sizeof(DataPackEntry);
275 uint32 data_offset = kHeaderLength + index_length;
276 for (std::map<uint16, base::StringPiece>::const_iterator it =
277 resources.begin();
278 it != resources.end(); ++it) {
279 uint16 resource_id = it->first;
280 if (fwrite(&resource_id, sizeof(resource_id), 1, file) != 1) {
281 LOG(ERROR) << "Failed to write id for " << resource_id;
282 base::CloseFile(file);
283 return false;
284 }
285
286 if (fwrite(&data_offset, sizeof(data_offset), 1, file) != 1) {
287 LOG(ERROR) << "Failed to write offset for " << resource_id;
288 base::CloseFile(file);
289 return false;
290 }
291
292 data_offset += it->second.length();
293 }
294
295 // We place an extra entry after the last item that allows us to read the
296 // size of the last item.
297 uint16 resource_id = 0;
298 if (fwrite(&resource_id, sizeof(resource_id), 1, file) != 1) {
299 LOG(ERROR) << "Failed to write extra resource id.";
300 base::CloseFile(file);
301 return false;
302 }
303
304 if (fwrite(&data_offset, sizeof(data_offset), 1, file) != 1) {
305 LOG(ERROR) << "Failed to write extra offset.";
306 base::CloseFile(file);
307 return false;
308 }
309
310 for (std::map<uint16, base::StringPiece>::const_iterator it =
311 resources.begin();
312 it != resources.end(); ++it) {
313 if (fwrite(it->second.data(), it->second.length(), 1, file) != 1) {
314 LOG(ERROR) << "Failed to write data for " << it->first;
315 base::CloseFile(file);
316 return false;
317 }
318 }
319
320 base::CloseFile(file);
321
322 return true;
323 }
324
325 } // namespace ui
326