641d4513dc3be1dcf12328f735caf88ba22a92cb
[project/make_ext4fs.git] / libsparse / sparse_read.c
1 /*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #define _GNU_SOURCE
18 #define _FILE_OFFSET_BITS 64
19 #define _LARGEFILE64_SOURCE 1
20
#include <errno.h>
#include <fcntl.h>
#include <stdarg.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
29
30 #include <sparse/sparse.h>
31
32 #include "defs.h"
33 #include "output_file.h"
34 #include "sparse_crc32.h"
35 #include "sparse_file.h"
36 #include "sparse_format.h"
37
38 #if defined(__APPLE__) && defined(__MACH__)
39 #define lseek64 lseek
40 #define off64_t off_t
41 #endif
42
/* Only sparse images whose header carries this major version are accepted. */
#define SPARSE_HEADER_MAJOR_VER 1
/* Sizes of the file and chunk headers as this build declares them. */
#define SPARSE_HEADER_LEN       (sizeof(sparse_header_t))
#define CHUNK_HEADER_LEN (sizeof(chunk_header_t))

/* Size in bytes of the scratch buffer used to feed chunk data to the CRC. */
#define COPY_BUF_SIZE (1024U*1024U)
/* Scratch buffer; allocated on first use by sparse_file_read_sparse(). */
static char *copybuf;

/*
 * Minimum of two values, evaluating each argument exactly once.
 *
 * Spelled with __typeof__ rather than typeof so that the macro also builds
 * when the compiler is in a strict ISO mode (-std=c99 / -std=c11), where the
 * bare typeof keyword is not recognised.  The statement expression is a
 * GCC/Clang extension.
 */
#define min(a, b) \
	({ __typeof__(a) _a = (a); __typeof__(b) _b = (b); (_a < _b) ? _a : _b; })
52
/*
 * Print a diagnostic for a failed read through sparse_print_verbose().
 *
 * verbose: when false, nothing is formatted or printed.
 * err:     negative errno-style code; -EOVERFLOW, -EINVAL and -ENOMEM get
 *          dedicated messages, anything else is printed as a number.
 * fmt:     optional printf-style description of where the failure happened
 *          (appended as " at <location>"); may be NULL.
 *
 * If the location string cannot be formatted or allocated the function
 * returns without printing anything.
 */
static void verbose_error(bool verbose, int err, const char *fmt, ...)
{
	const char *sep = "";
	const char *where = "";
	char *buf = NULL;

	if (!verbose) {
		return;
	}

	if (fmt) {
		va_list argp;
		int size;

		/* First pass: measure the formatted length (excluding the NUL). */
		va_start(argp, fmt);
		size = vsnprintf(NULL, 0, fmt, argp);
		va_end(argp);

		if (size < 0) {
			return;
		}

		buf = malloc((size_t)size + 1);
		if (buf == NULL) {
			return;
		}

		/*
		 * Second pass: the buffer size passed to vsnprintf must include
		 * room for the terminating NUL, otherwise the last character of
		 * the message is dropped.
		 */
		va_start(argp, fmt);
		vsnprintf(buf, (size_t)size + 1, fmt, argp);
		va_end(argp);

		sep = " at ";
		where = buf;
	}

	if (err == -EOVERFLOW) {
		sparse_print_verbose("EOF while reading file%s%s\n", sep, where);
	} else if (err == -EINVAL) {
		sparse_print_verbose("Invalid sparse file format%s%s\n", sep, where);
	} else if (err == -ENOMEM) {
		sparse_print_verbose("Failed allocation while reading file%s%s\n",
				sep, where);
	} else {
		sparse_print_verbose("Unknown error %d%s%s\n", err, sep, where);
	}

	free(buf);
}
96
97 static int process_raw_chunk(struct sparse_file *s, unsigned int chunk_size,
98 int fd, int64_t offset, unsigned int blocks, unsigned int block,
99 uint32_t *crc32)
100 {
101 int ret;
102 int chunk;
103 unsigned int len = blocks * s->block_size;
104
105 if (chunk_size % s->block_size != 0) {
106 return -EINVAL;
107 }
108
109 if (chunk_size / s->block_size != blocks) {
110 return -EINVAL;
111 }
112
113 ret = sparse_file_add_fd(s, fd, offset, len, block);
114 if (ret < 0) {
115 return ret;
116 }
117
118 if (crc32) {
119 while (len) {
120 chunk = min(len, COPY_BUF_SIZE);
121 ret = read_all(fd, copybuf, chunk);
122 if (ret < 0) {
123 return ret;
124 }
125 *crc32 = sparse_crc32(*crc32, copybuf, chunk);
126 len -= chunk;
127 }
128 } else {
129 lseek64(fd, len, SEEK_CUR);
130 }
131
132 return 0;
133 }
134
135 static int process_fill_chunk(struct sparse_file *s, unsigned int chunk_size,
136 int fd, unsigned int blocks, unsigned int block, uint32_t *crc32)
137 {
138 int ret;
139 int chunk;
140 int64_t len = (int64_t)blocks * s->block_size;
141 uint32_t fill_val;
142 uint32_t *fillbuf;
143 unsigned int i;
144
145 if (chunk_size != sizeof(fill_val)) {
146 return -EINVAL;
147 }
148
149 ret = read_all(fd, &fill_val, sizeof(fill_val));
150 if (ret < 0) {
151 return ret;
152 }
153
154 ret = sparse_file_add_fill(s, fill_val, len, block);
155 if (ret < 0) {
156 return ret;
157 }
158
159 if (crc32) {
160 /* Fill copy_buf with the fill value */
161 fillbuf = (uint32_t *)copybuf;
162 for (i = 0; i < (COPY_BUF_SIZE / sizeof(fill_val)); i++) {
163 fillbuf[i] = fill_val;
164 }
165
166 while (len) {
167 chunk = min(len, COPY_BUF_SIZE);
168 *crc32 = sparse_crc32(*crc32, copybuf, chunk);
169 len -= chunk;
170 }
171 }
172
173 return 0;
174 }
175
176 static int process_skip_chunk(struct sparse_file *s, unsigned int chunk_size,
177 int fd __unused, unsigned int blocks,
178 unsigned int block __unused, uint32_t *crc32)
179 {
180 if (chunk_size != 0) {
181 return -EINVAL;
182 }
183
184 if (crc32) {
185 int64_t len = (int64_t)blocks * s->block_size;
186 memset(copybuf, 0, COPY_BUF_SIZE);
187
188 while (len) {
189 int chunk = min(len, COPY_BUF_SIZE);
190 *crc32 = sparse_crc32(*crc32, copybuf, chunk);
191 len -= chunk;
192 }
193 }
194
195 return 0;
196 }
197
/*
 * Handle a CRC32 chunk: read the checksum stored in the file and compare it
 * with the checksum computed so far.  The stored value is compared exactly
 * as read; no byte-order conversion is applied.
 *
 * Returns 0 when the checksums match, -EINVAL on a size or checksum
 * mismatch, or the negative error code from read_all().
 */
static int process_crc32_chunk(int fd, unsigned int chunk_size, uint32_t crc32)
{
	uint32_t stored;
	int ret;

	if (chunk_size != sizeof(stored)) {
		return -EINVAL;
	}

	ret = read_all(fd, &stored, sizeof(stored));
	if (ret < 0) {
		return ret;
	}

	return (stored == crc32) ? 0 : -EINVAL;
}
218
219 static int process_chunk(struct sparse_file *s, int fd, off64_t offset,
220 unsigned int chunk_hdr_sz, chunk_header_t *chunk_header,
221 unsigned int cur_block, uint32_t *crc_ptr)
222 {
223 int ret;
224 unsigned int chunk_data_size;
225
226 chunk_data_size = chunk_header->total_sz - chunk_hdr_sz;
227
228 switch (chunk_header->chunk_type) {
229 case CHUNK_TYPE_RAW:
230 ret = process_raw_chunk(s, chunk_data_size, fd, offset,
231 chunk_header->chunk_sz, cur_block, crc_ptr);
232 if (ret < 0) {
233 verbose_error(s->verbose, ret, "data block at %lld", offset);
234 return ret;
235 }
236 return chunk_header->chunk_sz;
237 case CHUNK_TYPE_FILL:
238 ret = process_fill_chunk(s, chunk_data_size, fd,
239 chunk_header->chunk_sz, cur_block, crc_ptr);
240 if (ret < 0) {
241 verbose_error(s->verbose, ret, "fill block at %lld", offset);
242 return ret;
243 }
244 return chunk_header->chunk_sz;
245 case CHUNK_TYPE_DONT_CARE:
246 ret = process_skip_chunk(s, chunk_data_size, fd,
247 chunk_header->chunk_sz, cur_block, crc_ptr);
248 if (chunk_data_size != 0) {
249 if (ret < 0) {
250 verbose_error(s->verbose, ret, "skip block at %lld", offset);
251 return ret;
252 }
253 }
254 return chunk_header->chunk_sz;
255 case CHUNK_TYPE_CRC32:
256 ret = process_crc32_chunk(fd, chunk_data_size, *crc_ptr);
257 if (ret < 0) {
258 verbose_error(s->verbose, -EINVAL, "crc block at %lld",
259 offset);
260 return ret;
261 }
262 return 0;
263 default:
264 verbose_error(s->verbose, -EINVAL, "unknown block %04X at %lld",
265 chunk_header->chunk_type, offset);
266 }
267
268 return 0;
269 }
270
271 static int sparse_file_read_sparse(struct sparse_file *s, int fd, bool crc)
272 {
273 int ret;
274 unsigned int i;
275 sparse_header_t sparse_header;
276 chunk_header_t chunk_header;
277 uint32_t crc32 = 0;
278 uint32_t *crc_ptr = 0;
279 unsigned int cur_block = 0;
280 off64_t offset;
281
282 if (!copybuf) {
283 copybuf = malloc(COPY_BUF_SIZE);
284 }
285
286 if (!copybuf) {
287 return -ENOMEM;
288 }
289
290 if (crc) {
291 crc_ptr = &crc32;
292 }
293
294 ret = read_all(fd, &sparse_header, sizeof(sparse_header));
295 if (ret < 0) {
296 return ret;
297 }
298
299 if (sparse_header.magic != SPARSE_HEADER_MAGIC) {
300 return -EINVAL;
301 }
302
303 if (sparse_header.major_version != SPARSE_HEADER_MAJOR_VER) {
304 return -EINVAL;
305 }
306
307 if (sparse_header.file_hdr_sz < SPARSE_HEADER_LEN) {
308 return -EINVAL;
309 }
310
311 if (sparse_header.chunk_hdr_sz < sizeof(chunk_header)) {
312 return -EINVAL;
313 }
314
315 if (sparse_header.file_hdr_sz > SPARSE_HEADER_LEN) {
316 /* Skip the remaining bytes in a header that is longer than
317 * we expected.
318 */
319 lseek64(fd, sparse_header.file_hdr_sz - SPARSE_HEADER_LEN, SEEK_CUR);
320 }
321
322 for (i = 0; i < sparse_header.total_chunks; i++) {
323 ret = read_all(fd, &chunk_header, sizeof(chunk_header));
324 if (ret < 0) {
325 return ret;
326 }
327
328 if (sparse_header.chunk_hdr_sz > CHUNK_HEADER_LEN) {
329 /* Skip the remaining bytes in a header that is longer than
330 * we expected.
331 */
332 lseek64(fd, sparse_header.chunk_hdr_sz - CHUNK_HEADER_LEN, SEEK_CUR);
333 }
334
335 offset = lseek64(fd, 0, SEEK_CUR);
336
337 ret = process_chunk(s, fd, offset, sparse_header.chunk_hdr_sz, &chunk_header,
338 cur_block, crc_ptr);
339 if (ret < 0) {
340 return ret;
341 }
342
343 cur_block += ret;
344 }
345
346 if (sparse_header.total_blks != cur_block) {
347 return -EINVAL;
348 }
349
350 return 0;
351 }
352
353 static int sparse_file_read_normal(struct sparse_file *s, int fd)
354 {
355 int ret;
356 uint32_t *buf = malloc(s->block_size);
357 unsigned int block = 0;
358 int64_t remain = s->len;
359 int64_t offset = 0;
360 unsigned int to_read;
361 unsigned int i;
362 bool sparse_block;
363
364 if (!buf) {
365 return -ENOMEM;
366 }
367
368 while (remain > 0) {
369 to_read = min(remain, s->block_size);
370 ret = read_all(fd, buf, to_read);
371 if (ret < 0) {
372 error("failed to read sparse file");
373 return ret;
374 }
375
376 if (to_read == s->block_size) {
377 sparse_block = true;
378 for (i = 1; i < s->block_size / sizeof(uint32_t); i++) {
379 if (buf[0] != buf[i]) {
380 sparse_block = false;
381 break;
382 }
383 }
384 } else {
385 sparse_block = false;
386 }
387
388 if (sparse_block) {
389 /* TODO: add flag to use skip instead of fill for buf[0] == 0 */
390 sparse_file_add_fill(s, buf[0], to_read, block);
391 } else {
392 sparse_file_add_fd(s, fd, offset, to_read, block);
393 }
394
395 remain -= to_read;
396 offset += to_read;
397 block++;
398 }
399
400 return 0;
401 }
402
/*
 * Read the contents of fd into s.
 *
 * sparse: true if fd holds a sparse-format image, false for a plain file.
 * crc:    verify the image CRC; only meaningful for sparse input, so
 *         requesting it for a plain file is rejected with -EINVAL.
 *
 * Returns 0 on success or a negative error code.
 */
int sparse_file_read(struct sparse_file *s, int fd, bool sparse, bool crc)
{
	if (!sparse) {
		return crc ? -EINVAL : sparse_file_read_normal(s, fd);
	}

	return sparse_file_read_sparse(s, fd, crc);
}
415
416 struct sparse_file *sparse_file_import(int fd, bool verbose, bool crc)
417 {
418 int ret;
419 sparse_header_t sparse_header;
420 int64_t len;
421 struct sparse_file *s;
422
423 ret = read_all(fd, &sparse_header, sizeof(sparse_header));
424 if (ret < 0) {
425 verbose_error(verbose, ret, "header");
426 return NULL;
427 }
428
429 if (sparse_header.magic != SPARSE_HEADER_MAGIC) {
430 verbose_error(verbose, -EINVAL, "header magic");
431 return NULL;
432 }
433
434 if (sparse_header.major_version != SPARSE_HEADER_MAJOR_VER) {
435 verbose_error(verbose, -EINVAL, "header major version");
436 return NULL;
437 }
438
439 if (sparse_header.file_hdr_sz < SPARSE_HEADER_LEN) {
440 return NULL;
441 }
442
443 if (sparse_header.chunk_hdr_sz < sizeof(chunk_header_t)) {
444 return NULL;
445 }
446
447 len = (int64_t)sparse_header.total_blks * sparse_header.blk_sz;
448 s = sparse_file_new(sparse_header.blk_sz, len);
449 if (!s) {
450 verbose_error(verbose, -EINVAL, NULL);
451 return NULL;
452 }
453
454 ret = lseek64(fd, 0, SEEK_SET);
455 if (ret < 0) {
456 verbose_error(verbose, ret, "seeking");
457 sparse_file_destroy(s);
458 return NULL;
459 }
460
461 s->verbose = verbose;
462
463 ret = sparse_file_read(s, fd, true, crc);
464 if (ret < 0) {
465 sparse_file_destroy(s);
466 return NULL;
467 }
468
469 return s;
470 }
471
/*
 * Create a sparse_file from fd, accepting either a sparse-format image or
 * a plain file.
 *
 * The sparse import is tried first; if it fails, the file length is taken
 * from a seek to the end, fd is rewound, and the contents are read as a
 * plain file using 4096-byte blocks.
 *
 * Returns the new sparse_file, or NULL on failure.
 */
struct sparse_file *sparse_file_import_auto(int fd, bool crc, bool verbose)
{
	struct sparse_file *s = sparse_file_import(fd, verbose, crc);
	int64_t len;

	if (s != NULL) {
		return s;
	}

	/* Not a usable sparse image: fall back to treating fd as raw data. */
	len = lseek64(fd, 0, SEEK_END);
	if (len < 0) {
		return NULL;
	}

	lseek64(fd, 0, SEEK_SET);

	s = sparse_file_new(4096, len);
	if (s == NULL) {
		return NULL;
	}

	if (sparse_file_read_normal(s, fd) < 0) {
		sparse_file_destroy(s);
		s = NULL;
	}

	return s;
}