Blame - applypatch/imgdiff.cpp - android_bootable_recovery

blob: e78a60477ce3f5e6b7a6acf7c7d3a923c0411096 [file] [log] [blame]

Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1	/*
				2	* Copyright (C) 2009 The Android Open Source Project
				3	*
				4	* Licensed under the Apache License, Version 2.0 (the "License");
				5	* you may not use this file except in compliance with the License.
				6	* You may obtain a copy of the License at
				7	*
				8	* http://www.apache.org/licenses/LICENSE-2.0
				9	*
				10	* Unless required by applicable law or agreed to in writing, software
				11	* distributed under the License is distributed on an "AS IS" BASIS,
				12	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				13	* See the License for the specific language governing permissions and
				14	* limitations under the License.
				15	*/
				16
				17	/*
				18	* This program constructs binary patches for images -- such as boot.img
				19	* and recovery.img -- that consist primarily of large chunks of gzipped
				20	* data interspersed with uncompressed data. Doing a naive bsdiff of
				21	* these files is not useful because small changes in the data lead to
				22	* large changes in the compressed bitstream; bsdiff patches of gzipped
				23	* data are typically as large as the data itself.
				24	*
				25	* To patch these usefully, we break the source and target images up into
				26	* chunks of two types: "normal" and "gzip". Normal chunks are simply
				27	* patched using a plain bsdiff. Gzip chunks are first expanded, then a
				28	* bsdiff is applied to the uncompressed data, then the patched data is
				29	* gzipped using the same encoder parameters. Patched chunks are
				30	* concatenated together to create the output file; the output image
				31	* should be exactly the same series of bytes as the target image used
				32	* originally to generate the patch.
				33	*
				34	* To work well with this tool, the gzipped sections of the target
				35	* image must have been generated using the same deflate encoder that
				36	* is available in applypatch, namely, the one in the zlib library.
				37	* In practice this means that images should be compressed using the
				38	* "minigzip" tool included in the zlib distribution, not the GNU gzip
				39	* program.
				40	*
				41	* An "imgdiff" patch consists of a header describing the chunk structure
				42	* of the file and any encoding parameters needed for the gzipped
				43	* chunks, followed by N bsdiff patches, one per chunk.
				44	*
				45	* For a diff to be generated, the source and target images must have the
				46	* same "chunk" structure: that is, the same number of gzipped and normal
				47	* chunks in the same order. Android boot and recovery images currently
				48	* consist of five chunks: a small normal header, a gzipped kernel, a
				49	* small normal section, a gzipped ramdisk, and finally a small normal
				50	* footer.
				51	*
				52	* Caveats: we locate gzipped sections within the source and target
				53	* images by searching for the byte sequence 1f8b0800: 1f8b is the gzip
				54	* magic number; 08 specifies the "deflate" encoding [the only encoding
				55	* supported by the gzip standard]; and 00 is the flags byte. We do not
				56	* currently support any extra header fields (which would be indicated by
				57	* a nonzero flags byte). We also don't handle the case when that byte
				58	* sequence appears spuriously in the file. (Note that it would have to
				59	* occur spuriously within a normal chunk to be a problem.)
				60	*
				61	*
				62	* The imgdiff patch header looks like this:
				63	*
				64	* "IMGDIFF1" (8) [magic number and version]
				65	* chunk count (4)
				66	* for each chunk:
				67	* chunk type (4) [CHUNK_{NORMAL, GZIP, DEFLATE, RAW}]
				68	* if chunk type == CHUNK_NORMAL:
				69	* source start (8)
				70	* source len (8)
				71	* bsdiff patch offset (8) [from start of patch file]
				72	* if chunk type == CHUNK_GZIP: (version 1 only)
				73	* source start (8)
				74	* source len (8)
				75	* bsdiff patch offset (8) [from start of patch file]
				76	* source expanded len (8) [size of uncompressed source]
				77	* target expected len (8) [size of uncompressed target]
				78	* gzip level (4)
				79	* method (4)
				80	* windowBits (4)
				81	* memLevel (4)
				82	* strategy (4)
				83	* gzip header len (4)
				84	* gzip header (gzip header len)
				85	* gzip footer (8)
				86	* if chunk type == CHUNK_DEFLATE: (version 2 only)
				87	* source start (8)
				88	* source len (8)
				89	* bsdiff patch offset (8) [from start of patch file]
				90	* source expanded len (8) [size of uncompressed source]
				91	* target expected len (8) [size of uncompressed target]
				92	* gzip level (4)
				93	* method (4)
				94	* windowBits (4)
				95	* memLevel (4)
				96	* strategy (4)
				97	* if chunk type == RAW: (version 2 only)
				98	* target len (4)
				99	* data (target len)
				100	*
				101	* All integers are little-endian. "source start" and "source len"
				102	* specify the section of the input image that comprises this chunk,
				103	* including the gzip header and footer for gzip chunks. "source
				104	* expanded len" is the size of the uncompressed source data. "target
				105	* expected len" is the size of the uncompressed data after applying
				106	* the bsdiff patch. The next five parameters specify the zlib
				107	* parameters to be used when compressing the patched data, and the
				108	* next three specify the header and footer to be wrapped around the
				109	* compressed data to create the output chunk (so that header contents
				110	* like the timestamp are recreated exactly).
				111	*
				112	* After the header there are 'chunk count' bsdiff patches; the offset
				113	* of each from the beginning of the file is specified in the header.
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	114	*
				115	* This tool can take an optional file of "bonus data". This is an
				116	* extra file of data that is appended to chunk #1 after it is
				117	* compressed (it must be a CHUNK_DEFLATE chunk). The same file must
				118	* be available (and passed to applypatch with -b) when applying the
				119	* patch. This is used to reduce the size of recovery-from-boot
				120	* patches by combining the boot image with recovery ramdisk
				121	* information that is stored on the system partition.
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	122	*/
				123
				124	#include <errno.h>
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	125	#include <inttypes.h>
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	126	#include <stdio.h>
				127	#include <stdlib.h>
				128	#include <string.h>
				129	#include <sys/stat.h>
				130	#include <unistd.h>
				131	#include <sys/types.h>
				132
Sen Jiang	2fffcb1	2016-05-03 15:49:10 -0700	[diff] [blame]	133	#include <bsdiff.h>
				134
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	135	#include "zlib.h"
				136	#include "imgdiff.h"
				137	#include "utils.h"
				138
				139	typedef struct {
				140	int type; // CHUNK_NORMAL, CHUNK_DEFLATE
				141	size_t start; // offset of chunk in original image file
				142
				143	size_t len;
				144	unsigned char* data; // data to be patched (uncompressed, for deflate chunks)
				145
				146	size_t source_start;
				147	size_t source_len;
				148
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	149	// --- for CHUNK_DEFLATE chunks only: ---
				150
				151	// original (compressed) deflate data
				152	size_t deflate_len;
				153	unsigned char* deflate_data;
				154
				155	char* filename; // used for zip entries
				156
				157	// deflate encoder parameters
				158	int level, method, windowBits, memLevel, strategy;
				159
				160	size_t source_uncompressed_len;
				161	} ImageChunk;
				162
				163	typedef struct {
				164	int data_offset;
				165	int deflate_len;
				166	int uncomp_len;
				167	char* filename;
				168	} ZipFileEntry;
				169
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	170	static int fileentry_compare(const void* a, const void* b) {
				171	int ao = ((ZipFileEntry*)a)->data_offset;
				172	int bo = ((ZipFileEntry*)b)->data_offset;
				173	if (ao < bo) {
				174	return -1;
				175	} else if (ao > bo) {
				176	return 1;
				177	} else {
				178	return 0;
				179	}
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	180	}
				181
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	182	unsigned char* ReadZip(const char* filename,
				183	int* num_chunks, ImageChunk** chunks,
				184	int include_pseudo_chunk) {
				185	struct stat st;
				186	if (stat(filename, &st) != 0) {
				187	printf("failed to stat \"%s\": %s\n", filename, strerror(errno));
				188	return NULL;
				189	}
				190
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	191	size_t sz = static_cast<size_t>(st.st_size);
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	192	unsigned char* img = reinterpret_cast<unsigned char*>(malloc(sz));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	193	FILE* f = fopen(filename, "rb");
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	194	if (fread(img, 1, sz, f) != sz) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	195	printf("failed to read \"%s\" %s\n", filename, strerror(errno));
				196	fclose(f);
				197	return NULL;
				198	}
				199	fclose(f);
				200
				201	// look for the end-of-central-directory record.
				202
				203	int i;
				204	for (i = st.st_size-20; i >= 0 && i > st.st_size - 65600; --i) {
				205	if (img[i] == 0x50 && img[i+1] == 0x4b &&
				206	img[i+2] == 0x05 && img[i+3] == 0x06) {
				207	break;
				208	}
				209	}
				210	// double-check: this archive consists of a single "disk"
				211	if (!(img[i+4] == 0 && img[i+5] == 0 && img[i+6] == 0 && img[i+7] == 0)) {
				212	printf("can't process multi-disk archive\n");
				213	return NULL;
				214	}
				215
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	216	int cdcount = Read2(img+i+8);
				217	int cdoffset = Read4(img+i+16);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	218
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	219	ZipFileEntry* temp_entries = reinterpret_cast<ZipFileEntry*>(malloc(
				220	cdcount * sizeof(ZipFileEntry)));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	221	int entrycount = 0;
				222
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	223	unsigned char* cd = img+cdoffset;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	224	for (i = 0; i < cdcount; ++i) {
				225	if (!(cd[0] == 0x50 && cd[1] == 0x4b && cd[2] == 0x01 && cd[3] == 0x02)) {
				226	printf("bad central directory entry %d\n", i);
Rahul Chaudhry	3a5177b	2016-11-15 16:18:46 -0800	[diff] [blame^]	227	free(temp_entries);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	228	return NULL;
				229	}
				230
				231	int clen = Read4(cd+20); // compressed len
				232	int ulen = Read4(cd+24); // uncompressed len
				233	int nlen = Read2(cd+28); // filename len
				234	int xlen = Read2(cd+30); // extra field len
				235	int mlen = Read2(cd+32); // file comment len
				236	int hoffset = Read4(cd+42); // local header offset
				237
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	238	char* filename = reinterpret_cast<char*>(malloc(nlen+1));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	239	memcpy(filename, cd+46, nlen);
				240	filename[nlen] = '\0';
				241
				242	int method = Read2(cd+10);
				243
				244	cd += 46 + nlen + xlen + mlen;
				245
				246	if (method != 8) { // 8 == deflate
				247	free(filename);
				248	continue;
				249	}
				250
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	251	unsigned char* lh = img + hoffset;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	252
				253	if (!(lh[0] == 0x50 && lh[1] == 0x4b && lh[2] == 0x03 && lh[3] == 0x04)) {
				254	printf("bad local file header entry %d\n", i);
				255	return NULL;
				256	}
				257
				258	if (Read2(lh+26) != nlen \|\| memcmp(lh+30, filename, nlen) != 0) {
				259	printf("central dir filename doesn't match local header\n");
				260	return NULL;
				261	}
				262
				263	xlen = Read2(lh+28); // extra field len; might be different from CD entry?
				264
				265	temp_entries[entrycount].data_offset = hoffset+30+nlen+xlen;
				266	temp_entries[entrycount].deflate_len = clen;
				267	temp_entries[entrycount].uncomp_len = ulen;
				268	temp_entries[entrycount].filename = filename;
				269	++entrycount;
				270	}
				271
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	272	qsort(temp_entries, entrycount, sizeof(ZipFileEntry), fileentry_compare);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	273
				274	#if 0
				275	printf("found %d deflated entries\n", entrycount);
				276	for (i = 0; i < entrycount; ++i) {
				277	printf("off %10d len %10d unlen %10d %p %s\n",
				278	temp_entries[i].data_offset,
				279	temp_entries[i].deflate_len,
				280	temp_entries[i].uncomp_len,
				281	temp_entries[i].filename,
				282	temp_entries[i].filename);
				283	}
				284	#endif
				285
				286	*num_chunks = 0;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	287	chunks = reinterpret_cast<ImageChunk>(malloc((entrycount2+2) sizeof(ImageChunk)));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	288	ImageChunk* curr = *chunks;
				289
				290	if (include_pseudo_chunk) {
				291	curr->type = CHUNK_NORMAL;
				292	curr->start = 0;
				293	curr->len = st.st_size;
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	294	curr->data = img;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	295	curr->filename = NULL;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	296	++curr;
				297	++*num_chunks;
				298	}
				299
				300	int pos = 0;
				301	int nextentry = 0;
				302
				303	while (pos < st.st_size) {
				304	if (nextentry < entrycount && pos == temp_entries[nextentry].data_offset) {
				305	curr->type = CHUNK_DEFLATE;
				306	curr->start = pos;
				307	curr->deflate_len = temp_entries[nextentry].deflate_len;
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	308	curr->deflate_data = img + pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	309	curr->filename = temp_entries[nextentry].filename;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	310
				311	curr->len = temp_entries[nextentry].uncomp_len;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	312	curr->data = reinterpret_cast<unsigned char*>(malloc(curr->len));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	313
				314	z_stream strm;
				315	strm.zalloc = Z_NULL;
				316	strm.zfree = Z_NULL;
				317	strm.opaque = Z_NULL;
				318	strm.avail_in = curr->deflate_len;
				319	strm.next_in = curr->deflate_data;
				320
				321	// -15 means we are decoding a 'raw' deflate stream; zlib will
				322	// not expect zlib headers.
				323	int ret = inflateInit2(&strm, -15);
				324
				325	strm.avail_out = curr->len;
				326	strm.next_out = curr->data;
				327	ret = inflate(&strm, Z_NO_FLUSH);
				328	if (ret != Z_STREAM_END) {
				329	printf("failed to inflate \"%s\"; %d\n", curr->filename, ret);
				330	return NULL;
				331	}
				332
				333	inflateEnd(&strm);
				334
				335	pos += curr->deflate_len;
				336	++nextentry;
				337	++*num_chunks;
				338	++curr;
				339	continue;
				340	}
				341
				342	// use a normal chunk to take all the data up to the start of the
				343	// next deflate section.
				344
				345	curr->type = CHUNK_NORMAL;
				346	curr->start = pos;
				347	if (nextentry < entrycount) {
				348	curr->len = temp_entries[nextentry].data_offset - pos;
				349	} else {
				350	curr->len = st.st_size - pos;
				351	}
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	352	curr->data = img + pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	353	curr->filename = NULL;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	354	pos += curr->len;
				355
				356	++*num_chunks;
				357	++curr;
				358	}
				359
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	360	free(temp_entries);
				361	return img;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	362	}
				363
				364	/*
				365	* Read the given file and break it up into chunks, putting the number
				366	* of chunks and their info in num_chunks and *chunks,
				367	* respectively. Returns a malloc'd block of memory containing the
				368	* contents of the file; various pointers in the output chunk array
				369	* will point into this block of memory. The caller should free the
				370	* return value when done with all the chunks. Returns NULL on
				371	* failure.
				372	*/
				373	unsigned char* ReadImage(const char* filename,
				374	int* num_chunks, ImageChunk** chunks) {
				375	struct stat st;
				376	if (stat(filename, &st) != 0) {
				377	printf("failed to stat \"%s\": %s\n", filename, strerror(errno));
				378	return NULL;
				379	}
				380
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	381	size_t sz = static_cast<size_t>(st.st_size);
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	382	unsigned char* img = reinterpret_cast<unsigned char*>(malloc(sz + 4));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	383	FILE* f = fopen(filename, "rb");
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	384	if (fread(img, 1, sz, f) != sz) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	385	printf("failed to read \"%s\" %s\n", filename, strerror(errno));
				386	fclose(f);
				387	return NULL;
				388	}
				389	fclose(f);
				390
				391	// append 4 zero bytes to the data so we can always search for the
				392	// four-byte string 1f8b0800 starting at any point in the actual
				393	// file data, without special-casing the end of the data.
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	394	memset(img+sz, 0, 4);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	395
				396	size_t pos = 0;
				397
				398	*num_chunks = 0;
				399	*chunks = NULL;
				400
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	401	while (pos < sz) {
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	402	unsigned char* p = img+pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	403
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	404	if (sz - pos >= 4 &&
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	405	p[0] == 0x1f && p[1] == 0x8b &&
				406	p[2] == 0x08 && // deflate compression
				407	p[3] == 0x00) { // no header flags
				408	// 'pos' is the offset of the start of a gzip chunk.
Johan Redestig	c68bd34	2015-04-14 21:20:06 +0200	[diff] [blame]	409	size_t chunk_offset = pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	410
				411	*num_chunks += 3;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	412	chunks = reinterpret_cast<ImageChunk>(realloc(*chunks,
				413	num_chunks sizeof(ImageChunk)));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	414	ImageChunk* curr = chunks + (num_chunks-3);
				415
				416	// create a normal chunk for the header.
				417	curr->start = pos;
				418	curr->type = CHUNK_NORMAL;
				419	curr->len = GZIP_HEADER_LEN;
				420	curr->data = p;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	421
				422	pos += curr->len;
				423	p += curr->len;
				424	++curr;
				425
				426	curr->type = CHUNK_DEFLATE;
				427	curr->filename = NULL;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	428
				429	// We must decompress this chunk in order to discover where it
				430	// ends, and so we can put the uncompressed data and its length
				431	// into curr->data and curr->len.
				432
				433	size_t allocated = 32768;
				434	curr->len = 0;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	435	curr->data = reinterpret_cast<unsigned char*>(malloc(allocated));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	436	curr->start = pos;
				437	curr->deflate_data = p;
				438
				439	z_stream strm;
				440	strm.zalloc = Z_NULL;
				441	strm.zfree = Z_NULL;
				442	strm.opaque = Z_NULL;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	443	strm.avail_in = sz - pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	444	strm.next_in = p;
				445
				446	// -15 means we are decoding a 'raw' deflate stream; zlib will
				447	// not expect zlib headers.
				448	int ret = inflateInit2(&strm, -15);
				449
				450	do {
				451	strm.avail_out = allocated - curr->len;
				452	strm.next_out = curr->data + curr->len;
				453	ret = inflate(&strm, Z_NO_FLUSH);
Johan Redestig	c68bd34	2015-04-14 21:20:06 +0200	[diff] [blame]	454	if (ret < 0) {
Sen Jiang	fa4f1b7	2016-02-11 16:14:23 -0800	[diff] [blame]	455	printf("Warning: inflate failed [%s] at offset [%zu],"
				456	" treating as a normal chunk\n",
David Riley	0779fc9	2015-12-10 10:18:25 -0800	[diff] [blame]	457	strm.msg, chunk_offset);
Sen Jiang	fa4f1b7	2016-02-11 16:14:23 -0800	[diff] [blame]	458	break;
Johan Redestig	c68bd34	2015-04-14 21:20:06 +0200	[diff] [blame]	459	}
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	460	curr->len = allocated - strm.avail_out;
				461	if (strm.avail_out == 0) {
				462	allocated *= 2;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	463	curr->data = reinterpret_cast<unsigned char*>(realloc(curr->data, allocated));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	464	}
				465	} while (ret != Z_STREAM_END);
				466
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	467	curr->deflate_len = sz - strm.avail_in - pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	468	inflateEnd(&strm);
Sen Jiang	fa4f1b7	2016-02-11 16:14:23 -0800	[diff] [blame]	469
				470	if (ret < 0) {
				471	free(curr->data);
				472	*num_chunks -= 2;
				473	continue;
				474	}
				475
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	476	pos += curr->deflate_len;
				477	p += curr->deflate_len;
				478	++curr;
				479
				480	// create a normal chunk for the footer
				481
				482	curr->type = CHUNK_NORMAL;
				483	curr->start = pos;
				484	curr->len = GZIP_FOOTER_LEN;
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	485	curr->data = img+pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	486
				487	pos += curr->len;
				488	p += curr->len;
				489	++curr;
				490
				491	// The footer (that we just skipped over) contains the size of
				492	// the uncompressed data. Double-check to make sure that it
				493	// matches the size of the data we got when we actually did
				494	// the decompression.
				495	size_t footer_size = Read4(p-4);
				496	if (footer_size != curr[-2].len) {
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	497	printf("Error: footer size %zu != decompressed size %zu\n",
				498	footer_size, curr[-2].len);
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	499	free(img);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	500	return NULL;
				501	}
				502	} else {
				503	// Reallocate the list for every chunk; we expect the number of
				504	// chunks to be small (5 for typical boot and recovery images).
				505	++*num_chunks;
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	506	chunks = reinterpret_cast<ImageChunk>(realloc(chunks, num_chunks * sizeof(ImageChunk)));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	507	ImageChunk* curr = chunks + (num_chunks-1);
				508	curr->start = pos;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	509
				510	// 'pos' is not the offset of the start of a gzip chunk, so scan
				511	// forward until we find a gzip header.
				512	curr->type = CHUNK_NORMAL;
				513	curr->data = p;
				514
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	515	for (curr->len = 0; curr->len < (sz - pos); ++curr->len) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	516	if (p[curr->len] == 0x1f &&
				517	p[curr->len+1] == 0x8b &&
				518	p[curr->len+2] == 0x08 &&
				519	p[curr->len+3] == 0x00) {
				520	break;
				521	}
				522	}
				523	pos += curr->len;
				524	}
				525	}
				526
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	527	return img;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	528	}
				529
				530	#define BUFFER_SIZE 32768
				531
				532	/*
				533	* Takes the uncompressed data stored in the chunk, compresses it
				534	* using the zlib parameters stored in the chunk, and checks that it
				535	* matches exactly the compressed data we started with (also stored in
				536	* the chunk). Return 0 on success.
				537	*/
				538	int TryReconstruction(ImageChunk* chunk, unsigned char* out) {
				539	size_t p = 0;
				540
				541	#if 0
				542	printf("trying %d %d %d %d %d\n",
				543	chunk->level, chunk->method, chunk->windowBits,
				544	chunk->memLevel, chunk->strategy);
				545	#endif
				546
				547	z_stream strm;
				548	strm.zalloc = Z_NULL;
				549	strm.zfree = Z_NULL;
				550	strm.opaque = Z_NULL;
				551	strm.avail_in = chunk->len;
				552	strm.next_in = chunk->data;
				553	int ret;
				554	ret = deflateInit2(&strm, chunk->level, chunk->method, chunk->windowBits,
				555	chunk->memLevel, chunk->strategy);
				556	do {
				557	strm.avail_out = BUFFER_SIZE;
				558	strm.next_out = out;
				559	ret = deflate(&strm, Z_FINISH);
				560	size_t have = BUFFER_SIZE - strm.avail_out;
				561
				562	if (memcmp(out, chunk->deflate_data+p, have) != 0) {
				563	// mismatch; data isn't the same.
				564	deflateEnd(&strm);
				565	return -1;
				566	}
				567	p += have;
				568	} while (ret != Z_STREAM_END);
				569	deflateEnd(&strm);
				570	if (p != chunk->deflate_len) {
				571	// mismatch; ran out of data before we should have.
				572	return -1;
				573	}
				574	return 0;
				575	}
				576
				577	/*
				578	* Verify that we can reproduce exactly the same compressed data that
				579	* we started with. Sets the level, method, windowBits, memLevel, and
				580	* strategy fields in the chunk to the encoding parameters needed to
				581	* produce the right output. Returns 0 on success.
				582	*/
				583	int ReconstructDeflateChunk(ImageChunk* chunk) {
				584	if (chunk->type != CHUNK_DEFLATE) {
				585	printf("attempt to reconstruct non-deflate chunk\n");
				586	return -1;
				587	}
				588
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	589	unsigned char* out = reinterpret_cast<unsigned char*>(malloc(BUFFER_SIZE));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	590
				591	// We only check two combinations of encoder parameters: level 6
				592	// (the default) and level 9 (the maximum).
				593	for (chunk->level = 6; chunk->level <= 9; chunk->level += 3) {
				594	chunk->windowBits = -15; // 32kb window; negative to indicate a raw stream.
				595	chunk->memLevel = 8; // the default value.
				596	chunk->method = Z_DEFLATED;
				597	chunk->strategy = Z_DEFAULT_STRATEGY;
				598
				599	if (TryReconstruction(chunk, out) == 0) {
				600	free(out);
				601	return 0;
				602	}
				603	}
				604
				605	free(out);
				606	return -1;
				607	}
				608
				609	/*
				610	* Given source and target chunks, compute a bsdiff patch between them
				611	* by running bsdiff in a subprocess. Return the patch data, placing
				612	* its length in *size. Return NULL on failure. We expect the bsdiff
				613	* program to be in the path.
				614	*/
				615	unsigned char* MakePatch(ImageChunk* src, ImageChunk* tgt, size_t* size) {
				616	if (tgt->type == CHUNK_NORMAL) {
				617	if (tgt->len <= 160) {
				618	tgt->type = CHUNK_RAW;
				619	*size = tgt->len;
				620	return tgt->data;
				621	}
				622	}
				623
				624	char ptemp[] = "/tmp/imgdiff-patch-XXXXXX";
Jeremy Compostella	a91c66d	2015-09-08 19:15:09 +0200	[diff] [blame]	625	int fd = mkstemp(ptemp);
				626
				627	if (fd == -1) {
				628	printf("MakePatch failed to create a temporary file: %s\n",
				629	strerror(errno));
				630	return NULL;
				631	}
				632	close(fd); // temporary file is created and we don't need its file
				633	// descriptor
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	634
Sen Jiang	2fffcb1	2016-05-03 15:49:10 -0700	[diff] [blame]	635	int r = bsdiff::bsdiff(src->data, src->len, tgt->data, tgt->len, ptemp);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	636	if (r != 0) {
				637	printf("bsdiff() failed: %d\n", r);
				638	return NULL;
				639	}
				640
				641	struct stat st;
				642	if (stat(ptemp, &st) != 0) {
				643	printf("failed to stat patch file %s: %s\n",
				644	ptemp, strerror(errno));
				645	return NULL;
				646	}
				647
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	648	size_t sz = static_cast<size_t>(st.st_size);
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	649	// TODO: Memory leak on error return.
				650	unsigned char* data = reinterpret_cast<unsigned char*>(malloc(sz));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	651
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	652	if (tgt->type == CHUNK_NORMAL && tgt->len <= sz) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	653	unlink(ptemp);
				654
				655	tgt->type = CHUNK_RAW;
				656	*size = tgt->len;
				657	return tgt->data;
				658	}
				659
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	660	*size = sz;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	661
				662	FILE* f = fopen(ptemp, "rb");
				663	if (f == NULL) {
				664	printf("failed to open patch %s: %s\n", ptemp, strerror(errno));
				665	return NULL;
				666	}
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	667	if (fread(data, 1, sz, f) != sz) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	668	printf("failed to read patch %s: %s\n", ptemp, strerror(errno));
				669	return NULL;
				670	}
				671	fclose(f);
				672
				673	unlink(ptemp);
				674
				675	tgt->source_start = src->start;
				676	switch (tgt->type) {
				677	case CHUNK_NORMAL:
				678	tgt->source_len = src->len;
				679	break;
				680	case CHUNK_DEFLATE:
				681	tgt->source_len = src->deflate_len;
				682	tgt->source_uncompressed_len = src->len;
				683	break;
				684	}
				685
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	686	return data;
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	687	}
				688
				689	/*
				690	* Cause a gzip chunk to be treated as a normal chunk (ie, as a blob
				691	* of uninterpreted data). The resulting patch will likely be about
				692	* as big as the target file, but it lets us handle the case of images
				693	* where some gzip chunks are reconstructible but others aren't (by
				694	* treating the ones that aren't as normal chunks).
				695	*/
				696	void ChangeDeflateChunkToNormal(ImageChunk* ch) {
				697	if (ch->type != CHUNK_DEFLATE) return;
				698	ch->type = CHUNK_NORMAL;
				699	free(ch->data);
				700	ch->data = ch->deflate_data;
				701	ch->len = ch->deflate_len;
				702	}
				703
				704	/*
				705	* Return true if the data in the chunk is identical (including the
				706	* compressed representation, for gzip chunks).
				707	*/
				708	int AreChunksEqual(ImageChunk* a, ImageChunk* b) {
				709	if (a->type != b->type) return 0;
				710
				711	switch (a->type) {
				712	case CHUNK_NORMAL:
				713	return a->len == b->len && memcmp(a->data, b->data, a->len) == 0;
				714
				715	case CHUNK_DEFLATE:
				716	return a->deflate_len == b->deflate_len &&
				717	memcmp(a->deflate_data, b->deflate_data, a->deflate_len) == 0;
				718
				719	default:
				720	printf("unknown chunk type %d\n", a->type);
				721	return 0;
				722	}
				723	}
				724
				725	/*
				726	* Look for runs of adjacent normal chunks and compress them down into
				727	* a single chunk. (Such runs can be produced when deflate chunks are
				728	* changed to normal chunks.)
				729	*/
				730	void MergeAdjacentNormalChunks(ImageChunk* chunks, int* num_chunks) {
				731	int out = 0;
				732	int in_start = 0, in_end;
				733	while (in_start < *num_chunks) {
				734	if (chunks[in_start].type != CHUNK_NORMAL) {
				735	in_end = in_start+1;
				736	} else {
				737	// in_start is a normal chunk. Look for a run of normal chunks
				738	// that constitute a solid block of data (ie, each chunk begins
				739	// where the previous one ended).
				740	for (in_end = in_start+1;
				741	in_end < *num_chunks && chunks[in_end].type == CHUNK_NORMAL &&
				742	(chunks[in_end].start ==
				743	chunks[in_end-1].start + chunks[in_end-1].len &&
				744	chunks[in_end].data ==
				745	chunks[in_end-1].data + chunks[in_end-1].len);
				746	++in_end);
				747	}
				748
				749	if (in_end == in_start+1) {
				750	#if 0
				751	printf("chunk %d is now %d\n", in_start, out);
				752	#endif
				753	if (out != in_start) {
				754	memcpy(chunks+out, chunks+in_start, sizeof(ImageChunk));
				755	}
				756	} else {
				757	#if 0
				758	printf("collapse normal chunks %d-%d into %d\n", in_start, in_end-1, out);
				759	#endif
				760
				761	// Merge chunks [in_start, in_end-1] into one chunk. Since the
				762	// data member of each chunk is just a pointer into an in-memory
				763	// copy of the file, this can be done without recopying (the
				764	// output chunk has the first chunk's start location and data
				765	// pointer, and length equal to the sum of the input chunk
				766	// lengths).
				767	chunks[out].type = CHUNK_NORMAL;
				768	chunks[out].start = chunks[in_start].start;
				769	chunks[out].data = chunks[in_start].data;
				770	chunks[out].len = chunks[in_end-1].len +
				771	(chunks[in_end-1].start - chunks[in_start].start);
				772	}
				773
				774	++out;
				775	in_start = in_end;
				776	}
				777	*num_chunks = out;
				778	}
				779
				780	ImageChunk* FindChunkByName(const char* name,
				781	ImageChunk* chunks, int num_chunks) {
				782	int i;
				783	for (i = 0; i < num_chunks; ++i) {
				784	if (chunks[i].type == CHUNK_DEFLATE && chunks[i].filename &&
				785	strcmp(name, chunks[i].filename) == 0) {
				786	return chunks+i;
				787	}
				788	}
				789	return NULL;
				790	}
				791
				792	void DumpChunks(ImageChunk* chunks, int num_chunks) {
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	793	for (int i = 0; i < num_chunks; ++i) {
				794	printf("chunk %d: type %d start %zu len %zu\n",
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	795	i, chunks[i].type, chunks[i].start, chunks[i].len);
				796	}
				797	}
				798
				799	int main(int argc, char** argv) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	800	int zip_mode = 0;
				801
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	802	if (argc >= 2 && strcmp(argv[1], "-z") == 0) {
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	803	zip_mode = 1;
				804	--argc;
				805	++argv;
				806	}
				807
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	808	size_t bonus_size = 0;
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	809	unsigned char* bonus_data = NULL;
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	810	if (argc >= 3 && strcmp(argv[1], "-b") == 0) {
				811	struct stat st;
				812	if (stat(argv[2], &st) != 0) {
				813	printf("failed to stat bonus file %s: %s\n", argv[2], strerror(errno));
				814	return 1;
				815	}
				816	bonus_size = st.st_size;
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	817	bonus_data = reinterpret_cast<unsigned char*>(malloc(bonus_size));
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	818	FILE* f = fopen(argv[2], "rb");
				819	if (f == NULL) {
				820	printf("failed to open bonus file %s: %s\n", argv[2], strerror(errno));
				821	return 1;
				822	}
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	823	if (fread(bonus_data, 1, bonus_size, f) != bonus_size) {
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	824	printf("failed to read bonus file %s: %s\n", argv[2], strerror(errno));
				825	return 1;
				826	}
				827	fclose(f);
				828
				829	argc -= 2;
				830	argv += 2;
				831	}
				832
				833	if (argc != 4) {
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	834	printf("usage: %s [-z] [-b <bonus-file>] <src-img> <tgt-img> <patch-file>\n",
				835	argv[0]);
				836	return 2;
				837	}
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	838
				839	int num_src_chunks;
				840	ImageChunk* src_chunks;
				841	int num_tgt_chunks;
				842	ImageChunk* tgt_chunks;
				843	int i;
				844
				845	if (zip_mode) {
				846	if (ReadZip(argv[1], &num_src_chunks, &src_chunks, 1) == NULL) {
				847	printf("failed to break apart source zip file\n");
				848	return 1;
				849	}
				850	if (ReadZip(argv[2], &num_tgt_chunks, &tgt_chunks, 0) == NULL) {
				851	printf("failed to break apart target zip file\n");
				852	return 1;
				853	}
				854	} else {
				855	if (ReadImage(argv[1], &num_src_chunks, &src_chunks) == NULL) {
				856	printf("failed to break apart source image\n");
				857	return 1;
				858	}
				859	if (ReadImage(argv[2], &num_tgt_chunks, &tgt_chunks) == NULL) {
				860	printf("failed to break apart target image\n");
				861	return 1;
				862	}
				863
				864	// Verify that the source and target images have the same chunk
				865	// structure (ie, the same sequence of deflate and normal chunks).
				866
				867	if (!zip_mode) {
				868	// Merge the gzip header and footer in with any adjacent
				869	// normal chunks.
				870	MergeAdjacentNormalChunks(tgt_chunks, &num_tgt_chunks);
				871	MergeAdjacentNormalChunks(src_chunks, &num_src_chunks);
				872	}
				873
				874	if (num_src_chunks != num_tgt_chunks) {
				875	printf("source and target don't have same number of chunks!\n");
				876	printf("source chunks:\n");
				877	DumpChunks(src_chunks, num_src_chunks);
				878	printf("target chunks:\n");
				879	DumpChunks(tgt_chunks, num_tgt_chunks);
				880	return 1;
				881	}
				882	for (i = 0; i < num_src_chunks; ++i) {
				883	if (src_chunks[i].type != tgt_chunks[i].type) {
				884	printf("source and target don't have same chunk "
				885	"structure! (chunk %d)\n", i);
				886	printf("source chunks:\n");
				887	DumpChunks(src_chunks, num_src_chunks);
				888	printf("target chunks:\n");
				889	DumpChunks(tgt_chunks, num_tgt_chunks);
				890	return 1;
				891	}
				892	}
				893	}
				894
				895	for (i = 0; i < num_tgt_chunks; ++i) {
				896	if (tgt_chunks[i].type == CHUNK_DEFLATE) {
				897	// Confirm that given the uncompressed chunk data in the target, we
				898	// can recompress it and get exactly the same bits as are in the
				899	// input target image. If this fails, treat the chunk as a normal
				900	// non-deflated chunk.
				901	if (ReconstructDeflateChunk(tgt_chunks+i) < 0) {
				902	printf("failed to reconstruct target deflate chunk %d [%s]; "
				903	"treating as normal\n", i, tgt_chunks[i].filename);
				904	ChangeDeflateChunkToNormal(tgt_chunks+i);
				905	if (zip_mode) {
				906	ImageChunk* src = FindChunkByName(tgt_chunks[i].filename, src_chunks, num_src_chunks);
				907	if (src) {
				908	ChangeDeflateChunkToNormal(src);
				909	}
				910	} else {
				911	ChangeDeflateChunkToNormal(src_chunks+i);
				912	}
				913	continue;
				914	}
				915
				916	// If two deflate chunks are identical (eg, the kernel has not
				917	// changed between two builds), treat them as normal chunks.
				918	// This makes applypatch much faster -- it can apply a trivial
				919	// patch to the compressed data, rather than uncompressing and
				920	// recompressing to apply the trivial patch to the uncompressed
				921	// data.
				922	ImageChunk* src;
				923	if (zip_mode) {
				924	src = FindChunkByName(tgt_chunks[i].filename, src_chunks, num_src_chunks);
				925	} else {
				926	src = src_chunks+i;
				927	}
				928
				929	if (src == NULL \|\| AreChunksEqual(tgt_chunks+i, src)) {
				930	ChangeDeflateChunkToNormal(tgt_chunks+i);
				931	if (src) {
				932	ChangeDeflateChunkToNormal(src);
				933	}
				934	}
				935	}
				936	}
				937
				938	// Merging neighboring normal chunks.
				939	if (zip_mode) {
				940	// For zips, we only need to do this to the target: deflated
				941	// chunks are matched via filename, and normal chunks are patched
				942	// using the entire source file as the source.
				943	MergeAdjacentNormalChunks(tgt_chunks, &num_tgt_chunks);
				944	} else {
				945	// For images, we need to maintain the parallel structure of the
				946	// chunk lists, so do the merging in both the source and target
				947	// lists.
				948	MergeAdjacentNormalChunks(tgt_chunks, &num_tgt_chunks);
				949	MergeAdjacentNormalChunks(src_chunks, &num_src_chunks);
				950	if (num_src_chunks != num_tgt_chunks) {
				951	// This shouldn't happen.
				952	printf("merging normal chunks went awry\n");
				953	return 1;
				954	}
				955	}
				956
				957	// Compute bsdiff patches for each chunk's data (the uncompressed
				958	// data, in the case of deflate chunks).
				959
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	960	DumpChunks(src_chunks, num_src_chunks);
				961
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	962	printf("Construct patches for %d chunks...\n", num_tgt_chunks);
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	963	unsigned char patch_data = reinterpret_cast<unsigned char>(malloc(
				964	num_tgt_chunks * sizeof(unsigned char*)));
				965	size_t* patch_size = reinterpret_cast<size_t>(malloc(num_tgt_chunks sizeof(size_t)));
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	966	for (i = 0; i < num_tgt_chunks; ++i) {
				967	if (zip_mode) {
				968	ImageChunk* src;
				969	if (tgt_chunks[i].type == CHUNK_DEFLATE &&
				970	(src = FindChunkByName(tgt_chunks[i].filename, src_chunks,
				971	num_src_chunks))) {
				972	patch_data[i] = MakePatch(src, tgt_chunks+i, patch_size+i);
				973	} else {
				974	patch_data[i] = MakePatch(src_chunks, tgt_chunks+i, patch_size+i);
				975	}
				976	} else {
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	977	if (i == 1 && bonus_data) {
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	978	printf(" using %zu bytes of bonus data for chunk %d\n", bonus_size, i);
				979	src_chunks[i].data = reinterpret_cast<unsigned char*>(realloc(src_chunks[i].data,
				980	src_chunks[i].len + bonus_size));
Tao Bao	a0c4011	2016-06-01 13:15:44 -0700	[diff] [blame]	981	memcpy(src_chunks[i].data+src_chunks[i].len, bonus_data, bonus_size);
Doug Zongker	a3ccba6	2012-08-20 15:28:02 -0700	[diff] [blame]	982	src_chunks[i].len += bonus_size;
				983	}
				984
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	985	patch_data[i] = MakePatch(src_chunks+i, tgt_chunks+i, patch_size+i);
				986	}
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	987	printf("patch %3d is %zu bytes (of %zu)\n",
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	988	i, patch_size[i], tgt_chunks[i].source_len);
				989	}
				990
				991	// Figure out how big the imgdiff file header is going to be, so
				992	// that we can correctly compute the offset of each bsdiff patch
				993	// within the file.
				994
				995	size_t total_header_size = 12;
				996	for (i = 0; i < num_tgt_chunks; ++i) {
				997	total_header_size += 4;
				998	switch (tgt_chunks[i].type) {
				999	case CHUNK_NORMAL:
				1000	total_header_size += 8*3;
				1001	break;
				1002	case CHUNK_DEFLATE:
				1003	total_header_size += 85 + 45;
				1004	break;
				1005	case CHUNK_RAW:
				1006	total_header_size += 4 + patch_size[i];
				1007	break;
				1008	}
				1009	}
				1010
				1011	size_t offset = total_header_size;
				1012
				1013	FILE* f = fopen(argv[3], "wb");
				1014
				1015	// Write out the headers.
				1016
				1017	fwrite("IMGDIFF2", 1, 8, f);
				1018	Write4(num_tgt_chunks, f);
				1019	for (i = 0; i < num_tgt_chunks; ++i) {
				1020	Write4(tgt_chunks[i].type, f);
				1021
				1022	switch (tgt_chunks[i].type) {
				1023	case CHUNK_NORMAL:
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	1024	printf("chunk %3d: normal (%10zu, %10zu) %10zu\n", i,
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1025	tgt_chunks[i].start, tgt_chunks[i].len, patch_size[i]);
				1026	Write8(tgt_chunks[i].source_start, f);
				1027	Write8(tgt_chunks[i].source_len, f);
				1028	Write8(offset, f);
				1029	offset += patch_size[i];
				1030	break;
				1031
				1032	case CHUNK_DEFLATE:
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	1033	printf("chunk %3d: deflate (%10zu, %10zu) %10zu %s\n", i,
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1034	tgt_chunks[i].start, tgt_chunks[i].deflate_len, patch_size[i],
				1035	tgt_chunks[i].filename);
				1036	Write8(tgt_chunks[i].source_start, f);
				1037	Write8(tgt_chunks[i].source_len, f);
				1038	Write8(offset, f);
				1039	Write8(tgt_chunks[i].source_uncompressed_len, f);
				1040	Write8(tgt_chunks[i].len, f);
				1041	Write4(tgt_chunks[i].level, f);
				1042	Write4(tgt_chunks[i].method, f);
				1043	Write4(tgt_chunks[i].windowBits, f);
				1044	Write4(tgt_chunks[i].memLevel, f);
				1045	Write4(tgt_chunks[i].strategy, f);
				1046	offset += patch_size[i];
				1047	break;
				1048
				1049	case CHUNK_RAW:
Tao Bao	ba9a42a	2015-06-23 23:23:33 -0700	[diff] [blame]	1050	printf("chunk %3d: raw (%10zu, %10zu)\n", i,
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1051	tgt_chunks[i].start, tgt_chunks[i].len);
				1052	Write4(patch_size[i], f);
				1053	fwrite(patch_data[i], 1, patch_size[i], f);
				1054	break;
				1055	}
				1056	}
				1057
				1058	// Append each chunk's bsdiff patch, in order.
				1059
				1060	for (i = 0; i < num_tgt_chunks; ++i) {
				1061	if (tgt_chunks[i].type != CHUNK_RAW) {
				1062	fwrite(patch_data[i], 1, patch_size[i], f);
				1063	}
				1064	}
				1065
Rahul Chaudhry	3a5177b	2016-11-15 16:18:46 -0800	[diff] [blame^]	1066	free(patch_data);
				1067	free(patch_size);
				1068
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1069	fclose(f);
Doug Zongker	512536a	2010-02-17 16:11:44 -0800	[diff] [blame]	1070
				1071	return 0;
				1072	}