OLD | NEW |
| (Empty) |
1 // Copyright (c) 2009 The Chromium Authors. All rights reserved. | |
2 // Use of this source code is governed by a BSD-style license that can be | |
3 // found in the LICENSE file. | |
4 | |
5 // The main idea in Courgette is to do patching *under a tranformation*. The | |
6 // input is transformed into a new representation, patching occurs in the new | |
7 // repesentation, and then the tranform is reversed to get the patched data. | |
8 // | |
9 // The idea is applied to pieces (or 'elements') of the whole (or 'ensemble'). | |
10 // Each of the elements has to go through the same set of steps in lock-step. | |
11 | |
12 // This file contains the code to create the patch. | |
13 | |
14 | |
15 #include "third_party/courgette/ensemble.h" | |
16 | |
17 #include <vector> | |
18 #include <limits> | |
19 | |
20 #include "base/basictypes.h" | |
21 #include "base/logging.h" | |
22 #include "base/time.h" | |
23 | |
24 #include "third_party/courgette/bsdiff.h" | |
25 #include "third_party/courgette/crc.h" | |
26 #include "third_party/courgette/difference_estimator.h" | |
27 #include "third_party/courgette/image_info.h" | |
28 #include "third_party/courgette/streams.h" | |
29 #include "third_party/courgette/region.h" | |
30 #include "third_party/courgette/simple_delta.h" | |
31 | |
32 #include "third_party/courgette/win32_x86_patcher.h" | |
33 #include "third_party/courgette/win32_x86_generator.h" | |
34 | |
35 namespace courgette { | |
36 | |
37 TransformationPatchGenerator::TransformationPatchGenerator( | |
38 Element* old_element, | |
39 Element* new_element, | |
40 TransformationPatcher* patcher) | |
41 : old_element_(old_element), | |
42 new_element_(new_element), | |
43 patcher_(patcher) { | |
44 } | |
45 | |
46 TransformationPatchGenerator::~TransformationPatchGenerator() { | |
47 delete patcher_; | |
48 } | |
49 | |
50 // The default implementation of PredictTransformParameters delegates to the | |
51 // patcher. | |
52 Status TransformationPatchGenerator::PredictTransformParameters( | |
53 SinkStreamSet* prediction) { | |
54 return patcher_->PredictTransformParameters(prediction); | |
55 } | |
56 | |
57 // The default implementation of Reform delegates to the patcher. | |
58 Status TransformationPatchGenerator::Reform( | |
59 SourceStreamSet* transformed_element, | |
60 SinkStream* reformed_element) { | |
61 return patcher_->Reform(transformed_element, reformed_element); | |
62 } | |
63 | |
64 // Makes a TransformationPatchGenerator of the appropriate variety for the | |
65 // Element kind. | |
66 TransformationPatchGenerator* MakeGenerator(Element* old_element, | |
67 Element* new_element) { | |
68 if (new_element->kind() == Element::WIN32_X86_WITH_CODE) { | |
69 CourgetteWin32X86PatchGenerator* generator = | |
70 new CourgetteWin32X86PatchGenerator( | |
71 old_element, | |
72 new_element, | |
73 new CourgetteWin32X86Patcher(old_element->region())); | |
74 return generator; | |
75 } else { | |
76 LOG(WARNING) << "Unexpected Element::Kind " << old_element->kind(); | |
77 return NULL; | |
78 } | |
79 } | |
80 | |
81 // FindGenerators finds TransformationPatchGenerators for the elements of | |
82 // |new_ensemble|. For each element of |new_ensemble| we find the closest | |
83 // matching element from |old_ensemble| and use that as the basis for | |
84 // differential compression. The elements have to be the same kind so as to | |
85 // support transformation into the same kind of 'new representation'. | |
86 // | |
87 Status FindGenerators(Ensemble* old_ensemble, Ensemble* new_ensemble, | |
88 std::vector<TransformationPatchGenerator*>* generators) { | |
89 base::Time start_find_time = base::Time::Now(); | |
90 old_ensemble->FindEmbeddedElements(); | |
91 new_ensemble->FindEmbeddedElements(); | |
92 LOG(INFO) << "done FindEmbeddedElements " | |
93 << (base::Time::Now() - start_find_time).InSecondsF(); | |
94 | |
95 std::vector<Element*> old_elements(old_ensemble->elements()); | |
96 std::vector<Element*> new_elements(new_ensemble->elements()); | |
97 | |
98 LOG(INFO) << "old has " << old_elements.size() << " elements"; | |
99 LOG(INFO) << "new has " << new_elements.size() << " elements"; | |
100 | |
101 DifferenceEstimator difference_estimator; | |
102 std::vector<DifferenceEstimator::Base*> bases; | |
103 | |
104 base::Time start_bases_time = base::Time::Now(); | |
105 for (size_t i = 0; i < old_elements.size(); ++i) { | |
106 bases.push_back( | |
107 difference_estimator.MakeBase(old_elements[i]->region())); | |
108 } | |
109 LOG(INFO) << "done make bases " | |
110 << (base::Time::Now() - start_bases_time).InSecondsF() | |
111 << "s"; | |
112 | |
113 for (size_t new_index = 0; new_index < new_elements.size(); ++new_index) { | |
114 Element* new_element = new_elements[new_index]; | |
115 DifferenceEstimator::Subject* new_subject = | |
116 difference_estimator.MakeSubject(new_element->region()); | |
117 | |
118 // Search through old elements to find the best match. | |
119 // | |
120 // TODO(sra): This is O(N x M), i.e. O(N^2) since old_ensemble and | |
121 // new_ensemble probably have a very similar structure. We can make the | |
122 // search faster by making the comparison provided by DifferenceEstimator | |
123 // more nuanced, returning early if the measured difference is greater than | |
124 // the current best. This will be most effective if we can arrange that the | |
125 // first elements we try to match are likely the 'right' ones. We could | |
126 // prioritize elements that are of a similar size or similar position in the | |
127 // sequence of elements. | |
128 // | |
129 Element* best_old_element = NULL; | |
130 size_t best_difference = std::numeric_limits<size_t>::max(); | |
131 for (size_t old_index = 0; old_index < old_elements.size(); ++old_index) { | |
132 Element* old_element = old_elements[old_index]; | |
133 // Elements of different kinds are incompatible. | |
134 if (old_element->kind() != new_element->kind()) | |
135 continue; | |
136 | |
137 base::Time start_compare = base::Time::Now(); | |
138 DifferenceEstimator::Base* old_base = bases[old_index]; | |
139 size_t difference = difference_estimator.Measure(old_base, new_subject); | |
140 | |
141 LOG(INFO) << "Compare " << old_element->Name() | |
142 << " to " << new_element->Name() | |
143 << " --> " << difference | |
144 << " in " << (base::Time::Now() - start_compare).InSecondsF() | |
145 << "s"; | |
146 if (difference == 0) { | |
147 LOG(INFO) << "Skip " << new_element->Name() | |
148 << " - identical to " << old_element->Name(); | |
149 best_difference = 0; | |
150 best_old_element = NULL; | |
151 break; | |
152 } | |
153 if (difference < best_difference) { | |
154 best_difference = difference; | |
155 best_old_element = old_element; | |
156 } | |
157 } | |
158 | |
159 if (best_old_element) { | |
160 LOG(INFO) << "Matched " << best_old_element->Name() | |
161 << " to " << new_element->Name() | |
162 << " --> " << best_difference; | |
163 TransformationPatchGenerator* generator = | |
164 MakeGenerator(best_old_element, new_element); | |
165 if (generator) | |
166 generators->push_back(generator); | |
167 } | |
168 } | |
169 | |
170 LOG(INFO) << "done FindGenerators " | |
171 << "found " << generators->size() << " in " | |
172 << (base::Time::Now() - start_find_time).InSecondsF() << "s"; | |
173 | |
174 return C_OK; | |
175 } | |
176 | |
177 void FreeGenerators(std::vector<TransformationPatchGenerator*>* generators) { | |
178 for (size_t i = 0; i < generators->size(); ++i) { | |
179 delete (*generators)[i]; | |
180 } | |
181 generators->clear(); | |
182 } | |
183 | |
184 //////////////////////////////////////////////////////////////////////////////// | |
185 | |
186 Status GenerateEnsemblePatch(SourceStream* base, | |
187 SourceStream* update, | |
188 SinkStream* final_patch) { | |
189 Region old_region(base->Buffer(), base->Remaining()); | |
190 Region new_region(update->Buffer(), update->Remaining()); | |
191 Ensemble old_ensemble(old_region, "old"); | |
192 Ensemble new_ensemble(new_region, "new"); | |
193 std::vector<TransformationPatchGenerator*> generators; | |
194 Status generators_status = FindGenerators(&old_ensemble, &new_ensemble, | |
195 &generators); | |
196 if (generators_status != C_OK) | |
197 return generators_status; | |
198 | |
199 SinkStreamSet patch_streams; | |
200 | |
201 SinkStream* tranformation_descriptions = patch_streams.stream(0); | |
202 SinkStream* parameter_correction = patch_streams.stream(1); | |
203 SinkStream* transformed_elements_correction = patch_streams.stream(2); | |
204 SinkStream* ensemble_correction = patch_streams.stream(3); | |
205 | |
206 uint32 number_of_transformations = generators.size(); | |
207 tranformation_descriptions->WriteVarint32(number_of_transformations); | |
208 | |
209 for (size_t i = 0; i < number_of_transformations; ++i) { | |
210 CourgettePatchFile::TransformationMethodId kind = generators[i]->Kind(); | |
211 tranformation_descriptions->WriteVarint32(kind); | |
212 } | |
213 | |
214 for (size_t i = 0; i < number_of_transformations; ++i) { | |
215 Status status = | |
216 generators[i]->WriteInitialParameters(tranformation_descriptions); | |
217 if (status != C_OK) | |
218 return status; | |
219 } | |
220 | |
221 // | |
222 // Generate sub-patch for parameters. | |
223 // | |
224 SinkStreamSet predicted_parameters_sink; | |
225 SinkStreamSet corrected_parameters_sink; | |
226 | |
227 for (size_t i = 0; i < number_of_transformations; ++i) { | |
228 SinkStreamSet single_predicted_parameters; | |
229 Status status; | |
230 status = generators[i]->PredictTransformParameters( | |
231 &single_predicted_parameters); | |
232 if (status != C_OK) | |
233 return status; | |
234 if (!predicted_parameters_sink.WriteSet(&single_predicted_parameters)) | |
235 return C_STREAM_ERROR; | |
236 | |
237 SinkStreamSet single_corrected_parameters; | |
238 status = generators[i]->CorrectedTransformParameters( | |
239 &single_corrected_parameters); | |
240 if (status != C_OK) | |
241 return status; | |
242 if (!corrected_parameters_sink.WriteSet(&single_corrected_parameters)) | |
243 return C_STREAM_ERROR; | |
244 } | |
245 | |
246 SinkStream linearized_predicted_parameters; | |
247 SinkStream linearized_corrected_parameters; | |
248 | |
249 if (!predicted_parameters_sink.CopyTo(&linearized_predicted_parameters)) | |
250 return C_STREAM_ERROR; | |
251 if (!corrected_parameters_sink.CopyTo(&linearized_corrected_parameters)) | |
252 return C_STREAM_ERROR; | |
253 | |
254 SourceStream predicted_parameters_source; | |
255 SourceStream corrected_parameters_source; | |
256 predicted_parameters_source.Init(linearized_predicted_parameters); | |
257 corrected_parameters_source.Init(linearized_corrected_parameters); | |
258 | |
259 Status delta1_status = GenerateSimpleDelta(&predicted_parameters_source, | |
260 &corrected_parameters_source, | |
261 parameter_correction); | |
262 if (delta1_status != C_OK) | |
263 return delta1_status; | |
264 | |
265 // | |
266 // Generate sub-patch for elements. | |
267 // | |
268 corrected_parameters_source.Init(linearized_corrected_parameters); | |
269 SourceStreamSet corrected_parameters_source_set; | |
270 if (!corrected_parameters_source_set.Init(&corrected_parameters_source)) | |
271 return C_STREAM_ERROR; | |
272 | |
273 SinkStreamSet predicted_transformed_elements; | |
274 SinkStreamSet corrected_transformed_elements; | |
275 | |
276 for (size_t i = 0; i < number_of_transformations; ++i) { | |
277 SourceStreamSet single_parameters; | |
278 if (!corrected_parameters_source_set.ReadSet(&single_parameters)) | |
279 return C_STREAM_ERROR; | |
280 SinkStreamSet single_predicted_transformed_element; | |
281 SinkStreamSet single_corrected_transformed_element; | |
282 Status status = generators[i]->Transform( | |
283 &single_parameters, | |
284 &single_predicted_transformed_element, | |
285 &single_corrected_transformed_element); | |
286 if (status != C_OK) | |
287 return status; | |
288 if (!single_parameters.Empty()) | |
289 return C_STREAM_NOT_CONSUMED; | |
290 if (!predicted_transformed_elements.WriteSet( | |
291 &single_predicted_transformed_element)) | |
292 return C_STREAM_ERROR; | |
293 if (!corrected_transformed_elements.WriteSet( | |
294 &single_corrected_transformed_element)) | |
295 return C_STREAM_ERROR; | |
296 } | |
297 | |
298 if (!corrected_parameters_source_set.Empty()) | |
299 return C_STREAM_NOT_CONSUMED; | |
300 | |
301 SinkStream linearized_predicted_transformed_elements; | |
302 SinkStream linearized_corrected_transformed_elements; | |
303 | |
304 if (!predicted_transformed_elements.CopyTo( | |
305 &linearized_predicted_transformed_elements)) | |
306 return C_STREAM_ERROR; | |
307 if (!corrected_transformed_elements.CopyTo( | |
308 &linearized_corrected_transformed_elements)) | |
309 return C_STREAM_ERROR; | |
310 | |
311 SourceStream predicted_transformed_elements_source; | |
312 SourceStream corrected_transformed_elements_source; | |
313 predicted_transformed_elements_source | |
314 .Init(linearized_predicted_transformed_elements); | |
315 corrected_transformed_elements_source | |
316 .Init(linearized_corrected_transformed_elements); | |
317 | |
318 Status delta2_status = | |
319 GenerateSimpleDelta(&predicted_transformed_elements_source, | |
320 &corrected_transformed_elements_source, | |
321 transformed_elements_correction); | |
322 if (delta2_status != C_OK) | |
323 return delta2_status; | |
324 | |
325 // | |
326 // Generate sub-patch for whole enchilada. | |
327 // | |
328 SinkStream predicted_ensemble; | |
329 | |
330 predicted_ensemble.Write(base->Buffer(), base->Remaining()); | |
331 | |
332 SourceStreamSet corrected_transformed_elements_source_set; | |
333 corrected_transformed_elements_source | |
334 .Init(linearized_corrected_transformed_elements); | |
335 if (!corrected_transformed_elements_source_set | |
336 .Init(&corrected_transformed_elements_source)) | |
337 return C_STREAM_ERROR; | |
338 | |
339 for (size_t i = 0; i < number_of_transformations; ++i) { | |
340 SourceStreamSet single_corrected_transformed_element; | |
341 if (!corrected_transformed_elements_source_set.ReadSet( | |
342 &single_corrected_transformed_element)) | |
343 return C_STREAM_ERROR; | |
344 Status status = generators[i]->Reform(&single_corrected_transformed_element, | |
345 &predicted_ensemble); | |
346 if (status != C_OK) | |
347 return status; | |
348 if (!single_corrected_transformed_element.Empty()) | |
349 return C_STREAM_NOT_CONSUMED; | |
350 } | |
351 | |
352 if (!corrected_transformed_elements_source_set.Empty()) | |
353 return C_STREAM_NOT_CONSUMED; | |
354 | |
355 FreeGenerators(&generators); | |
356 | |
357 SourceStream predicted_ensemble_source; | |
358 predicted_ensemble_source.Init(predicted_ensemble); | |
359 Status delta3_status = GenerateSimpleDelta(&predicted_ensemble_source, | |
360 update, | |
361 ensemble_correction); | |
362 if (delta3_status != C_OK) | |
363 return delta3_status; | |
364 | |
365 // | |
366 // Final output stream has a header followed by a StreamSet. | |
367 // | |
368 final_patch->WriteVarint32(CourgettePatchFile::kMagic); | |
369 final_patch->WriteVarint32(CourgettePatchFile::kVersion); | |
370 | |
371 final_patch->WriteVarint32( | |
372 CalculateCrc(old_region.start(), old_region.length())); | |
373 final_patch->WriteVarint32( | |
374 CalculateCrc(new_region.start(), new_region.length())); | |
375 | |
376 if (!patch_streams.CopyTo(final_patch)) | |
377 return C_STREAM_ERROR; | |
378 | |
379 return C_OK; | |
380 } | |
381 | |
382 } // namespace | |
OLD | NEW |