blob: c258a5823933130980afe2b41cca6cacee687430 [file] [log] [blame]
// Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
5#ifndef CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__
6#define CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__
7
#include <set>
#include <string>
#include <vector>

#include "base/basictypes.h"
#include "update_engine/graph_types.h"
#include "update_engine/update_metadata.pb.h"
13
// There is one function in DeltaDiffGenerator of importance to users
// of the class: GenerateDeltaUpdateFile(). Before calling it,
// the old and new images must be mounted. Call GenerateDeltaUpdateFile()
// with both the mount-points of the images in addition to the paths of
// the images (both old and new). A delta from old to new will be
// generated and stored in output_path.
adlr@google.com3defe6a2009-12-04 20:57:17 +000020
21namespace chromeos_update_engine {
22
Andrew de los Reyesef017552010-10-06 17:57:52 -070023// This struct stores all relevant info for an edge that is cut between
24// nodes old_src -> old_dst by creating new vertex new_vertex. The new
25// relationship is:
26// old_src -(read before)-> new_vertex <-(write before)- old_dst
27// new_vertex is a MOVE operation that moves some existing blocks into
28// temp space. The temp extents are, by necessity, stored in new_vertex
29// (as dst extents) and old_dst (as src extents), but they are also broken
30// out into tmp_extents, as the nodes themselves may contain many more
31// extents.
32struct CutEdgeVertexes {
33 Vertex::Index new_vertex;
34 Vertex::Index old_src;
35 Vertex::Index old_dst;
36 std::vector<Extent> tmp_extents;
37};
38
adlr@google.com3defe6a2009-12-04 20:57:17 +000039class DeltaDiffGenerator {
Andrew de los Reyesb10320d2010-03-31 16:44:44 -070040 public:
41 // Represents a disk block on the install partition.
42 struct Block {
43 // During install, each block on the install partition will be written
44 // and some may be read (in all likelihood, many will be read).
45 // The reading and writing will be performed by InstallOperations,
46 // each of which has a corresponding vertex in a graph.
47 // A Block object tells which vertex will read or write this block
48 // at install time.
49 // Generally, there will be a vector of Block objects whose length
50 // is the number of blocks on the install partition.
51 Block() : reader(Vertex::kInvalidIndex), writer(Vertex::kInvalidIndex) {}
52 Vertex::Index reader;
53 Vertex::Index writer;
54 };
55
56 // This is the only function that external users of the class should call.
57 // old_image and new_image are paths to two image files. They should be
58 // mounted read-only at paths old_root and new_root respectively.
Andrew de los Reyesf4c7ef12010-04-30 10:37:00 -070059 // {old,new}_kernel_part are paths to the old and new kernel partition
60 // images, respectively.
Andrew de los Reyes932bc4c2010-08-23 18:14:09 -070061 // private_key_path points to a private key used to sign the update.
62 // Pass empty string to not sign the update.
Andrew de los Reyesb10320d2010-03-31 16:44:44 -070063 // output_path is the filename where the delta update should be written.
Darin Petkov8e447e02013-04-16 16:23:50 +020064 // If |chunk_size| is not -1, the delta payload is generated based on
65 // |chunk_size| chunks rather than whole files.
Chris Sosad5ae1562013-04-23 13:20:18 -070066 // This method computes scratch space based on |rootfs_partition_size|.
Jay Srinivasan738fdf32012-12-07 17:40:54 -080067 // Returns true on success. Also writes the size of the metadata into
68 // |metadata_size|.
Andrew de los Reyesb10320d2010-03-31 16:44:44 -070069 static bool GenerateDeltaUpdateFile(const std::string& old_root,
70 const std::string& old_image,
71 const std::string& new_root,
72 const std::string& new_image,
Andrew de los Reyesf4c7ef12010-04-30 10:37:00 -070073 const std::string& old_kernel_part,
74 const std::string& new_kernel_part,
Andrew de los Reyes932bc4c2010-08-23 18:14:09 -070075 const std::string& output_path,
Jay Srinivasan738fdf32012-12-07 17:40:54 -080076 const std::string& private_key_path,
Darin Petkov8e447e02013-04-16 16:23:50 +020077 off_t chunk_size,
Chris Sosad5ae1562013-04-23 13:20:18 -070078 size_t rootfs_partition_size,
Jay Srinivasan738fdf32012-12-07 17:40:54 -080079 uint64_t* metadata_size);
Andrew de los Reyesb10320d2010-03-31 16:44:44 -070080
81 // These functions are public so that the unit tests can access them:
82
Andrew de los Reyesef017552010-10-06 17:57:52 -070083 // Takes a graph, which is not a DAG, which represents the files just
84 // read from disk, and converts it into a DAG by breaking all cycles
85 // and finding temp space to resolve broken edges.
86 // The final order of the nodes is given in |final_order|
87 // Some files may need to be reread from disk, thus |fd| and
88 // |data_file_size| are be passed.
Andrew de los Reyes927179d2010-12-02 11:26:48 -080089 // If |scratch_vertex| is not kInvalidIndex, removes it from
90 // |final_order| before returning.
Andrew de los Reyesef017552010-10-06 17:57:52 -070091 // Returns true on success.
92 static bool ConvertGraphToDag(Graph* graph,
93 const std::string& new_root,
94 int fd,
95 off_t* data_file_size,
Andrew de los Reyes927179d2010-12-02 11:26:48 -080096 std::vector<Vertex::Index>* final_order,
97 Vertex::Index scratch_vertex);
Andrew de los Reyesef017552010-10-06 17:57:52 -070098
Andrew de los Reyesb10320d2010-03-31 16:44:44 -070099 // Reads old_filename (if it exists) and a new_filename and determines
100 // the smallest way to encode this file for the diff. It stores
101 // necessary data in out_data and fills in out_op.
102 // If there's no change in old and new files, it creates a MOVE
103 // operation. If there is a change, or the old file doesn't exist,
104 // the smallest of REPLACE, REPLACE_BZ, or BSDIFF wins.
105 // new_filename must contain at least one byte.
Darin Petkov8e447e02013-04-16 16:23:50 +0200106 // |new_filename| is read starting at |chunk_offset|.
107 // If |chunk_size| is not -1, only up to |chunk_size| bytes are diffed.
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700108 // Returns true on success.
109 static bool ReadFileToDiff(const std::string& old_filename,
110 const std::string& new_filename,
Darin Petkov8e447e02013-04-16 16:23:50 +0200111 off_t chunk_offset,
112 off_t chunk_size,
Don Garrett36e60772012-03-29 10:31:20 -0700113 bool bsdiff_allowed,
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700114 std::vector<char>* out_data,
Darin Petkov68c10d12010-10-14 09:24:37 -0700115 DeltaArchiveManifest_InstallOperation* out_op,
116 bool gather_extents);
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700117
Andrew de los Reyes927179d2010-12-02 11:26:48 -0800118 // Creates a dummy REPLACE_BZ node in the given |vertex|. This can be used
119 // to provide scratch space. The node writes |num_blocks| blocks starting at
120 // |start_block|The node should be marked invalid before writing all nodes to
121 // the output file.
122 static void CreateScratchNode(uint64_t start_block,
123 uint64_t num_blocks,
124 Vertex* vertex);
125
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700126 // Modifies blocks read by 'op' so that any blocks referred to by
127 // 'remove_extents' are replaced with blocks from 'replace_extents'.
128 // 'remove_extents' and 'replace_extents' must be the same number of blocks.
129 // Blocks will be substituted in the order listed in the vectors.
130 // E.g. if 'op' reads blocks 1, 2, 3, 4, 5, 6, 7, 8, remove_extents
131 // contains blocks 6, 2, 3, 5, and replace blocks contains
132 // 12, 13, 14, 15, then op will be changed to read from:
133 // 1, 13, 14, 4, 15, 12, 7, 8
Andrew de los Reyesef017552010-10-06 17:57:52 -0700134 static void SubstituteBlocks(Vertex* vertex,
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700135 const std::vector<Extent>& remove_extents,
136 const std::vector<Extent>& replace_extents);
137
138 // Cuts 'edges' from 'graph' according to the AU algorithm. This means
139 // for each edge A->B, remove the dependency that B occur before A.
140 // Do this by creating a new operation X that copies from the blocks
141 // specified by the edge's properties to temp space T. Modify B to read
142 // from T rather than the blocks in the edge. Modify A to depend on X,
143 // but not on B. Free space is found by looking in 'blocks'.
144 // Returns true on success.
145 static bool CutEdges(Graph* graph,
Andrew de los Reyesef017552010-10-06 17:57:52 -0700146 const std::set<Edge>& edges,
147 std::vector<CutEdgeVertexes>* out_cuts);
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700148
149 // Stores all Extents in 'extents' into 'out'.
Andrew de los Reyesef017552010-10-06 17:57:52 -0700150 static void StoreExtents(const std::vector<Extent>& extents,
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700151 google::protobuf::RepeatedPtrField<Extent>* out);
Darin Petkov7ea32332010-10-13 10:46:11 -0700152
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700153 // Creates all the edges for the graph. Writers of a block point to
154 // readers of the same block. This is because for an edge A->B, B
155 // must complete before A executes.
156 static void CreateEdges(Graph* graph, const std::vector<Block>& blocks);
Andrew de los Reyesef017552010-10-06 17:57:52 -0700157
158 // Given a topologically sorted graph |op_indexes| and |graph|, alters
159 // |op_indexes| to move all the full operations to the end of the vector.
160 // Full operations should not be depended on, so this is safe.
161 static void MoveFullOpsToBack(Graph* graph,
162 std::vector<Vertex::Index>* op_indexes);
163
164 // Sorts the vector |cuts| by its |cuts[].old_dest| member. Order is
165 // determined by the order of elements in op_indexes.
166 static void SortCutsByTopoOrder(std::vector<Vertex::Index>& op_indexes,
167 std::vector<CutEdgeVertexes>* cuts);
168
169 // Returns true iff there are no extents in the graph that refer to temp
170 // blocks. Temp blocks are in the range [kTempBlockStart, kSparseHole).
171 static bool NoTempBlocksRemain(const Graph& graph);
Darin Petkov7ea32332010-10-13 10:46:11 -0700172
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700173 // Install operations in the manifest may reference data blobs, which
174 // are in data_blobs_path. This function creates a new data blobs file
175 // with the data blobs in the same order as the referencing install
176 // operations in the manifest. E.g. if manifest[0] has a data blob
177 // "X" at offset 1, manifest[1] has a data blob "Y" at offset 0,
178 // and data_blobs_path's file contains "YX", new_data_blobs_path
179 // will set to be a file that contains "XY".
180 static bool ReorderDataBlobs(DeltaArchiveManifest* manifest,
181 const std::string& data_blobs_path,
182 const std::string& new_data_blobs_path);
Darin Petkov7ea32332010-10-13 10:46:11 -0700183
Jay Srinivasan00f76b62012-09-17 18:48:36 -0700184 // Computes a SHA256 hash of the given buf and sets the hash value in the
185 // operation so that update_engine could verify. This hash should be set
186 // for all operations that have a non-zero data blob. One exception is the
187 // dummy operation for signature blob because the contents of the signature
188 // blob will not be available at payload creation time. So, update_engine will
189 // gracefully ignore the dummy signature operation.
190 static bool AddOperationHash(DeltaArchiveManifest_InstallOperation* op,
191 const std::vector<char>& buf);
192
Andrew de los Reyesef017552010-10-06 17:57:52 -0700193 // Handles allocation of temp blocks to a cut edge by converting the
194 // dest node to a full op. This removes the need for temp blocks, but
195 // comes at the cost of a worse compression ratio.
196 // For example, say we have A->B->A. It would first be cut to form:
197 // A->B->N<-A, where N copies blocks to temp space. If there are no
198 // temp blocks, this function can be called to convert it to the form:
199 // A->B. Now, A is a full operation.
200 static bool ConvertCutToFullOp(Graph* graph,
201 const CutEdgeVertexes& cut,
202 const std::string& new_root,
203 int data_fd,
204 off_t* data_file_size);
Darin Petkov7ea32332010-10-13 10:46:11 -0700205
Andrew de los Reyesef017552010-10-06 17:57:52 -0700206 // Takes |op_indexes|, which is effectively a mapping from order in
207 // which the op is performed -> graph vertex index, and produces the
208 // reverse: a mapping from graph vertex index -> op_indexes index.
209 static void GenerateReverseTopoOrderMap(
210 std::vector<Vertex::Index>& op_indexes,
211 std::vector<std::vector<Vertex::Index>::size_type>* reverse_op_indexes);
Darin Petkov7ea32332010-10-13 10:46:11 -0700212
Andrew de los Reyesef017552010-10-06 17:57:52 -0700213 // Takes a |graph|, which has edges that must be cut, as listed in
214 // |cuts|. Cuts the edges. Maintains a list in which the operations
215 // will be performed (in |op_indexes|) and the reverse (in
216 // |reverse_op_indexes|). Cutting edges requires scratch space, and
217 // if insufficient scratch is found, the file is reread and will be
218 // send down (either as REPLACE or REPLACE_BZ). Returns true on
219 // success.
220 static bool AssignTempBlocks(
221 Graph* graph,
222 const std::string& new_root,
223 int data_fd,
224 off_t* data_file_size,
225 std::vector<Vertex::Index>* op_indexes,
226 std::vector<std::vector<Vertex::Index>::size_type>* reverse_op_indexes,
Andrew de los Reyes4ba850d2010-10-25 12:12:40 -0700227 const std::vector<CutEdgeVertexes>& cuts);
Andrew de los Reyesb10320d2010-03-31 16:44:44 -0700228
Darin Petkov9fa7ec52010-10-18 11:45:23 -0700229 // Returns true if |op| is a no-op operation that doesn't do any useful work
230 // (e.g., a move operation that copies blocks onto themselves).
231 static bool IsNoopOperation(const DeltaArchiveManifest_InstallOperation& op);
232
Andrew de los Reyes89f17be2010-10-22 13:39:09 -0700233 static bool InitializePartitionInfo(bool is_kernel,
234 const std::string& partition,
235 PartitionInfo* info);
236
Thieu Le5c7d9752010-12-15 16:09:28 -0800237 // Runs the bsdiff tool on two files and returns the resulting delta in
238 // |out|. Returns true on success.
239 static bool BsdiffFiles(const std::string& old_file,
240 const std::string& new_file,
241 std::vector<char>* out);
242
243 // The |blocks| vector contains a reader and writer for each block on the
244 // filesystem that's being in-place updated. We populate the reader/writer
245 // fields of |blocks| by calling this function.
246 // For each block in |operation| that is read or written, find that block
247 // in |blocks| and set the reader/writer field to the vertex passed.
248 // |graph| is not strictly necessary, but useful for printing out
249 // error messages.
250 static bool AddInstallOpToBlocksVector(
251 const DeltaArchiveManifest_InstallOperation& operation,
252 const Graph& graph,
253 Vertex::Index vertex,
254 std::vector<DeltaDiffGenerator::Block>* blocks);
255
Darin Petkov9574f7e2011-01-13 10:48:12 -0800256 // Adds to |manifest| a dummy operation that points to a signature blob
257 // located at the specified offset/length.
258 static void AddSignatureOp(uint64_t signature_blob_offset,
259 uint64_t signature_blob_length,
260 DeltaArchiveManifest* manifest);
261
adlr@google.com3defe6a2009-12-04 20:57:17 +0000262 private:
Jay Srinivasan738fdf32012-12-07 17:40:54 -0800263 // This should never be constructed
adlr@google.com3defe6a2009-12-04 20:57:17 +0000264 DISALLOW_IMPLICIT_CONSTRUCTORS(DeltaDiffGenerator);
265};
266
// Constants declared here and defined in an implementation file that is not
// visible from this header.
// NOTE(review): judging by the names only, kBsdiffPath and kBspatchPath
// locate the bsdiff/bspatch tools, kDeltaMagic is the payload magic string
// and kRootFSPartitionSize is a rootfs partition size -- confirm the exact
// values and units against the definitions.
extern const char* const kBsdiffPath;
extern const char* const kBspatchPath;
extern const char* const kDeltaMagic;
extern const size_t kRootFSPartitionSize;
Andrew de los Reyes09e56d62010-04-23 13:45:53 -0700271
adlr@google.com3defe6a2009-12-04 20:57:17 +0000272}; // namespace chromeos_update_engine
273
274#endif // CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__