Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 1 | // Copyright (c) 2010 The Chromium Authors. All rights reserved. |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 2 | // Use of this source code is governed by a BSD-style license that can be |
| 3 | // found in the LICENSE file. |
| 4 | |
| 5 | #ifndef CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__ |
| 6 | #define CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__ |
| 7 | |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 8 | #include <string> |
| 9 | #include <vector> |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 10 | #include "base/basictypes.h" |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 11 | #include "update_engine/graph_types.h" |
| 12 | #include "update_engine/update_metadata.pb.h" |
| 13 | |
| 14 | // There is one function in DeltaDiffGenerator of importance to users |
| 15 | // of the class: GenerateDeltaUpdateFile(). Before calling it, |
| 16 | // the old and new images must be mounted. Call GenerateDeltaUpdateFile() |
| 17 | // with both the mount-points of the images in addition to the paths of |
| 18 | // the images (both old and new). A delta from old to new will be |
| 19 | // generated and stored in output_path. |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 20 | |
| 21 | namespace chromeos_update_engine { |
| 22 | |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 23 | // This struct stores all relevant info for an edge that is cut between |
| 24 | // nodes old_src -> old_dst by creating new vertex new_vertex. The new |
| 25 | // relationship is: |
| 26 | // old_src -(read before)-> new_vertex <-(write before)- old_dst |
| 27 | // new_vertex is a MOVE operation that moves some existing blocks into |
| 28 | // temp space. The temp extents are, by necessity, stored in new_vertex |
| 29 | // (as dst extents) and old_dst (as src extents), but they are also broken |
| 30 | // out into tmp_extents, as the nodes themselves may contain many more |
| 31 | // extents. |
| 32 | struct CutEdgeVertexes { |
| 33 | Vertex::Index new_vertex; |
| 34 | Vertex::Index old_src; |
| 35 | Vertex::Index old_dst; |
| 36 | std::vector<Extent> tmp_extents; |
| 37 | }; |
| 38 | |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 39 | class DeltaDiffGenerator { |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 40 | public: |
| 41 | // Represents a disk block on the install partition. |
| 42 | struct Block { |
| 43 | // During install, each block on the install partition will be written |
| 44 | // and some may be read (in all likelihood, many will be read). |
| 45 | // The reading and writing will be performed by InstallOperations, |
| 46 | // each of which has a corresponding vertex in a graph. |
| 47 | // A Block object tells which vertex will read or write this block |
| 48 | // at install time. |
| 49 | // Generally, there will be a vector of Block objects whose length |
| 50 | // is the number of blocks on the install partition. |
| 51 | Block() : reader(Vertex::kInvalidIndex), writer(Vertex::kInvalidIndex) {} |
| 52 | Vertex::Index reader; |
| 53 | Vertex::Index writer; |
| 54 | }; |
| 55 | |
| 56 | // This is the only function that external users of the class should call. |
| 57 | // old_image and new_image are paths to two image files. They should be |
| 58 | // mounted read-only at paths old_root and new_root respectively. |
Andrew de los Reyes | f4c7ef1 | 2010-04-30 10:37:00 -0700 | [diff] [blame] | 59 | // {old,new}_kernel_part are paths to the old and new kernel partition |
| 60 | // images, respectively. |
Andrew de los Reyes | 932bc4c | 2010-08-23 18:14:09 -0700 | [diff] [blame] | 61 | // private_key_path points to a private key used to sign the update. |
| 62 | // Pass empty string to not sign the update. |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 63 | // output_path is the filename where the delta update should be written. |
| 64 | // Returns true on success. |
| 65 | static bool GenerateDeltaUpdateFile(const std::string& old_root, |
| 66 | const std::string& old_image, |
| 67 | const std::string& new_root, |
| 68 | const std::string& new_image, |
Andrew de los Reyes | f4c7ef1 | 2010-04-30 10:37:00 -0700 | [diff] [blame] | 69 | const std::string& old_kernel_part, |
| 70 | const std::string& new_kernel_part, |
Andrew de los Reyes | 932bc4c | 2010-08-23 18:14:09 -0700 | [diff] [blame] | 71 | const std::string& output_path, |
| 72 | const std::string& private_key_path); |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 73 | |
| 74 | // These functions are public so that the unit tests can access them: |
| 75 | |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 76 | // Takes a graph, which is not a DAG, which represents the files just |
| 77 | // read from disk, and converts it into a DAG by breaking all cycles |
| 78 | // and finding temp space to resolve broken edges. |
| 79 | // The final order of the nodes is given in |final_order| |
| 80 | // Some files may need to be reread from disk, thus |fd| and |
| 81 | // |data_file_size| are be passed. |
| 82 | // Returns true on success. |
| 83 | static bool ConvertGraphToDag(Graph* graph, |
| 84 | const std::string& new_root, |
| 85 | int fd, |
| 86 | off_t* data_file_size, |
| 87 | std::vector<Vertex::Index>* final_order); |
| 88 | |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 89 | // Reads old_filename (if it exists) and a new_filename and determines |
| 90 | // the smallest way to encode this file for the diff. It stores |
| 91 | // necessary data in out_data and fills in out_op. |
| 92 | // If there's no change in old and new files, it creates a MOVE |
| 93 | // operation. If there is a change, or the old file doesn't exist, |
| 94 | // the smallest of REPLACE, REPLACE_BZ, or BSDIFF wins. |
| 95 | // new_filename must contain at least one byte. |
| 96 | // Returns true on success. |
| 97 | static bool ReadFileToDiff(const std::string& old_filename, |
| 98 | const std::string& new_filename, |
| 99 | std::vector<char>* out_data, |
| 100 | DeltaArchiveManifest_InstallOperation* out_op); |
| 101 | |
| 102 | // Modifies blocks read by 'op' so that any blocks referred to by |
| 103 | // 'remove_extents' are replaced with blocks from 'replace_extents'. |
| 104 | // 'remove_extents' and 'replace_extents' must be the same number of blocks. |
| 105 | // Blocks will be substituted in the order listed in the vectors. |
| 106 | // E.g. if 'op' reads blocks 1, 2, 3, 4, 5, 6, 7, 8, remove_extents |
| 107 | // contains blocks 6, 2, 3, 5, and replace blocks contains |
| 108 | // 12, 13, 14, 15, then op will be changed to read from: |
| 109 | // 1, 13, 14, 4, 15, 12, 7, 8 |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 110 | static void SubstituteBlocks(Vertex* vertex, |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 111 | const std::vector<Extent>& remove_extents, |
| 112 | const std::vector<Extent>& replace_extents); |
| 113 | |
| 114 | // Cuts 'edges' from 'graph' according to the AU algorithm. This means |
| 115 | // for each edge A->B, remove the dependency that B occur before A. |
| 116 | // Do this by creating a new operation X that copies from the blocks |
| 117 | // specified by the edge's properties to temp space T. Modify B to read |
| 118 | // from T rather than the blocks in the edge. Modify A to depend on X, |
| 119 | // but not on B. Free space is found by looking in 'blocks'. |
| 120 | // Returns true on success. |
| 121 | static bool CutEdges(Graph* graph, |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 122 | const std::set<Edge>& edges, |
| 123 | std::vector<CutEdgeVertexes>* out_cuts); |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 124 | |
| 125 | // Stores all Extents in 'extents' into 'out'. |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 126 | static void StoreExtents(const std::vector<Extent>& extents, |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 127 | google::protobuf::RepeatedPtrField<Extent>* out); |
| 128 | |
| 129 | // Creates all the edges for the graph. Writers of a block point to |
| 130 | // readers of the same block. This is because for an edge A->B, B |
| 131 | // must complete before A executes. |
| 132 | static void CreateEdges(Graph* graph, const std::vector<Block>& blocks); |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 133 | |
| 134 | // Given a topologically sorted graph |op_indexes| and |graph|, alters |
| 135 | // |op_indexes| to move all the full operations to the end of the vector. |
| 136 | // Full operations should not be depended on, so this is safe. |
| 137 | static void MoveFullOpsToBack(Graph* graph, |
| 138 | std::vector<Vertex::Index>* op_indexes); |
| 139 | |
| 140 | // Sorts the vector |cuts| by its |cuts[].old_dest| member. Order is |
| 141 | // determined by the order of elements in op_indexes. |
| 142 | static void SortCutsByTopoOrder(std::vector<Vertex::Index>& op_indexes, |
| 143 | std::vector<CutEdgeVertexes>* cuts); |
| 144 | |
| 145 | // Returns true iff there are no extents in the graph that refer to temp |
| 146 | // blocks. Temp blocks are in the range [kTempBlockStart, kSparseHole). |
| 147 | static bool NoTempBlocksRemain(const Graph& graph); |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 148 | |
| 149 | // Install operations in the manifest may reference data blobs, which |
| 150 | // are in data_blobs_path. This function creates a new data blobs file |
| 151 | // with the data blobs in the same order as the referencing install |
| 152 | // operations in the manifest. E.g. if manifest[0] has a data blob |
| 153 | // "X" at offset 1, manifest[1] has a data blob "Y" at offset 0, |
| 154 | // and data_blobs_path's file contains "YX", new_data_blobs_path |
| 155 | // will set to be a file that contains "XY". |
| 156 | static bool ReorderDataBlobs(DeltaArchiveManifest* manifest, |
| 157 | const std::string& data_blobs_path, |
| 158 | const std::string& new_data_blobs_path); |
Andrew de los Reyes | ef01755 | 2010-10-06 17:57:52 -0700 | [diff] [blame^] | 159 | |
| 160 | // Handles allocation of temp blocks to a cut edge by converting the |
| 161 | // dest node to a full op. This removes the need for temp blocks, but |
| 162 | // comes at the cost of a worse compression ratio. |
| 163 | // For example, say we have A->B->A. It would first be cut to form: |
| 164 | // A->B->N<-A, where N copies blocks to temp space. If there are no |
| 165 | // temp blocks, this function can be called to convert it to the form: |
| 166 | // A->B. Now, A is a full operation. |
| 167 | static bool ConvertCutToFullOp(Graph* graph, |
| 168 | const CutEdgeVertexes& cut, |
| 169 | const std::string& new_root, |
| 170 | int data_fd, |
| 171 | off_t* data_file_size); |
| 172 | |
| 173 | // Takes |op_indexes|, which is effectively a mapping from order in |
| 174 | // which the op is performed -> graph vertex index, and produces the |
| 175 | // reverse: a mapping from graph vertex index -> op_indexes index. |
| 176 | static void GenerateReverseTopoOrderMap( |
| 177 | std::vector<Vertex::Index>& op_indexes, |
| 178 | std::vector<std::vector<Vertex::Index>::size_type>* reverse_op_indexes); |
| 179 | |
| 180 | // Takes a |graph|, which has edges that must be cut, as listed in |
| 181 | // |cuts|. Cuts the edges. Maintains a list in which the operations |
| 182 | // will be performed (in |op_indexes|) and the reverse (in |
| 183 | // |reverse_op_indexes|). Cutting edges requires scratch space, and |
| 184 | // if insufficient scratch is found, the file is reread and will be |
| 185 | // send down (either as REPLACE or REPLACE_BZ). Returns true on |
| 186 | // success. |
| 187 | static bool AssignTempBlocks( |
| 188 | Graph* graph, |
| 189 | const std::string& new_root, |
| 190 | int data_fd, |
| 191 | off_t* data_file_size, |
| 192 | std::vector<Vertex::Index>* op_indexes, |
| 193 | std::vector<std::vector<Vertex::Index>::size_type>* reverse_op_indexes, |
| 194 | std::vector<CutEdgeVertexes>& cuts); |
Andrew de los Reyes | b10320d | 2010-03-31 16:44:44 -0700 | [diff] [blame] | 195 | |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 196 | private: |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 197 | // This should never be constructed |
| 198 | DISALLOW_IMPLICIT_CONSTRUCTORS(DeltaDiffGenerator); |
| 199 | }; |
| 200 | |
// String constants declared here and defined outside this header.
// NOTE(review): judging by the names, these are presumably the paths of the
// bsdiff and bspatch tools and the magic string of a delta file -- confirm
// against the definitions.
extern const char* const kBsdiffPath;
extern const char* const kBspatchPath;
extern const char* const kDeltaMagic;
| 204 | |
adlr@google.com | 3defe6a | 2009-12-04 20:57:17 +0000 | [diff] [blame] | 205 | }; // namespace chromeos_update_engine |
| 206 | |
| 207 | #endif // CHROMEOS_PLATFORM_UPDATE_ENGINE_DELTA_DIFF_GENERATOR_H__ |