| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 1 | // | 
 | 2 | // Copyright (C) 2021 The Android Open Source Project | 
 | 3 | // | 
 | 4 | // Licensed under the Apache License, Version 2.0 (the "License"); | 
 | 5 | // you may not use this file except in compliance with the License. | 
 | 6 | // You may obtain a copy of the License at | 
 | 7 | // | 
 | 8 | //      http://www.apache.org/licenses/LICENSE-2.0 | 
 | 9 | // | 
 | 10 | // Unless required by applicable law or agreed to in writing, software | 
 | 11 | // distributed under the License is distributed on an "AS IS" BASIS, | 
 | 12 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
 | 13 | // See the License for the specific language governing permissions and | 
 | 14 | // limitations under the License. | 
 | 15 | // | 
 | 16 |  | 
 | 17 | #include "lz4diff.h" | 
 | 18 | #include "lz4diff_compress.h" | 
 | 19 |  | 
 | 20 | #include <bsdiff/bsdiff.h> | 
 | 21 | #include <bsdiff/constants.h> | 
 | 22 | #include <bsdiff/patch_writer_factory.h> | 
 | 23 | #include <bsdiff/patch_writer.h> | 
 | 24 | #include <puffin/common.h> | 
 | 25 | #include <puffin/puffdiff.h> | 
 | 26 | #include <lz4.h> | 
 | 27 | #include <lz4hc.h> | 
 | 28 |  | 
 | 29 | #include "update_engine/common/utils.h" | 
 | 30 | #include "update_engine/common/hash_calculator.h" | 
 | 31 | #include "update_engine/payload_generator/deflate_utils.h" | 
 | 32 | #include "update_engine/payload_generator/delta_diff_generator.h" | 
 | 33 | #include "lz4diff/lz4diff.pb.h" | 
 | 34 | #include "lz4diff_format.h" | 
 | 35 |  | 
 | 36 | namespace chromeos_update_engine { | 
 | 37 |  | 
 | 38 | bool StoreDstCompressedFileInfo(std::string_view recompressed_blob, | 
 | 39 |                                 std::string_view target_blob, | 
 | 40 |                                 const CompressedFile& dst_file_info, | 
 | 41 |                                 Lz4diffHeader* output) { | 
 | 42 |   *output->mutable_dst_info()->mutable_algo() = dst_file_info.algo; | 
 | 43 |   output->mutable_dst_info()->set_zero_padding_enabled( | 
 | 44 |       dst_file_info.zero_padding_enabled); | 
 | 45 |   const auto& block_info = dst_file_info.blocks; | 
 | 46 |   auto& dst_block_info = *output->mutable_dst_info()->mutable_block_info(); | 
 | 47 |   dst_block_info.Clear(); | 
 | 48 |   size_t offset = 0; | 
 | 49 |   for (const auto& block : block_info) { | 
 | 50 |     auto& pb_block = *dst_block_info.Add(); | 
 | 51 |     pb_block.set_uncompressed_offset(block.uncompressed_offset); | 
 | 52 |     pb_block.set_uncompressed_length(block.uncompressed_length); | 
 | 53 |     pb_block.set_compressed_length(block.compressed_length); | 
 | 54 |     CHECK_LT(offset, recompressed_blob.size()); | 
 | 55 |     auto s1 = recompressed_blob.substr(offset, block.compressed_length); | 
 | 56 |     auto s2 = target_blob.substr(offset, block.compressed_length); | 
 | 57 |     if (s1 != s2) { | 
 | 58 |       ScopedTempFile patch; | 
 | 59 |       int err = | 
 | 60 |           bsdiff::bsdiff(reinterpret_cast<const unsigned char*>(s1.data()), | 
 | 61 |                          s1.size(), | 
 | 62 |                          reinterpret_cast<const unsigned char*>(s2.data()), | 
 | 63 |                          s2.size(), | 
 | 64 |                          patch.path().c_str(), | 
 | 65 |                          nullptr); | 
 | 66 |       CHECK_EQ(err, 0); | 
 | 67 |       LOG(WARNING) << "Recompress Postfix patch size: " | 
 | 68 |                    << utils::FileSize(patch.path()); | 
 | 69 |       std::string patch_content; | 
 | 70 |       TEST_AND_RETURN_FALSE(utils::ReadFile(patch.path(), &patch_content)); | 
 | 71 |       pb_block.set_postfix_bspatch(std::move(patch_content)); | 
 | 72 |     } | 
 | 73 |     // Include recompressed blob hash, so we can determine if the device | 
 | 74 |     // produces same compressed output | 
 | 75 |     Blob recompressed_blob_hash; | 
 | 76 |     TEST_AND_RETURN_FALSE(HashCalculator::RawHashOfBytes( | 
 | 77 |         s1.data(), s1.length(), &recompressed_blob_hash)); | 
 | 78 |     pb_block.set_sha256_hash(recompressed_blob_hash.data(), | 
 | 79 |                              recompressed_blob_hash.size()); | 
 | 80 |  | 
 | 81 |     offset += block.compressed_length; | 
 | 82 |   } | 
 | 83 |   return true; | 
 | 84 | } | 
 | 85 |  | 
 | 86 | template <typename Blob> | 
 | 87 | static bool TryBsdiff(Blob src, Blob dst, Blob* output) noexcept { | 
 | 88 |   static constexpr auto kLz4diffDefaultBrotliQuality = 9; | 
 | 89 |   CHECK_NE(output, nullptr); | 
 | 90 |   ScopedTempFile patch; | 
 | 91 |  | 
 | 92 |   Blob bsdiff_delta; | 
 | 93 |   bsdiff::BsdiffPatchWriter patch_writer(patch.path(), | 
 | 94 |                                          {bsdiff::CompressorType::kBrotli}, | 
 | 95 |                                          kLz4diffDefaultBrotliQuality); | 
 | 96 |   TEST_AND_RETURN_FALSE(0 == bsdiff::bsdiff(src.data(), | 
 | 97 |                                             src.size(), | 
 | 98 |                                             dst.data(), | 
 | 99 |                                             dst.size(), | 
 | 100 |                                             &patch_writer, | 
 | 101 |                                             nullptr)); | 
 | 102 |  | 
 | 103 |   TEST_AND_RETURN_FALSE(utils::ReadFile(patch.path(), &bsdiff_delta)); | 
 | 104 |   TEST_AND_RETURN_FALSE(!bsdiff_delta.empty()); | 
 | 105 |   *output = std::move(bsdiff_delta); | 
 | 106 |   return true; | 
 | 107 | } | 
 | 108 |  | 
 | 109 | bool TryFindDeflates(puffin::Buffer data, | 
 | 110 |                      std::vector<puffin::BitExtent>* deflates) { | 
 | 111 |   if (puffin::LocateDeflatesInZipArchive(data, deflates)) { | 
 | 112 |     return true; | 
 | 113 |   } | 
 | 114 |   deflates->clear(); | 
 | 115 |   if (puffin::LocateDeflatesInGzip(data, deflates)) { | 
 | 116 |     return true; | 
 | 117 |   } | 
 | 118 |   deflates->clear(); | 
 | 119 |   return false; | 
 | 120 | } | 
 | 121 |  | 
 | 122 | static bool ConstructLz4diffPatch(Blob inner_patch, | 
 | 123 |                                   const Lz4diffHeader& header, | 
 | 124 |                                   Blob* output) { | 
| Kelvin Zhang | 893b3a1 | 2021-12-30 12:28:53 -0800 | [diff] [blame] | 125 |   Blob patch(kLz4diffHeaderSize); | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 126 |   std::memcpy(patch.data(), kLz4diffMagic.data(), kLz4diffMagic.size()); | 
 | 127 |   *reinterpret_cast<uint32_t*>(patch.data() + kLz4diffMagic.size()) = | 
 | 128 |       htobe32(kLz4diffVersion); | 
 | 129 |  | 
 | 130 |   std::string serialized_pb; | 
 | 131 |   TEST_AND_RETURN_FALSE(header.SerializeToString(&serialized_pb)); | 
 | 132 |   *reinterpret_cast<uint32_t*>(patch.data() + kLz4diffMagic.size() + 4) = | 
 | 133 |       htobe32(serialized_pb.size()); | 
 | 134 |   patch.insert(patch.end(), serialized_pb.begin(), serialized_pb.end()); | 
 | 135 |   patch.insert(patch.end(), inner_patch.begin(), inner_patch.end()); | 
 | 136 |  | 
 | 137 |   *output = std::move(patch); | 
 | 138 |   return true; | 
 | 139 | } | 
 | 140 |  | 
 | 141 | static bool TryPuffdiff(puffin::Buffer src, | 
 | 142 |                         puffin::Buffer dst, | 
 | 143 |                         Blob* output) noexcept { | 
 | 144 |   CHECK_NE(output, nullptr); | 
 | 145 |   std::vector<puffin::BitExtent> src_deflates; | 
 | 146 |   TEST_AND_RETURN_FALSE(TryFindDeflates(src, &src_deflates)); | 
 | 147 |   std::vector<puffin::BitExtent> dst_deflates; | 
 | 148 |   TEST_AND_RETURN_FALSE(TryFindDeflates(dst, &dst_deflates)); | 
 | 149 |   if (src_deflates.empty() || dst_deflates.empty()) { | 
 | 150 |     return false; | 
 | 151 |   } | 
 | 152 |  | 
 | 153 |   Blob puffdiff_delta; | 
 | 154 |   ScopedTempFile temp_file("puffdiff-delta.XXXXXX"); | 
 | 155 |   // Perform PuffDiff operation. | 
 | 156 |   TEST_AND_RETURN_FALSE(puffin::PuffDiff( | 
 | 157 |       src, dst, src_deflates, dst_deflates, temp_file.path(), &puffdiff_delta)); | 
 | 158 |   TEST_AND_RETURN_FALSE(!puffdiff_delta.empty()); | 
 | 159 |  | 
 | 160 |   *output = std::move(puffdiff_delta); | 
 | 161 |   return true; | 
 | 162 | } | 
 | 163 |  | 
 | 164 | static void StoreSrcCompressedFileInfo(const CompressedFile& src_file_info, | 
 | 165 |                                        Lz4diffHeader* header) { | 
 | 166 |   *header->mutable_src_info()->mutable_algo() = src_file_info.algo; | 
| Kelvin Zhang | 4eae81e | 2021-12-09 17:07:17 -0800 | [diff] [blame] | 167 |   header->mutable_src_info()->set_zero_padding_enabled( | 
 | 168 |       src_file_info.zero_padding_enabled); | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 169 |   auto& src_blocks = *header->mutable_src_info()->mutable_block_info(); | 
 | 170 |   src_blocks.Clear(); | 
 | 171 |   for (const auto& block : src_file_info.blocks) { | 
 | 172 |     auto& block_info = *src_blocks.Add(); | 
 | 173 |     block_info.set_uncompressed_length(block.uncompressed_length); | 
 | 174 |     block_info.set_uncompressed_offset(block.uncompressed_offset); | 
 | 175 |     block_info.set_compressed_length(block.compressed_length); | 
 | 176 |   } | 
 | 177 |   return; | 
 | 178 | } | 
 | 179 |  | 
 | 180 | bool Lz4Diff(std::string_view src, | 
 | 181 |              std::string_view dst, | 
 | 182 |              const CompressedFile& src_file_info, | 
 | 183 |              const CompressedFile& dst_file_info, | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 184 |              Blob* output, | 
 | 185 |              InstallOperation::Type* op_type) noexcept { | 
 | 186 |   const auto& src_block_info = src_file_info.blocks; | 
 | 187 |   const auto& dst_block_info = dst_file_info.blocks; | 
 | 188 |  | 
| Kelvin Zhang | 893b3a1 | 2021-12-30 12:28:53 -0800 | [diff] [blame] | 189 |   auto decompressed_src = TryDecompressBlob( | 
 | 190 |       src, src_block_info, src_file_info.zero_padding_enabled); | 
 | 191 |   auto decompressed_dst = TryDecompressBlob( | 
 | 192 |       dst, dst_block_info, dst_file_info.zero_padding_enabled); | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 193 |   if (decompressed_src.empty() || decompressed_dst.empty()) { | 
 | 194 |     LOG(ERROR) << "Failed to decompress input data"; | 
 | 195 |     return false; | 
 | 196 |   } | 
 | 197 |  | 
 | 198 |   Lz4diffHeader header; | 
 | 199 |   // BSDIFF isn't supposed to fail, so return error if BSDIFF failed. | 
 | 200 |   Blob patch_data; | 
 | 201 |   TEST_AND_RETURN_FALSE( | 
 | 202 |       TryBsdiff(decompressed_src, decompressed_dst, &patch_data)); | 
 | 203 |   header.set_inner_type(InnerPatchType::BSDIFF); | 
 | 204 |   if (op_type) { | 
 | 205 |     *op_type = InstallOperation::LZ4DIFF_BSDIFF; | 
 | 206 |   } | 
 | 207 |   // PUFFDIFF might fail, as the input data might not be deflate compressed. | 
 | 208 |  | 
 | 209 |   Blob puffdiff_delta; | 
 | 210 |   if (TryPuffdiff(decompressed_src, decompressed_dst, &puffdiff_delta) && | 
 | 211 |       puffdiff_delta.size() < patch_data.size()) { | 
 | 212 |     patch_data = std::move(puffdiff_delta); | 
 | 213 |     header.set_inner_type(InnerPatchType::PUFFDIFF); | 
 | 214 |     if (op_type) { | 
 | 215 |       *op_type = InstallOperation::LZ4DIFF_PUFFDIFF; | 
 | 216 |     } | 
 | 217 |   } | 
 | 218 |   // Free up memory used by |decompressed_src| , as we don't need it anymore. | 
 | 219 |   decompressed_src = {}; | 
 | 220 |  | 
 | 221 |   auto recompressed_blob = TryCompressBlob(ToStringView(decompressed_dst), | 
 | 222 |                                            dst_block_info, | 
| Kelvin Zhang | 893b3a1 | 2021-12-30 12:28:53 -0800 | [diff] [blame] | 223 |                                            dst_file_info.zero_padding_enabled, | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 224 |                                            dst_file_info.algo); | 
 | 225 |   TEST_AND_RETURN_FALSE(recompressed_blob.size() > 0); | 
 | 226 |  | 
 | 227 |   StoreSrcCompressedFileInfo(src_file_info, &header); | 
 | 228 |   StoreDstCompressedFileInfo( | 
 | 229 |       ToStringView(recompressed_blob), dst, dst_file_info, &header); | 
 | 230 |   return ConstructLz4diffPatch(std::move(patch_data), header, output); | 
 | 231 | } | 
 | 232 |  | 
 | 233 | bool Lz4Diff(const Blob& src, | 
 | 234 |              const Blob& dst, | 
 | 235 |              const CompressedFile& src_file_info, | 
 | 236 |              const CompressedFile& dst_file_info, | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 237 |              Blob* output, | 
 | 238 |              InstallOperation::Type* op_type) noexcept { | 
 | 239 |   return Lz4Diff(ToStringView(src), | 
 | 240 |                  ToStringView(dst), | 
 | 241 |                  src_file_info, | 
 | 242 |                  dst_file_info, | 
| Kelvin Zhang | ee481e4 | 2021-12-20 12:59:10 -0800 | [diff] [blame] | 243 |                  output, | 
 | 244 |                  op_type); | 
 | 245 | } | 
 | 246 |  | 
 | 247 | }  // namespace chromeos_update_engine |