// CompressedBlob.cpp (12 KB)
  1. // Copyright 2008 Dolphin Emulator Project
  2. // SPDX-License-Identifier: GPL-2.0-or-later
  3. #include "DiscIO/CompressedBlob.h"
  4. #include <algorithm>
  5. #include <cstdio>
  6. #include <cstring>
  7. #include <memory>
  8. #include <string>
  9. #include <utility>
  10. #include <vector>
  11. #include <zlib.h>
  12. #ifdef _WIN32
  13. #include <windows.h>
  14. #include <io.h>
  15. #endif
  16. #include "Common/Assert.h"
  17. #include "Common/CommonTypes.h"
  18. #include "Common/FileUtil.h"
  19. #include "Common/Hash.h"
  20. #include "Common/IOFile.h"
  21. #include "Common/Logging/Log.h"
  22. #include "Common/MsgHandler.h"
  23. #include "DiscIO/Blob.h"
  24. #include "DiscIO/DiscScrubber.h"
  25. #include "DiscIO/MultithreadedCompressor.h"
  26. #include "DiscIO/Volume.h"
  27. namespace DiscIO
  28. {
  29. bool IsGCZBlob(File::IOFile& file);
  30. CompressedBlobReader::CompressedBlobReader(File::IOFile file, const std::string& filename)
  31. : m_file(std::move(file)), m_file_name(filename)
  32. {
  33. m_file_size = m_file.GetSize();
  34. m_file.Seek(0, File::SeekOrigin::Begin);
  35. m_file.ReadArray(&m_header, 1);
  36. SetSectorSize(m_header.block_size);
  37. // cache block pointers and hashes
  38. m_block_pointers.resize(m_header.num_blocks);
  39. m_file.ReadArray(m_block_pointers.data(), m_header.num_blocks);
  40. m_hashes.resize(m_header.num_blocks);
  41. m_file.ReadArray(m_hashes.data(), m_header.num_blocks);
  42. m_data_offset = (sizeof(CompressedBlobHeader)) +
  43. (sizeof(u64)) * m_header.num_blocks // skip block pointers
  44. + (sizeof(u32)) * m_header.num_blocks; // skip hashes
  45. // A compressed block is never ever longer than a decompressed block, so just header.block_size
  46. // should be fine.
  47. // I still add some safety margin.
  48. const u32 zlib_buffer_size = m_header.block_size + 64;
  49. m_zlib_buffer.resize(zlib_buffer_size);
  50. }
  51. std::unique_ptr<CompressedBlobReader> CompressedBlobReader::Create(File::IOFile file,
  52. const std::string& filename)
  53. {
  54. if (IsGCZBlob(file))
  55. return std::unique_ptr<CompressedBlobReader>(
  56. new CompressedBlobReader(std::move(file), filename));
  57. return nullptr;
  58. }
  // Destructor is defaulted out of line; the members clean up after themselves.
  59. CompressedBlobReader::~CompressedBlobReader() = default;
  60. std::unique_ptr<BlobReader> CompressedBlobReader::CopyReader() const
  61. {
  62. return Create(m_file.Duplicate("rb"), m_file_name);
  63. }
  64. // IMPORTANT: Calling this function invalidates all earlier pointers gotten from this function.
  65. u64 CompressedBlobReader::GetBlockCompressedSize(u64 block_num) const
  66. {
  67. u64 start = m_block_pointers[block_num];
  68. if (block_num < m_header.num_blocks - 1)
  69. return m_block_pointers[block_num + 1] - start;
  70. else if (block_num == m_header.num_blocks - 1)
  71. return m_header.compressed_data_size - start;
  72. else
  73. ERROR_LOG_FMT(DISCIO, "{} - illegal block number {}", __func__, block_num);
  74. return 0;
  75. }
  76. bool CompressedBlobReader::GetBlock(u64 block_num, u8* out_ptr)
  77. {
  78. bool uncompressed = false;
  79. u32 comp_block_size = (u32)GetBlockCompressedSize(block_num);
  80. u64 offset = m_block_pointers[block_num] + m_data_offset;
  81. if (offset & (1ULL << 63))
  82. {
  83. if (comp_block_size != m_header.block_size)
  84. ERROR_LOG_FMT(DISCIO, "Uncompressed block with wrong size");
  85. uncompressed = true;
  86. offset &= ~(1ULL << 63);
  87. }
  88. // clear unused part of zlib buffer. maybe this can be deleted when it works fully.
  89. memset(&m_zlib_buffer[comp_block_size], 0, m_zlib_buffer.size() - comp_block_size);
  90. m_file.Seek(offset, File::SeekOrigin::Begin);
  91. if (!m_file.ReadBytes(m_zlib_buffer.data(), comp_block_size))
  92. {
  93. ERROR_LOG_FMT(DISCIO, "The disc image \"{}\" is truncated, some of the data is missing.",
  94. m_file_name);
  95. m_file.ClearError();
  96. return false;
  97. }
  98. // First, check hash.
  99. const u32 block_hash = Common::HashAdler32(m_zlib_buffer.data(), comp_block_size);
  100. if (block_hash != m_hashes[block_num])
  101. {
  102. ERROR_LOG_FMT(DISCIO,
  103. "The disc image \"{}\" is corrupt.\n"
  104. "Hash of block {} is {:08x} instead of {:08x}.",
  105. m_file_name, block_num, block_hash, m_hashes[block_num]);
  106. }
  107. if (uncompressed)
  108. {
  109. std::copy_n(m_zlib_buffer.begin(), comp_block_size, out_ptr);
  110. }
  111. else
  112. {
  113. z_stream z = {};
  114. z.next_in = m_zlib_buffer.data();
  115. z.avail_in = comp_block_size;
  116. if (z.avail_in > m_header.block_size)
  117. {
  118. ERROR_LOG_FMT(DISCIO, "Compressed block size is larger than uncompressed block size");
  119. }
  120. z.next_out = out_ptr;
  121. z.avail_out = m_header.block_size;
  122. inflateInit(&z);
  123. int status = inflate(&z, Z_FULL_FLUSH);
  124. u32 uncomp_size = m_header.block_size - z.avail_out;
  125. if (status != Z_STREAM_END)
  126. {
  127. // this seem to fire wrongly from time to time
  128. // to be sure, don't use compressed isos :P
  129. ERROR_LOG_FMT(DISCIO, "Failure reading block {} - out of data and not at end.", block_num);
  130. }
  131. inflateEnd(&z);
  132. if (uncomp_size != m_header.block_size)
  133. {
  134. ERROR_LOG_FMT(DISCIO, "Wrong block size");
  135. return false;
  136. }
  137. }
  138. return true;
  139. }
  140. struct CompressThreadState
  141. {
  142. CompressThreadState() : z{} {}
  143. ~CompressThreadState() { deflateEnd(&z); }
  144. // z_stream will stop working if it changes address, so this object must not be moved
  145. CompressThreadState(const CompressThreadState&) = delete;
  146. CompressThreadState(CompressThreadState&&) = delete;
  147. CompressThreadState& operator=(const CompressThreadState&) = delete;
  148. CompressThreadState& operator=(CompressThreadState&&) = delete;
  149. std::vector<u8> compressed_buffer;
  150. z_stream z;
  151. };
  152. struct CompressParameters
  153. {
  154. std::vector<u8> data{};
  155. u32 block_number = 0;
  156. u64 inpos = 0;
  157. };
  158. struct OutputParameters
  159. {
  160. std::vector<u8> data{};
  161. u32 block_number = 0;
  162. bool compressed = false;
  163. u64 inpos = 0;
  164. };
  165. static ConversionResultCode SetUpCompressThreadState(CompressThreadState* state)
  166. {
  167. return deflateInit(&state->z, 9) == Z_OK ? ConversionResultCode::Success :
  168. ConversionResultCode::InternalError;
  169. }
  170. static ConversionResult<OutputParameters> Compress(CompressThreadState* state,
  171. CompressParameters parameters, int block_size,
  172. std::vector<u32>* hashes, int* num_stored,
  173. int* num_compressed)
  174. {
  175. state->compressed_buffer.resize(block_size);
  176. int retval = deflateReset(&state->z);
  177. state->z.next_in = parameters.data.data();
  178. state->z.avail_in = block_size;
  179. state->z.next_out = state->compressed_buffer.data();
  180. state->z.avail_out = block_size;
  181. if (retval != Z_OK)
  182. {
  183. ERROR_LOG_FMT(DISCIO, "Deflate failed");
  184. return ConversionResultCode::InternalError;
  185. }
  186. const int status = deflate(&state->z, Z_FINISH);
  187. state->compressed_buffer.resize(block_size - state->z.avail_out);
  188. OutputParameters output_parameters;
  189. if ((status != Z_STREAM_END) || (state->z.avail_out < 10))
  190. {
  191. // let's store uncompressed
  192. ++*num_stored;
  193. output_parameters = OutputParameters{std::move(parameters.data), parameters.block_number, false,
  194. parameters.inpos};
  195. }
  196. else
  197. {
  198. // let's store compressed
  199. ++*num_compressed;
  200. output_parameters = OutputParameters{std::move(state->compressed_buffer),
  201. parameters.block_number, true, parameters.inpos};
  202. }
  203. (*hashes)[parameters.block_number] =
  204. Common::HashAdler32(output_parameters.data.data(), output_parameters.data.size());
  205. return std::move(output_parameters);
  206. }
  207. static ConversionResultCode Output(OutputParameters parameters, File::IOFile* outfile,
  208. u64* position, std::vector<u64>* offsets, int progress_monitor,
  209. u32 num_blocks, const CompressCB& callback)
  210. {
  211. u64 offset = *position;
  212. if (!parameters.compressed)
  213. offset |= 0x8000000000000000ULL;
  214. (*offsets)[parameters.block_number] = offset;
  215. *position += parameters.data.size();
  216. if (!outfile->WriteBytes(parameters.data.data(), parameters.data.size()))
  217. return ConversionResultCode::WriteFailed;
  218. if (parameters.block_number % progress_monitor == 0)
  219. {
  220. const int ratio =
  221. parameters.inpos == 0 ? 0 : static_cast<int>(100 * *position / parameters.inpos);
  222. const std::string text = Common::FmtFormatT("{0} of {1} blocks. Compression ratio {2}%",
  223. parameters.block_number, num_blocks, ratio);
  224. const float completion = static_cast<float>(parameters.block_number) / num_blocks;
  225. if (!callback(text, completion))
  226. return ConversionResultCode::Canceled;
  227. }
  228. return ConversionResultCode::Success;
  229. }
  230. bool ConvertToGCZ(BlobReader* infile, const std::string& infile_path,
  231. const std::string& outfile_path, u32 sub_type, int block_size,
  232. const CompressCB& callback)
  233. {
  234. ASSERT(infile->GetDataSizeType() == DataSizeType::Accurate);
  235. File::IOFile outfile(outfile_path, "wb");
  236. if (!outfile)
  237. {
  238. PanicAlertFmtT(
  239. "Failed to open the output file \"{0}\".\n"
  240. "Check that you have permissions to write the target folder and that the media can "
  241. "be written.",
  242. outfile_path);
  243. return false;
  244. }
  245. callback(Common::GetStringT("Files opened, ready to compress."), 0);
  246. CompressedBlobHeader header;
  247. header.magic_cookie = GCZ_MAGIC;
  248. header.sub_type = sub_type;
  249. header.block_size = block_size;
  250. header.data_size = infile->GetDataSize();
  251. // round upwards!
  252. header.num_blocks = (u32)((header.data_size + (block_size - 1)) / block_size);
  253. std::vector<u64> offsets(header.num_blocks);
  254. std::vector<u32> hashes(header.num_blocks);
  255. // seek past the header (we will write it at the end)
  256. outfile.Seek(sizeof(CompressedBlobHeader), File::SeekOrigin::Current);
  257. // seek past the offset and hash tables (we will write them at the end)
  258. outfile.Seek((sizeof(u64) + sizeof(u32)) * header.num_blocks, File::SeekOrigin::Current);
  259. // Now we are ready to write compressed data!
  260. u64 inpos = 0;
  261. u64 position = 0;
  262. int num_compressed = 0;
  263. int num_stored = 0;
  264. int progress_monitor = std::max<int>(1, header.num_blocks / 1000);
  265. const auto compress = [&](CompressThreadState* state, CompressParameters parameters) {
  266. return Compress(state, std::move(parameters), block_size, &hashes, &num_stored,
  267. &num_compressed);
  268. };
  269. const auto output = [&](OutputParameters parameters) {
  270. return Output(std::move(parameters), &outfile, &position, &offsets, progress_monitor,
  271. header.num_blocks, callback);
  272. };
  273. MultithreadedCompressor<CompressThreadState, CompressParameters, OutputParameters> compressor(
  274. SetUpCompressThreadState, compress, output);
  275. std::vector<u8> in_buf(block_size);
  276. for (u32 i = 0; i < header.num_blocks; i++)
  277. {
  278. if (compressor.GetStatus() != ConversionResultCode::Success)
  279. break;
  280. const u64 bytes_to_read = std::min<u64>(block_size, header.data_size - inpos);
  281. if (!infile->Read(inpos, bytes_to_read, in_buf.data()))
  282. {
  283. compressor.SetError(ConversionResultCode::ReadFailed);
  284. break;
  285. }
  286. std::fill(in_buf.begin() + bytes_to_read, in_buf.begin() + header.block_size, 0);
  287. inpos += block_size;
  288. compressor.CompressAndWrite(CompressParameters{in_buf, i, inpos});
  289. }
  290. compressor.Shutdown();
  291. header.compressed_data_size = position;
  292. const ConversionResultCode result = compressor.GetStatus();
  293. if (result != ConversionResultCode::Success)
  294. {
  295. // Remove the incomplete output file.
  296. outfile.Close();
  297. File::Delete(outfile_path);
  298. }
  299. else
  300. {
  301. // Okay, go back and fill in headers
  302. outfile.Seek(0, File::SeekOrigin::Begin);
  303. outfile.WriteArray(&header, 1);
  304. outfile.WriteArray(offsets.data(), header.num_blocks);
  305. outfile.WriteArray(hashes.data(), header.num_blocks);
  306. callback(Common::GetStringT("Done compressing disc image."), 1.0f);
  307. }
  308. if (result == ConversionResultCode::ReadFailed)
  309. PanicAlertFmtT("Failed to read from the input file \"{0}\".", infile_path);
  310. if (result == ConversionResultCode::WriteFailed)
  311. {
  312. PanicAlertFmtT("Failed to write the output file \"{0}\".\n"
  313. "Check that you have enough space available on the target drive.",
  314. outfile_path);
  315. }
  316. return result == ConversionResultCode::Success;
  317. }
  318. bool IsGCZBlob(File::IOFile& file)
  319. {
  320. const u64 position = file.Tell();
  321. if (!file.Seek(0, File::SeekOrigin::Begin))
  322. return false;
  323. CompressedBlobHeader header;
  324. bool is_gcz = file.ReadArray(&header, 1) && header.magic_cookie == GCZ_MAGIC;
  325. file.Seek(position, File::SeekOrigin::Begin);
  326. return is_gcz;
  327. }
  328. } // namespace DiscIO