unzip.cpp 7.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208
  1. /*
  2. * Copyright (c) 2020, Andrés Vieira <anvieiravazquez@gmail.com>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/Assertions.h>
  7. #include <AK/DOSPackedTime.h>
  8. #include <AK/NumberFormat.h>
  9. #include <AK/StringUtils.h>
  10. #include <LibArchive/Zip.h>
  11. #include <LibCompress/Deflate.h>
  12. #include <LibCore/ArgsParser.h>
  13. #include <LibCore/DateTime.h>
  14. #include <LibCore/Directory.h>
  15. #include <LibCore/File.h>
  16. #include <LibCore/MappedFile.h>
  17. #include <LibCore/System.h>
  18. #include <LibCrypto/Checksum/CRC32.h>
  19. #include <LibFileSystem/FileSystem.h>
  20. #include <sys/stat.h>
  21. static ErrorOr<void> adjust_modification_time(Archive::ZipMember const& zip_member)
  22. {
  23. auto time = time_from_packed_dos(zip_member.modification_date, zip_member.modification_time);
  24. auto seconds = static_cast<time_t>(time.seconds_since_epoch());
  25. struct utimbuf buf {
  26. .actime = seconds,
  27. .modtime = seconds
  28. };
  29. return Core::System::utime(zip_member.name, buf);
  30. }
  31. static bool unpack_zip_member(Archive::ZipMember zip_member, bool quiet)
  32. {
  33. if (zip_member.is_directory) {
  34. if (auto maybe_error = Core::System::mkdir(zip_member.name, 0755); maybe_error.is_error()) {
  35. warnln("Failed to create directory '{}': {}", zip_member.name, maybe_error.error());
  36. return false;
  37. }
  38. if (!quiet)
  39. outln(" extracting: {}", zip_member.name);
  40. return true;
  41. }
  42. MUST(Core::Directory::create(LexicalPath(zip_member.name.to_deprecated_string()).parent(), Core::Directory::CreateDirectories::Yes));
  43. auto new_file_or_error = Core::File::open(zip_member.name.to_deprecated_string(), Core::File::OpenMode::Write);
  44. if (new_file_or_error.is_error()) {
  45. warnln("Can't write file {}: {}", zip_member.name, new_file_or_error.release_error());
  46. return false;
  47. }
  48. auto new_file = new_file_or_error.release_value();
  49. if (!quiet)
  50. outln(" extracting: {}", zip_member.name);
  51. Crypto::Checksum::CRC32 checksum;
  52. switch (zip_member.compression_method) {
  53. case Archive::ZipCompressionMethod::Store: {
  54. if (auto maybe_error = new_file->write_until_depleted(zip_member.compressed_data); maybe_error.is_error()) {
  55. warnln("Can't write file contents in {}: {}", zip_member.name, maybe_error.release_error());
  56. return false;
  57. }
  58. checksum.update({ zip_member.compressed_data.data(), zip_member.compressed_data.size() });
  59. break;
  60. }
  61. case Archive::ZipCompressionMethod::Deflate: {
  62. auto decompressed_data = Compress::DeflateDecompressor::decompress_all(zip_member.compressed_data);
  63. if (decompressed_data.is_error()) {
  64. warnln("Failed decompressing file {}: {}", zip_member.name, decompressed_data.error());
  65. return false;
  66. }
  67. if (decompressed_data.value().size() != zip_member.uncompressed_size) {
  68. warnln("Failed decompressing file {}", zip_member.name);
  69. return false;
  70. }
  71. if (auto maybe_error = new_file->write_until_depleted(decompressed_data.value()); maybe_error.is_error()) {
  72. warnln("Can't write file contents in {}: {}", zip_member.name, maybe_error.release_error());
  73. return false;
  74. }
  75. checksum.update(decompressed_data.value());
  76. break;
  77. }
  78. default:
  79. VERIFY_NOT_REACHED();
  80. }
  81. if (adjust_modification_time(zip_member).is_error()) {
  82. warnln("Failed setting modification_time for file {}", zip_member.name);
  83. return false;
  84. }
  85. new_file->close();
  86. if (checksum.digest() != zip_member.crc32) {
  87. warnln("Failed decompressing file {}: CRC32 mismatch", zip_member.name);
  88. MUST(FileSystem::remove(zip_member.name, FileSystem::RecursionMode::Disallowed));
  89. return false;
  90. }
  91. return true;
  92. }
  93. ErrorOr<int> serenity_main(Main::Arguments arguments)
  94. {
  95. StringView zip_file_path;
  96. bool quiet { false };
  97. bool list_files { false };
  98. StringView output_directory_path;
  99. Vector<StringView> file_filters;
  100. Core::ArgsParser args_parser;
  101. args_parser.add_option(list_files, "Only list files in the archive", "list", 'l');
  102. args_parser.add_option(output_directory_path, "Directory to receive the archive content", "output-directory", 'd', "path");
  103. args_parser.add_option(quiet, "Be less verbose", "quiet", 'q');
  104. args_parser.add_positional_argument(zip_file_path, "File to unzip", "path", Core::ArgsParser::Required::Yes);
  105. args_parser.add_positional_argument(file_filters, "Files or filters in the archive to extract", "files", Core::ArgsParser::Required::No);
  106. args_parser.parse(arguments);
  107. struct stat st = TRY(Core::System::stat(zip_file_path));
  108. // FIXME: Map file chunk-by-chunk once we have mmap() with offset.
  109. // This will require mapping some parts then unmapping them repeatedly,
  110. // but it would be significantly faster and less syscall heavy than seek()/read() at every read.
  111. RefPtr<Core::MappedFile> mapped_file;
  112. ReadonlyBytes input_bytes;
  113. if (st.st_size > 0) {
  114. mapped_file = TRY(Core::MappedFile::map(zip_file_path));
  115. input_bytes = mapped_file->bytes();
  116. }
  117. if (!quiet)
  118. warnln("Archive: {}", zip_file_path);
  119. auto zip_file = Archive::Zip::try_create(input_bytes);
  120. if (!zip_file.has_value()) {
  121. warnln("Invalid zip file {}", zip_file_path);
  122. return 1;
  123. }
  124. if (!output_directory_path.is_null()) {
  125. TRY(Core::Directory::create(output_directory_path, Core::Directory::CreateDirectories::Yes));
  126. TRY(Core::System::chdir(output_directory_path));
  127. }
  128. if (list_files) {
  129. outln(" Length Date Time Name");
  130. outln("--------- ---------- -------- ----");
  131. u32 members_count = 0;
  132. u64 total_size = 0;
  133. TRY(zip_file->for_each_member([&](auto zip_member) -> ErrorOr<IterationDecision> {
  134. members_count++;
  135. auto time = time_from_packed_dos(zip_member.modification_date, zip_member.modification_time);
  136. auto time_str = TRY(Core::DateTime::from_timestamp(time.seconds_since_epoch()).to_string());
  137. total_size += zip_member.uncompressed_size;
  138. outln("{:>9} {} {}", zip_member.uncompressed_size, time_str, zip_member.name);
  139. return IterationDecision::Continue;
  140. }));
  141. outln("--------- ----");
  142. outln("{:>9} {} files", total_size, members_count);
  143. return 0;
  144. }
  145. Vector<Archive::ZipMember> zip_directories;
  146. auto success = TRY(zip_file->for_each_member([&](auto zip_member) {
  147. bool keep_file = false;
  148. if (!file_filters.is_empty()) {
  149. for (auto& filter : file_filters) {
  150. // Convert underscore wildcards (usual unzip convention) to question marks (as used by StringUtils)
  151. auto string_filter = filter.replace("_"sv, "?"sv, ReplaceMode::All);
  152. if (zip_member.name.bytes_as_string_view().matches(string_filter, CaseSensitivity::CaseSensitive)) {
  153. keep_file = true;
  154. break;
  155. }
  156. }
  157. } else {
  158. keep_file = true;
  159. }
  160. if (keep_file) {
  161. if (!unpack_zip_member(zip_member, quiet))
  162. return IterationDecision::Break;
  163. if (zip_member.is_directory)
  164. zip_directories.append(zip_member);
  165. }
  166. return IterationDecision::Continue;
  167. }));
  168. if (!success) {
  169. return 1;
  170. }
  171. for (auto& directory : zip_directories) {
  172. if (adjust_modification_time(directory).is_error()) {
  173. warnln("Failed setting modification time for directory {}", directory.name);
  174. return 1;
  175. }
  176. }
  177. return success ? 0 : 1;
  178. }