Heap.cpp 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281
  1. /*
  2. * Copyright (c) 2021, Jan de Visser <jan@de-visser.net>
  3. * Copyright (c) 2023, Jelle Raaijmakers <jelle@gmta.nl>
  4. *
  5. * SPDX-License-Identifier: BSD-2-Clause
  6. */
  7. #include <AK/DeprecatedString.h>
  8. #include <AK/Format.h>
  9. #include <AK/QuickSort.h>
  10. #include <LibCore/IODevice.h>
  11. #include <LibCore/System.h>
  12. #include <LibSQL/Heap.h>
  13. #include <sys/stat.h>
  14. namespace SQL {
  15. Heap::Heap(DeprecatedString file_name)
  16. {
  17. set_name(move(file_name));
  18. }
  19. Heap::~Heap()
  20. {
  21. if (m_file && !m_write_ahead_log.is_empty()) {
  22. if (auto maybe_error = flush(); maybe_error.is_error())
  23. warnln("~Heap({}): {}", name(), maybe_error.error());
  24. }
  25. }
  26. ErrorOr<void> Heap::open()
  27. {
  28. size_t file_size = 0;
  29. struct stat stat_buffer;
  30. if (stat(name().characters(), &stat_buffer) != 0) {
  31. if (errno != ENOENT) {
  32. warnln("Heap::open({}): could not stat: {}"sv, name(), strerror(errno));
  33. return Error::from_string_literal("Heap::open(): could not stat file");
  34. }
  35. } else if (!S_ISREG(stat_buffer.st_mode)) {
  36. warnln("Heap::open({}): can only use regular files"sv, name());
  37. return Error::from_string_literal("Heap::open(): can only use regular files");
  38. } else {
  39. file_size = stat_buffer.st_size;
  40. }
  41. if (file_size > 0) {
  42. m_next_block = file_size / Block::SIZE;
  43. m_highest_block_written = m_next_block - 1;
  44. }
  45. auto file = TRY(Core::File::open(name(), Core::File::OpenMode::ReadWrite));
  46. m_file = TRY(Core::BufferedFile::create(move(file)));
  47. if (file_size > 0) {
  48. if (auto error_maybe = read_zero_block(); error_maybe.is_error()) {
  49. m_file = nullptr;
  50. return error_maybe.release_error();
  51. }
  52. } else {
  53. TRY(initialize_zero_block());
  54. }
  55. // FIXME: We should more gracefully handle version incompatibilities. For now, we drop the database.
  56. if (m_version != VERSION) {
  57. dbgln_if(SQL_DEBUG, "Heap file {} opened has incompatible version {}. Deleting for version {}.", name(), m_version, VERSION);
  58. m_file = nullptr;
  59. TRY(Core::System::unlink(name()));
  60. return open();
  61. }
  62. dbgln_if(SQL_DEBUG, "Heap file {} opened; number of blocks = {}", name(), m_highest_block_written);
  63. return {};
  64. }
  65. bool Heap::has_block(Block::Index index) const
  66. {
  67. return index <= m_highest_block_written || m_write_ahead_log.contains(index);
  68. }
  69. ErrorOr<ByteBuffer> Heap::read_storage(Block::Index index)
  70. {
  71. dbgln_if(SQL_DEBUG, "{}({})", __FUNCTION__, index);
  72. // Reconstruct the data storage from a potential chain of blocks
  73. ByteBuffer data;
  74. while (index > 0) {
  75. auto block = TRY(read_block(index));
  76. dbgln_if(SQL_DEBUG, " -> {} bytes", block.size_in_bytes());
  77. TRY(data.try_append(block.data().bytes().slice(0, block.size_in_bytes())));
  78. index = block.next_block();
  79. }
  80. return data;
  81. }
  82. ErrorOr<void> Heap::write_storage(Block::Index index, ReadonlyBytes data)
  83. {
  84. dbgln_if(SQL_DEBUG, "{}({}, {} bytes)", __FUNCTION__, index, data.size());
  85. VERIFY(data.size() > 0);
  86. // Split up the storage across multiple blocks if necessary, creating a chain
  87. u32 remaining_size = static_cast<u32>(data.size());
  88. u32 offset_in_data = 0;
  89. while (remaining_size > 0) {
  90. auto block_data_size = AK::min(remaining_size, Block::DATA_SIZE);
  91. remaining_size -= block_data_size;
  92. auto next_block_index = (remaining_size > 0) ? request_new_block_index() : 0;
  93. auto block_data = TRY(ByteBuffer::create_uninitialized(block_data_size));
  94. block_data.bytes().overwrite(0, data.offset(offset_in_data), block_data_size);
  95. TRY(write_block({ index, block_data_size, next_block_index, move(block_data) }));
  96. index = next_block_index;
  97. offset_in_data += block_data_size;
  98. }
  99. return {};
  100. }
  101. ErrorOr<ByteBuffer> Heap::read_raw_block(Block::Index index)
  102. {
  103. VERIFY(m_file);
  104. VERIFY(index < m_next_block);
  105. if (auto data = m_write_ahead_log.get(index); data.has_value())
  106. return data.value();
  107. TRY(m_file->seek(index * Block::SIZE, SeekMode::SetPosition));
  108. auto buffer = TRY(ByteBuffer::create_uninitialized(Block::SIZE));
  109. TRY(m_file->read_until_filled(buffer));
  110. return buffer;
  111. }
  112. ErrorOr<Block> Heap::read_block(Block::Index index)
  113. {
  114. dbgln_if(SQL_DEBUG, "Read heap block {}", index);
  115. auto buffer = TRY(read_raw_block(index));
  116. auto size_in_bytes = *reinterpret_cast<u32*>(buffer.offset_pointer(0));
  117. auto next_block = *reinterpret_cast<Block::Index*>(buffer.offset_pointer(sizeof(u32)));
  118. auto data = TRY(buffer.slice(Block::HEADER_SIZE, Block::DATA_SIZE));
  119. return Block { index, size_in_bytes, next_block, move(data) };
  120. }
  121. ErrorOr<void> Heap::write_raw_block(Block::Index index, ReadonlyBytes data)
  122. {
  123. dbgln_if(SQL_DEBUG, "Write raw block {}", index);
  124. VERIFY(m_file);
  125. VERIFY(data.size() == Block::SIZE);
  126. TRY(m_file->seek(index * Block::SIZE, SeekMode::SetPosition));
  127. TRY(m_file->write_until_depleted(data));
  128. if (index > m_highest_block_written)
  129. m_highest_block_written = index;
  130. return {};
  131. }
  132. ErrorOr<void> Heap::write_raw_block_to_wal(Block::Index index, ByteBuffer&& data)
  133. {
  134. dbgln_if(SQL_DEBUG, "{}(): adding raw block {} to WAL", __FUNCTION__, index);
  135. VERIFY(index < m_next_block);
  136. VERIFY(data.size() == Block::SIZE);
  137. TRY(m_write_ahead_log.try_set(index, move(data)));
  138. return {};
  139. }
  140. ErrorOr<void> Heap::write_block(Block const& block)
  141. {
  142. VERIFY(block.index() < m_next_block);
  143. VERIFY(block.next_block() < m_next_block);
  144. VERIFY(block.data().size() <= Block::DATA_SIZE);
  145. auto size_in_bytes = block.size_in_bytes();
  146. auto next_block = block.next_block();
  147. auto heap_data = TRY(ByteBuffer::create_zeroed(Block::SIZE));
  148. heap_data.overwrite(0, &size_in_bytes, sizeof(size_in_bytes));
  149. heap_data.overwrite(sizeof(size_in_bytes), &next_block, sizeof(next_block));
  150. block.data().bytes().copy_to(heap_data.bytes().slice(Block::HEADER_SIZE));
  151. return write_raw_block_to_wal(block.index(), move(heap_data));
  152. }
  153. ErrorOr<void> Heap::flush()
  154. {
  155. VERIFY(m_file);
  156. auto indices = m_write_ahead_log.keys();
  157. quick_sort(indices);
  158. for (auto index : indices) {
  159. dbgln_if(SQL_DEBUG, "Flushing block {} to {}", index, name());
  160. auto& data = m_write_ahead_log.get(index).value();
  161. TRY(write_raw_block(index, data));
  162. }
  163. m_write_ahead_log.clear();
  164. dbgln_if(SQL_DEBUG, "WAL flushed; new number of blocks = {}", m_highest_block_written);
  165. return {};
  166. }
  167. constexpr static auto FILE_ID = "SerenitySQL "sv;
  168. constexpr static auto VERSION_OFFSET = FILE_ID.length();
  169. constexpr static auto SCHEMAS_ROOT_OFFSET = VERSION_OFFSET + sizeof(u32);
  170. constexpr static auto TABLES_ROOT_OFFSET = SCHEMAS_ROOT_OFFSET + sizeof(u32);
  171. constexpr static auto TABLE_COLUMNS_ROOT_OFFSET = TABLES_ROOT_OFFSET + sizeof(u32);
  172. constexpr static auto USER_VALUES_OFFSET = TABLE_COLUMNS_ROOT_OFFSET + sizeof(u32);
  173. ErrorOr<void> Heap::read_zero_block()
  174. {
  175. dbgln_if(SQL_DEBUG, "Read zero block from {}", name());
  176. auto block = TRY(read_raw_block(0));
  177. auto file_id_buffer = TRY(block.slice(0, FILE_ID.length()));
  178. auto file_id = StringView(file_id_buffer);
  179. if (file_id != FILE_ID) {
  180. warnln("{}: Zero page corrupt. This is probably not a {} heap file"sv, name(), FILE_ID);
  181. return Error::from_string_literal("Heap()::read_zero_block(): Zero page corrupt. This is probably not a SerenitySQL heap file");
  182. }
  183. memcpy(&m_version, block.offset_pointer(VERSION_OFFSET), sizeof(u32));
  184. dbgln_if(SQL_DEBUG, "Version: {}.{}", (m_version & 0xFFFF0000) >> 16, (m_version & 0x0000FFFF));
  185. memcpy(&m_schemas_root, block.offset_pointer(SCHEMAS_ROOT_OFFSET), sizeof(u32));
  186. dbgln_if(SQL_DEBUG, "Schemas root node: {}", m_schemas_root);
  187. memcpy(&m_tables_root, block.offset_pointer(TABLES_ROOT_OFFSET), sizeof(u32));
  188. dbgln_if(SQL_DEBUG, "Tables root node: {}", m_tables_root);
  189. memcpy(&m_table_columns_root, block.offset_pointer(TABLE_COLUMNS_ROOT_OFFSET), sizeof(u32));
  190. dbgln_if(SQL_DEBUG, "Table columns root node: {}", m_table_columns_root);
  191. memcpy(m_user_values.data(), block.offset_pointer(USER_VALUES_OFFSET), m_user_values.size() * sizeof(u32));
  192. for (auto ix = 0u; ix < m_user_values.size(); ix++) {
  193. if (m_user_values[ix])
  194. dbgln_if(SQL_DEBUG, "User value {}: {}", ix, m_user_values[ix]);
  195. }
  196. return {};
  197. }
  198. ErrorOr<void> Heap::update_zero_block()
  199. {
  200. dbgln_if(SQL_DEBUG, "Write zero block to {}", name());
  201. dbgln_if(SQL_DEBUG, "Version: {}.{}", (m_version & 0xFFFF0000) >> 16, (m_version & 0x0000FFFF));
  202. dbgln_if(SQL_DEBUG, "Schemas root node: {}", m_schemas_root);
  203. dbgln_if(SQL_DEBUG, "Tables root node: {}", m_tables_root);
  204. dbgln_if(SQL_DEBUG, "Table Columns root node: {}", m_table_columns_root);
  205. for (auto ix = 0u; ix < m_user_values.size(); ix++) {
  206. if (m_user_values[ix] > 0)
  207. dbgln_if(SQL_DEBUG, "User value {}: {}", ix, m_user_values[ix]);
  208. }
  209. auto buffer = TRY(ByteBuffer::create_zeroed(Block::SIZE));
  210. auto buffer_bytes = buffer.bytes();
  211. buffer_bytes.overwrite(0, FILE_ID.characters_without_null_termination(), FILE_ID.length());
  212. buffer_bytes.overwrite(VERSION_OFFSET, &m_version, sizeof(u32));
  213. buffer_bytes.overwrite(SCHEMAS_ROOT_OFFSET, &m_schemas_root, sizeof(u32));
  214. buffer_bytes.overwrite(TABLES_ROOT_OFFSET, &m_tables_root, sizeof(u32));
  215. buffer_bytes.overwrite(TABLE_COLUMNS_ROOT_OFFSET, &m_table_columns_root, sizeof(u32));
  216. buffer_bytes.overwrite(USER_VALUES_OFFSET, m_user_values.data(), m_user_values.size() * sizeof(u32));
  217. return write_raw_block_to_wal(0, move(buffer));
  218. }
  219. ErrorOr<void> Heap::initialize_zero_block()
  220. {
  221. m_version = VERSION;
  222. m_schemas_root = 0;
  223. m_tables_root = 0;
  224. m_table_columns_root = 0;
  225. m_next_block = 1;
  226. for (auto& user : m_user_values)
  227. user = 0u;
  228. return update_zero_block();
  229. }
  230. }