@nxtedition/rocksdb 5.2.21 → 5.2.28

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (923) hide show
  1. package/binding.cc +510 -967
  2. package/binding.gyp +78 -72
  3. package/chained-batch.js +1 -2
  4. package/deps/rocksdb/build_version.cc +70 -4
  5. package/deps/rocksdb/rocksdb/CMakeLists.txt +281 -149
  6. package/deps/rocksdb/rocksdb/Makefile +459 -469
  7. package/deps/rocksdb/rocksdb/TARGETS +5244 -1500
  8. package/deps/rocksdb/rocksdb/cache/cache.cc +12 -3
  9. package/deps/rocksdb/rocksdb/cache/cache_bench.cc +7 -368
  10. package/deps/rocksdb/rocksdb/cache/cache_bench_tool.cc +924 -0
  11. package/deps/rocksdb/rocksdb/cache/cache_entry_roles.cc +128 -0
  12. package/deps/rocksdb/rocksdb/cache/cache_entry_roles.h +103 -0
  13. package/deps/rocksdb/rocksdb/cache/cache_entry_stats.h +183 -0
  14. package/deps/rocksdb/rocksdb/cache/cache_helpers.h +11 -0
  15. package/deps/rocksdb/rocksdb/cache/cache_key.cc +344 -0
  16. package/deps/rocksdb/rocksdb/cache/cache_key.h +132 -0
  17. package/deps/rocksdb/rocksdb/cache/cache_reservation_manager.cc +183 -0
  18. package/deps/rocksdb/rocksdb/cache/cache_reservation_manager.h +288 -0
  19. package/deps/rocksdb/rocksdb/cache/cache_reservation_manager_test.cc +468 -0
  20. package/deps/rocksdb/rocksdb/cache/cache_test.cc +85 -8
  21. package/deps/rocksdb/rocksdb/cache/clock_cache.cc +121 -51
  22. package/deps/rocksdb/rocksdb/cache/compressed_secondary_cache.cc +171 -0
  23. package/deps/rocksdb/rocksdb/cache/compressed_secondary_cache.h +86 -0
  24. package/deps/rocksdb/rocksdb/cache/compressed_secondary_cache_test.cc +607 -0
  25. package/deps/rocksdb/rocksdb/cache/lru_cache.cc +381 -154
  26. package/deps/rocksdb/rocksdb/cache/lru_cache.h +176 -33
  27. package/deps/rocksdb/rocksdb/cache/lru_cache_test.cc +1659 -3
  28. package/deps/rocksdb/rocksdb/cache/sharded_cache.cc +94 -23
  29. package/deps/rocksdb/rocksdb/cache/sharded_cache.h +49 -28
  30. package/deps/rocksdb/rocksdb/cmake/modules/CxxFlags.cmake +7 -0
  31. package/deps/rocksdb/rocksdb/cmake/modules/FindJeMalloc.cmake +29 -0
  32. package/deps/rocksdb/rocksdb/cmake/modules/FindNUMA.cmake +29 -0
  33. package/deps/rocksdb/rocksdb/cmake/modules/FindSnappy.cmake +29 -0
  34. package/deps/rocksdb/rocksdb/cmake/modules/FindTBB.cmake +33 -0
  35. package/deps/rocksdb/rocksdb/cmake/modules/Findgflags.cmake +29 -0
  36. package/deps/rocksdb/rocksdb/cmake/modules/Findlz4.cmake +29 -0
  37. package/deps/rocksdb/rocksdb/cmake/modules/Finduring.cmake +26 -0
  38. package/deps/rocksdb/rocksdb/cmake/modules/Findzstd.cmake +29 -0
  39. package/deps/rocksdb/rocksdb/cmake/modules/ReadVersion.cmake +10 -0
  40. package/deps/rocksdb/rocksdb/crash_test.mk +93 -0
  41. package/deps/rocksdb/rocksdb/db/arena_wrapped_db_iter.cc +54 -31
  42. package/deps/rocksdb/rocksdb/db/arena_wrapped_db_iter.h +10 -6
  43. package/deps/rocksdb/rocksdb/db/blob/blob_counting_iterator.h +146 -0
  44. package/deps/rocksdb/rocksdb/db/blob/blob_counting_iterator_test.cc +326 -0
  45. package/deps/rocksdb/rocksdb/db/blob/blob_fetcher.cc +34 -0
  46. package/deps/rocksdb/rocksdb/db/blob/blob_fetcher.h +37 -0
  47. package/deps/rocksdb/rocksdb/db/blob/blob_file_addition.cc +4 -2
  48. package/deps/rocksdb/rocksdb/db/blob/blob_file_addition_test.cc +8 -4
  49. package/deps/rocksdb/rocksdb/db/blob/blob_file_builder.cc +99 -40
  50. package/deps/rocksdb/rocksdb/db/blob/blob_file_builder.h +20 -8
  51. package/deps/rocksdb/rocksdb/db/blob/blob_file_builder_test.cc +95 -83
  52. package/deps/rocksdb/rocksdb/db/blob/blob_file_cache.cc +13 -10
  53. package/deps/rocksdb/rocksdb/db/blob/blob_file_cache.h +7 -4
  54. package/deps/rocksdb/rocksdb/db/blob/blob_file_cache_test.cc +37 -37
  55. package/deps/rocksdb/rocksdb/db/blob/blob_file_completion_callback.h +101 -0
  56. package/deps/rocksdb/rocksdb/db/blob/blob_file_meta.cc +8 -1
  57. package/deps/rocksdb/rocksdb/db/blob/blob_file_meta.h +6 -0
  58. package/deps/rocksdb/rocksdb/db/blob/blob_file_reader.cc +209 -44
  59. package/deps/rocksdb/rocksdb/db/blob/blob_file_reader.h +37 -11
  60. package/deps/rocksdb/rocksdb/db/blob/blob_file_reader_test.cc +382 -179
  61. package/deps/rocksdb/rocksdb/db/blob/blob_garbage_meter.cc +100 -0
  62. package/deps/rocksdb/rocksdb/db/blob/blob_garbage_meter.h +102 -0
  63. package/deps/rocksdb/rocksdb/db/blob/blob_garbage_meter_test.cc +196 -0
  64. package/deps/rocksdb/rocksdb/db/blob/blob_index.h +3 -0
  65. package/deps/rocksdb/rocksdb/db/blob/blob_log_format.h +2 -1
  66. package/deps/rocksdb/rocksdb/db/blob/blob_log_sequential_reader.cc +7 -5
  67. package/deps/rocksdb/rocksdb/db/blob/blob_log_sequential_reader.h +10 -3
  68. package/deps/rocksdb/rocksdb/db/blob/blob_log_writer.cc +12 -8
  69. package/deps/rocksdb/rocksdb/db/blob/blob_log_writer.h +5 -5
  70. package/deps/rocksdb/rocksdb/db/blob/db_blob_basic_test.cc +772 -9
  71. package/deps/rocksdb/rocksdb/db/blob/db_blob_compaction_test.cc +730 -0
  72. package/deps/rocksdb/rocksdb/db/blob/db_blob_corruption_test.cc +82 -0
  73. package/deps/rocksdb/rocksdb/db/blob/db_blob_index_test.cc +155 -17
  74. package/deps/rocksdb/rocksdb/db/blob/prefetch_buffer_collection.cc +21 -0
  75. package/deps/rocksdb/rocksdb/db/blob/prefetch_buffer_collection.h +38 -0
  76. package/deps/rocksdb/rocksdb/db/builder.cc +137 -89
  77. package/deps/rocksdb/rocksdb/db/builder.h +16 -37
  78. package/deps/rocksdb/rocksdb/db/c.cc +413 -208
  79. package/deps/rocksdb/rocksdb/db/c_test.c +227 -138
  80. package/deps/rocksdb/rocksdb/db/column_family.cc +118 -103
  81. package/deps/rocksdb/rocksdb/db/column_family.h +86 -44
  82. package/deps/rocksdb/rocksdb/db/column_family_test.cc +38 -24
  83. package/deps/rocksdb/rocksdb/db/compact_files_test.cc +81 -0
  84. package/deps/rocksdb/rocksdb/db/compaction/clipping_iterator.h +275 -0
  85. package/deps/rocksdb/rocksdb/db/compaction/clipping_iterator_test.cc +258 -0
  86. package/deps/rocksdb/rocksdb/db/compaction/compaction.cc +81 -28
  87. package/deps/rocksdb/rocksdb/db/compaction/compaction.h +43 -12
  88. package/deps/rocksdb/rocksdb/db/compaction/compaction_iteration_stats.h +12 -0
  89. package/deps/rocksdb/rocksdb/db/compaction/compaction_iterator.cc +406 -215
  90. package/deps/rocksdb/rocksdb/db/compaction/compaction_iterator.h +147 -50
  91. package/deps/rocksdb/rocksdb/db/compaction/compaction_iterator_test.cc +167 -61
  92. package/deps/rocksdb/rocksdb/db/compaction/compaction_job.cc +1321 -156
  93. package/deps/rocksdb/rocksdb/db/compaction/compaction_job.h +197 -28
  94. package/deps/rocksdb/rocksdb/db/compaction/compaction_job_stats_test.cc +2 -3
  95. package/deps/rocksdb/rocksdb/db/compaction/compaction_job_test.cc +246 -43
  96. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker.cc +65 -26
  97. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker.h +7 -7
  98. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_fifo.cc +122 -9
  99. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_fifo.h +8 -2
  100. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_level.cc +18 -6
  101. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_level.h +1 -1
  102. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_test.cc +536 -44
  103. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_universal.cc +311 -30
  104. package/deps/rocksdb/rocksdb/db/compaction/compaction_picker_universal.h +1 -1
  105. package/deps/rocksdb/rocksdb/db/compaction/compaction_service_test.cc +849 -0
  106. package/deps/rocksdb/rocksdb/db/compaction/file_pri.h +92 -0
  107. package/deps/rocksdb/rocksdb/db/compaction/sst_partitioner.cc +46 -0
  108. package/deps/rocksdb/rocksdb/db/comparator_db_test.cc +1 -1
  109. package/deps/rocksdb/rocksdb/db/convenience.cc +6 -3
  110. package/deps/rocksdb/rocksdb/db/corruption_test.cc +383 -28
  111. package/deps/rocksdb/rocksdb/db/cuckoo_table_db_test.cc +7 -2
  112. package/deps/rocksdb/rocksdb/db/db_basic_test.cc +154 -45
  113. package/deps/rocksdb/rocksdb/db/db_block_cache_test.cc +1095 -33
  114. package/deps/rocksdb/rocksdb/db/db_bloom_filter_test.cc +1249 -203
  115. package/deps/rocksdb/rocksdb/db/db_compaction_filter_test.cc +135 -9
  116. package/deps/rocksdb/rocksdb/db/db_compaction_test.cc +1348 -166
  117. package/deps/rocksdb/rocksdb/db/db_dynamic_level_test.cc +3 -5
  118. package/deps/rocksdb/rocksdb/db/db_encryption_test.cc +1 -1
  119. package/deps/rocksdb/rocksdb/db/db_filesnapshot.cc +312 -45
  120. package/deps/rocksdb/rocksdb/db/db_flush_test.cc +1734 -48
  121. package/deps/rocksdb/rocksdb/db/{compacted_db_impl.cc → db_impl/compacted_db_impl.cc} +24 -7
  122. package/deps/rocksdb/rocksdb/db/{compacted_db_impl.h → db_impl/compacted_db_impl.h} +1 -1
  123. package/deps/rocksdb/rocksdb/db/db_impl/db_impl.cc +644 -333
  124. package/deps/rocksdb/rocksdb/db/db_impl/db_impl.h +365 -92
  125. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_compaction_flush.cc +578 -210
  126. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_debug.cc +38 -16
  127. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_experimental.cc +17 -10
  128. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_files.cc +75 -74
  129. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_open.cc +450 -183
  130. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_readonly.cc +42 -9
  131. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_secondary.cc +232 -15
  132. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_secondary.h +42 -4
  133. package/deps/rocksdb/rocksdb/db/db_impl/db_impl_write.cc +297 -100
  134. package/deps/rocksdb/rocksdb/db/db_info_dumper.cc +16 -15
  135. package/deps/rocksdb/rocksdb/db/db_inplace_update_test.cc +31 -1
  136. package/deps/rocksdb/rocksdb/db/db_io_failure_test.cc +6 -5
  137. package/deps/rocksdb/rocksdb/db/db_iter.cc +218 -153
  138. package/deps/rocksdb/rocksdb/db/db_iter.h +14 -12
  139. package/deps/rocksdb/rocksdb/db/db_iter_stress_test.cc +1 -1
  140. package/deps/rocksdb/rocksdb/db/db_iter_test.cc +84 -160
  141. package/deps/rocksdb/rocksdb/db/db_iterator_test.cc +47 -6
  142. package/deps/rocksdb/rocksdb/db/db_kv_checksum_test.cc +204 -0
  143. package/deps/rocksdb/rocksdb/db/db_log_iter_test.cc +21 -13
  144. package/deps/rocksdb/rocksdb/db/db_logical_block_size_cache_test.cc +17 -10
  145. package/deps/rocksdb/rocksdb/db/db_memtable_test.cc +38 -24
  146. package/deps/rocksdb/rocksdb/db/db_merge_operand_test.cc +184 -19
  147. package/deps/rocksdb/rocksdb/db/db_merge_operator_test.cc +1 -1
  148. package/deps/rocksdb/rocksdb/db/db_options_test.cc +183 -3
  149. package/deps/rocksdb/rocksdb/db/db_properties_test.cc +409 -9
  150. package/deps/rocksdb/rocksdb/db/db_range_del_test.cc +92 -23
  151. package/deps/rocksdb/rocksdb/db/db_rate_limiter_test.cc +446 -0
  152. package/deps/rocksdb/rocksdb/db/{db_impl/db_secondary_test.cc → db_secondary_test.cc} +363 -35
  153. package/deps/rocksdb/rocksdb/db/db_sst_test.cc +520 -15
  154. package/deps/rocksdb/rocksdb/db/db_statistics_test.cc +50 -1
  155. package/deps/rocksdb/rocksdb/db/db_table_properties_test.cc +139 -4
  156. package/deps/rocksdb/rocksdb/db/db_tailing_iter_test.cc +1 -1
  157. package/deps/rocksdb/rocksdb/db/db_test.cc +669 -359
  158. package/deps/rocksdb/rocksdb/db/db_test2.cc +2110 -304
  159. package/deps/rocksdb/rocksdb/db/db_test_util.cc +76 -43
  160. package/deps/rocksdb/rocksdb/db/db_test_util.h +231 -103
  161. package/deps/rocksdb/rocksdb/db/db_universal_compaction_test.cc +19 -11
  162. package/deps/rocksdb/rocksdb/db/db_wal_test.cc +490 -71
  163. package/deps/rocksdb/rocksdb/db/db_with_timestamp_basic_test.cc +980 -349
  164. package/deps/rocksdb/rocksdb/db/db_with_timestamp_compaction_test.cc +11 -12
  165. package/deps/rocksdb/rocksdb/db/db_write_buffer_manager_test.cc +793 -0
  166. package/deps/rocksdb/rocksdb/db/db_write_test.cc +2 -1
  167. package/deps/rocksdb/rocksdb/db/dbformat.cc +4 -12
  168. package/deps/rocksdb/rocksdb/db/dbformat.h +28 -18
  169. package/deps/rocksdb/rocksdb/db/dbformat_test.cc +3 -0
  170. package/deps/rocksdb/rocksdb/db/deletefile_test.cc +50 -15
  171. package/deps/rocksdb/rocksdb/db/error_handler.cc +127 -41
  172. package/deps/rocksdb/rocksdb/db/error_handler.h +12 -5
  173. package/deps/rocksdb/rocksdb/db/error_handler_fs_test.cc +524 -255
  174. package/deps/rocksdb/rocksdb/db/event_helpers.cc +136 -11
  175. package/deps/rocksdb/rocksdb/db/event_helpers.h +27 -2
  176. package/deps/rocksdb/rocksdb/db/experimental.cc +100 -0
  177. package/deps/rocksdb/rocksdb/db/external_sst_file_basic_test.cc +307 -4
  178. package/deps/rocksdb/rocksdb/db/external_sst_file_ingestion_job.cc +137 -60
  179. package/deps/rocksdb/rocksdb/db/external_sst_file_ingestion_job.h +12 -8
  180. package/deps/rocksdb/rocksdb/db/external_sst_file_test.cc +86 -55
  181. package/deps/rocksdb/rocksdb/db/fault_injection_test.cc +86 -5
  182. package/deps/rocksdb/rocksdb/db/filename_test.cc +63 -0
  183. package/deps/rocksdb/rocksdb/db/flush_job.cc +619 -64
  184. package/deps/rocksdb/rocksdb/db/flush_job.h +30 -7
  185. package/deps/rocksdb/rocksdb/db/flush_job_test.cc +33 -16
  186. package/deps/rocksdb/rocksdb/db/flush_scheduler.h +2 -1
  187. package/deps/rocksdb/rocksdb/db/forward_iterator.cc +18 -17
  188. package/deps/rocksdb/rocksdb/db/forward_iterator.h +5 -4
  189. package/deps/rocksdb/rocksdb/db/forward_iterator_bench.cc +0 -1
  190. package/deps/rocksdb/rocksdb/db/history_trimming_iterator.h +91 -0
  191. package/deps/rocksdb/rocksdb/db/import_column_family_job.cc +25 -14
  192. package/deps/rocksdb/rocksdb/db/import_column_family_job.h +6 -5
  193. package/deps/rocksdb/rocksdb/db/import_column_family_test.cc +1 -1
  194. package/deps/rocksdb/rocksdb/db/internal_stats.cc +471 -50
  195. package/deps/rocksdb/rocksdb/db/internal_stats.h +129 -25
  196. package/deps/rocksdb/rocksdb/db/job_context.h +22 -9
  197. package/deps/rocksdb/rocksdb/db/kv_checksum.h +394 -0
  198. package/deps/rocksdb/rocksdb/db/listener_test.cc +518 -41
  199. package/deps/rocksdb/rocksdb/db/log_format.h +4 -1
  200. package/deps/rocksdb/rocksdb/db/log_reader.cc +129 -6
  201. package/deps/rocksdb/rocksdb/db/log_reader.h +17 -1
  202. package/deps/rocksdb/rocksdb/db/log_test.cc +161 -11
  203. package/deps/rocksdb/rocksdb/db/log_writer.cc +92 -13
  204. package/deps/rocksdb/rocksdb/db/log_writer.h +18 -5
  205. package/deps/rocksdb/rocksdb/db/logs_with_prep_tracker.h +1 -1
  206. package/deps/rocksdb/rocksdb/db/lookup_key.h +0 -1
  207. package/deps/rocksdb/rocksdb/db/malloc_stats.cc +2 -2
  208. package/deps/rocksdb/rocksdb/db/manual_compaction_test.cc +21 -8
  209. package/deps/rocksdb/rocksdb/db/memtable.cc +144 -54
  210. package/deps/rocksdb/rocksdb/db/memtable.h +72 -15
  211. package/deps/rocksdb/rocksdb/db/memtable_list.cc +95 -47
  212. package/deps/rocksdb/rocksdb/db/memtable_list.h +33 -13
  213. package/deps/rocksdb/rocksdb/db/memtable_list_test.cc +61 -31
  214. package/deps/rocksdb/rocksdb/db/merge_context.h +20 -8
  215. package/deps/rocksdb/rocksdb/db/merge_helper.cc +54 -11
  216. package/deps/rocksdb/rocksdb/db/merge_helper.h +17 -6
  217. package/deps/rocksdb/rocksdb/db/merge_helper_test.cc +13 -7
  218. package/deps/rocksdb/rocksdb/db/merge_test.cc +40 -19
  219. package/deps/rocksdb/rocksdb/db/obsolete_files_test.cc +14 -25
  220. package/deps/rocksdb/rocksdb/db/output_validator.cc +3 -0
  221. package/deps/rocksdb/rocksdb/db/output_validator.h +5 -4
  222. package/deps/rocksdb/rocksdb/db/perf_context_test.cc +32 -28
  223. package/deps/rocksdb/rocksdb/db/periodic_work_scheduler.cc +43 -29
  224. package/deps/rocksdb/rocksdb/db/periodic_work_scheduler.h +9 -7
  225. package/deps/rocksdb/rocksdb/db/periodic_work_scheduler_test.cc +21 -16
  226. package/deps/rocksdb/rocksdb/db/pinned_iterators_manager.h +1 -1
  227. package/deps/rocksdb/rocksdb/db/plain_table_db_test.cc +29 -36
  228. package/deps/rocksdb/rocksdb/db/pre_release_callback.h +1 -2
  229. package/deps/rocksdb/rocksdb/db/prefix_test.cc +4 -4
  230. package/deps/rocksdb/rocksdb/db/range_del_aggregator.h +2 -2
  231. package/deps/rocksdb/rocksdb/db/range_del_aggregator_bench.cc +11 -11
  232. package/deps/rocksdb/rocksdb/db/range_del_aggregator_test.cc +3 -2
  233. package/deps/rocksdb/rocksdb/db/range_tombstone_fragmenter.cc +14 -8
  234. package/deps/rocksdb/rocksdb/db/range_tombstone_fragmenter.h +17 -0
  235. package/deps/rocksdb/rocksdb/db/range_tombstone_fragmenter_test.cc +4 -2
  236. package/deps/rocksdb/rocksdb/db/read_callback.h +1 -0
  237. package/deps/rocksdb/rocksdb/db/repair.cc +87 -58
  238. package/deps/rocksdb/rocksdb/db/repair_test.cc +35 -5
  239. package/deps/rocksdb/rocksdb/db/snapshot_impl.h +2 -1
  240. package/deps/rocksdb/rocksdb/db/table_cache.cc +95 -69
  241. package/deps/rocksdb/rocksdb/db/table_cache.h +63 -53
  242. package/deps/rocksdb/rocksdb/db/table_properties_collector.cc +4 -4
  243. package/deps/rocksdb/rocksdb/db/table_properties_collector.h +78 -10
  244. package/deps/rocksdb/rocksdb/db/table_properties_collector_test.cc +28 -33
  245. package/deps/rocksdb/rocksdb/db/transaction_log_impl.cc +30 -51
  246. package/deps/rocksdb/rocksdb/db/transaction_log_impl.h +12 -8
  247. package/deps/rocksdb/rocksdb/db/version_builder.cc +564 -341
  248. package/deps/rocksdb/rocksdb/db/version_builder.h +8 -8
  249. package/deps/rocksdb/rocksdb/db/version_builder_test.cc +327 -155
  250. package/deps/rocksdb/rocksdb/db/version_edit.cc +89 -27
  251. package/deps/rocksdb/rocksdb/db/version_edit.h +42 -17
  252. package/deps/rocksdb/rocksdb/db/version_edit_handler.cc +324 -43
  253. package/deps/rocksdb/rocksdb/db/version_edit_handler.h +79 -22
  254. package/deps/rocksdb/rocksdb/db/version_edit_test.cc +165 -20
  255. package/deps/rocksdb/rocksdb/db/version_set.cc +935 -1034
  256. package/deps/rocksdb/rocksdb/db/version_set.h +183 -122
  257. package/deps/rocksdb/rocksdb/db/version_set_test.cc +556 -138
  258. package/deps/rocksdb/rocksdb/db/version_util.h +68 -0
  259. package/deps/rocksdb/rocksdb/db/wal_manager.cc +23 -21
  260. package/deps/rocksdb/rocksdb/db/wal_manager.h +5 -2
  261. package/deps/rocksdb/rocksdb/db/wal_manager_test.cc +30 -27
  262. package/deps/rocksdb/rocksdb/db/write_batch.cc +704 -209
  263. package/deps/rocksdb/rocksdb/db/write_batch_internal.h +135 -2
  264. package/deps/rocksdb/rocksdb/db/write_batch_test.cc +209 -5
  265. package/deps/rocksdb/rocksdb/db/write_callback_test.cc +2 -0
  266. package/deps/rocksdb/rocksdb/db/write_controller.cc +47 -54
  267. package/deps/rocksdb/rocksdb/db/write_controller.h +12 -9
  268. package/deps/rocksdb/rocksdb/db/write_controller_test.cc +215 -103
  269. package/deps/rocksdb/rocksdb/db/write_thread.cc +11 -0
  270. package/deps/rocksdb/rocksdb/db/write_thread.h +14 -8
  271. package/deps/rocksdb/rocksdb/db_stress_tool/CMakeLists.txt +7 -4
  272. package/deps/rocksdb/rocksdb/db_stress_tool/batched_ops_stress.cc +10 -3
  273. package/deps/rocksdb/rocksdb/db_stress_tool/cf_consistency_stress.cc +6 -0
  274. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress.cc +1 -1
  275. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_common.cc +19 -2
  276. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_common.h +78 -25
  277. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_compaction_filter.h +13 -2
  278. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_driver.cc +29 -12
  279. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_env_wrapper.h +5 -1
  280. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_gflags.cc +199 -32
  281. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_listener.cc +188 -0
  282. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_listener.h +59 -10
  283. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_shared_state.h +77 -109
  284. package/deps/rocksdb/rocksdb/{third-party/folly/folly/synchronization/WaitOptions.cpp → db_stress_tool/db_stress_stat.cc} +9 -4
  285. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_stat.h +7 -6
  286. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_table_properties_collector.h +1 -0
  287. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_test_base.cc +699 -143
  288. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_test_base.h +20 -2
  289. package/deps/rocksdb/rocksdb/db_stress_tool/db_stress_tool.cc +49 -39
  290. package/deps/rocksdb/rocksdb/db_stress_tool/expected_state.cc +631 -0
  291. package/deps/rocksdb/rocksdb/db_stress_tool/expected_state.h +287 -0
  292. package/deps/rocksdb/rocksdb/db_stress_tool/multi_ops_txns_stress.cc +1565 -0
  293. package/deps/rocksdb/rocksdb/db_stress_tool/multi_ops_txns_stress.h +374 -0
  294. package/deps/rocksdb/rocksdb/db_stress_tool/no_batched_ops_stress.cc +149 -18
  295. package/deps/rocksdb/rocksdb/env/composite_env.cc +464 -0
  296. package/deps/rocksdb/rocksdb/env/composite_env_wrapper.h +98 -646
  297. package/deps/rocksdb/rocksdb/env/emulated_clock.h +114 -0
  298. package/deps/rocksdb/rocksdb/env/env.cc +632 -42
  299. package/deps/rocksdb/rocksdb/env/env_basic_test.cc +84 -36
  300. package/deps/rocksdb/rocksdb/env/env_chroot.cc +88 -286
  301. package/deps/rocksdb/rocksdb/env/env_chroot.h +34 -1
  302. package/deps/rocksdb/rocksdb/env/env_encryption.cc +469 -277
  303. package/deps/rocksdb/rocksdb/env/env_encryption_ctr.h +9 -30
  304. package/deps/rocksdb/rocksdb/env/env_posix.cc +110 -119
  305. package/deps/rocksdb/rocksdb/env/env_test.cc +1128 -39
  306. package/deps/rocksdb/rocksdb/env/file_system.cc +147 -8
  307. package/deps/rocksdb/rocksdb/env/file_system_tracer.cc +207 -136
  308. package/deps/rocksdb/rocksdb/env/file_system_tracer.h +86 -54
  309. package/deps/rocksdb/rocksdb/env/fs_posix.cc +192 -64
  310. package/deps/rocksdb/rocksdb/env/fs_readonly.h +107 -0
  311. package/deps/rocksdb/rocksdb/env/fs_remap.cc +339 -0
  312. package/deps/rocksdb/rocksdb/env/fs_remap.h +139 -0
  313. package/deps/rocksdb/rocksdb/env/io_posix.cc +245 -41
  314. package/deps/rocksdb/rocksdb/env/io_posix.h +66 -1
  315. package/deps/rocksdb/rocksdb/env/mock_env.cc +147 -149
  316. package/deps/rocksdb/rocksdb/env/mock_env.h +113 -11
  317. package/deps/rocksdb/rocksdb/env/mock_env_test.cc +2 -4
  318. package/deps/rocksdb/rocksdb/env/unique_id_gen.cc +164 -0
  319. package/deps/rocksdb/rocksdb/env/unique_id_gen.h +71 -0
  320. package/deps/rocksdb/rocksdb/file/delete_scheduler.cc +9 -5
  321. package/deps/rocksdb/rocksdb/file/delete_scheduler.h +6 -4
  322. package/deps/rocksdb/rocksdb/file/delete_scheduler_test.cc +19 -12
  323. package/deps/rocksdb/rocksdb/file/file_prefetch_buffer.cc +459 -70
  324. package/deps/rocksdb/rocksdb/file/file_prefetch_buffer.h +205 -28
  325. package/deps/rocksdb/rocksdb/file/file_util.cc +39 -28
  326. package/deps/rocksdb/rocksdb/file/file_util.h +18 -27
  327. package/deps/rocksdb/rocksdb/file/filename.cc +59 -22
  328. package/deps/rocksdb/rocksdb/file/filename.h +13 -8
  329. package/deps/rocksdb/rocksdb/file/line_file_reader.cc +68 -0
  330. package/deps/rocksdb/rocksdb/file/line_file_reader.h +59 -0
  331. package/deps/rocksdb/rocksdb/file/prefetch_test.cc +1130 -6
  332. package/deps/rocksdb/rocksdb/file/random_access_file_reader.cc +220 -36
  333. package/deps/rocksdb/rocksdb/file/random_access_file_reader.h +69 -17
  334. package/deps/rocksdb/rocksdb/file/random_access_file_reader_test.cc +13 -12
  335. package/deps/rocksdb/rocksdb/file/read_write_util.cc +3 -38
  336. package/deps/rocksdb/rocksdb/file/read_write_util.h +0 -4
  337. package/deps/rocksdb/rocksdb/file/readahead_file_info.h +33 -0
  338. package/deps/rocksdb/rocksdb/file/sequence_file_reader.cc +57 -9
  339. package/deps/rocksdb/rocksdb/file/sequence_file_reader.h +58 -6
  340. package/deps/rocksdb/rocksdb/file/sst_file_manager_impl.cc +29 -54
  341. package/deps/rocksdb/rocksdb/file/sst_file_manager_impl.h +22 -29
  342. package/deps/rocksdb/rocksdb/file/writable_file_writer.cc +424 -50
  343. package/deps/rocksdb/rocksdb/file/writable_file_writer.h +66 -19
  344. package/deps/rocksdb/rocksdb/include/rocksdb/advanced_options.h +157 -66
  345. package/deps/rocksdb/rocksdb/include/rocksdb/c.h +224 -121
  346. package/deps/rocksdb/rocksdb/include/rocksdb/cache.h +333 -30
  347. package/deps/rocksdb/rocksdb/include/rocksdb/cache_bench_tool.h +14 -0
  348. package/deps/rocksdb/rocksdb/include/rocksdb/cleanable.h +1 -1
  349. package/deps/rocksdb/rocksdb/include/rocksdb/compaction_filter.h +90 -50
  350. package/deps/rocksdb/rocksdb/include/rocksdb/compaction_job_stats.h +13 -5
  351. package/deps/rocksdb/rocksdb/include/rocksdb/comparator.h +20 -4
  352. package/deps/rocksdb/rocksdb/include/rocksdb/concurrent_task_limiter.h +8 -3
  353. package/deps/rocksdb/rocksdb/include/rocksdb/configurable.h +53 -12
  354. package/deps/rocksdb/rocksdb/include/rocksdb/convenience.h +31 -6
  355. package/deps/rocksdb/rocksdb/include/rocksdb/customizable.h +102 -7
  356. package/deps/rocksdb/rocksdb/include/rocksdb/data_structure.h +51 -0
  357. package/deps/rocksdb/rocksdb/include/rocksdb/db.h +370 -262
  358. package/deps/rocksdb/rocksdb/include/rocksdb/env.h +286 -87
  359. package/deps/rocksdb/rocksdb/include/rocksdb/env_encryption.h +124 -64
  360. package/deps/rocksdb/rocksdb/include/rocksdb/experimental.h +27 -0
  361. package/deps/rocksdb/rocksdb/include/rocksdb/file_checksum.h +21 -4
  362. package/deps/rocksdb/rocksdb/include/rocksdb/file_system.h +384 -41
  363. package/deps/rocksdb/rocksdb/include/rocksdb/filter_policy.h +111 -143
  364. package/deps/rocksdb/rocksdb/include/rocksdb/flush_block_policy.h +20 -6
  365. package/deps/rocksdb/rocksdb/include/rocksdb/functor_wrapper.h +56 -0
  366. package/deps/rocksdb/rocksdb/include/rocksdb/io_status.h +15 -33
  367. package/deps/rocksdb/rocksdb/include/rocksdb/iostats_context.h +37 -1
  368. package/deps/rocksdb/rocksdb/include/rocksdb/iterator.h +1 -3
  369. package/deps/rocksdb/rocksdb/include/rocksdb/listener.h +314 -26
  370. package/deps/rocksdb/rocksdb/include/rocksdb/memory_allocator.h +11 -7
  371. package/deps/rocksdb/rocksdb/include/rocksdb/memtablerep.h +50 -15
  372. package/deps/rocksdb/rocksdb/include/rocksdb/merge_operator.h +10 -3
  373. package/deps/rocksdb/rocksdb/include/rocksdb/metadata.h +186 -96
  374. package/deps/rocksdb/rocksdb/include/rocksdb/options.h +373 -103
  375. package/deps/rocksdb/rocksdb/include/rocksdb/perf_context.h +13 -3
  376. package/deps/rocksdb/rocksdb/include/rocksdb/persistent_cache.h +2 -2
  377. package/deps/rocksdb/rocksdb/include/rocksdb/rate_limiter.h +37 -7
  378. package/deps/rocksdb/rocksdb/include/rocksdb/rocksdb_namespace.h +6 -0
  379. package/deps/rocksdb/rocksdb/include/rocksdb/secondary_cache.h +87 -0
  380. package/deps/rocksdb/rocksdb/include/rocksdb/slice.h +5 -12
  381. package/deps/rocksdb/rocksdb/include/rocksdb/slice_transform.h +59 -30
  382. package/deps/rocksdb/rocksdb/include/rocksdb/sst_file_manager.h +11 -11
  383. package/deps/rocksdb/rocksdb/include/rocksdb/sst_file_writer.h +22 -0
  384. package/deps/rocksdb/rocksdb/include/rocksdb/sst_partitioner.h +17 -10
  385. package/deps/rocksdb/rocksdb/include/rocksdb/statistics.h +121 -41
  386. package/deps/rocksdb/rocksdb/include/rocksdb/stats_history.h +1 -0
  387. package/deps/rocksdb/rocksdb/include/rocksdb/status.h +114 -136
  388. package/deps/rocksdb/rocksdb/include/rocksdb/system_clock.h +116 -0
  389. package/deps/rocksdb/rocksdb/include/rocksdb/table.h +160 -18
  390. package/deps/rocksdb/rocksdb/include/rocksdb/table_properties.h +57 -15
  391. package/deps/rocksdb/rocksdb/include/rocksdb/thread_status.h +3 -1
  392. package/deps/rocksdb/rocksdb/include/rocksdb/trace_reader_writer.h +10 -6
  393. package/deps/rocksdb/rocksdb/include/rocksdb/trace_record.h +247 -0
  394. package/deps/rocksdb/rocksdb/include/rocksdb/trace_record_result.h +187 -0
  395. package/deps/rocksdb/rocksdb/include/rocksdb/transaction_log.h +1 -1
  396. package/deps/rocksdb/rocksdb/include/rocksdb/types.h +14 -24
  397. package/deps/rocksdb/rocksdb/include/rocksdb/unique_id.h +46 -0
  398. package/deps/rocksdb/rocksdb/include/rocksdb/universal_compaction.h +14 -4
  399. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/agg_merge.h +138 -0
  400. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/backup_engine.h +631 -0
  401. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/cache_dump_load.h +142 -0
  402. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/checkpoint.h +12 -9
  403. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/customizable_util.h +368 -0
  404. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/ldb_cmd.h +24 -0
  405. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/ldb_cmd_execute_result.h +4 -0
  406. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/object_registry.h +418 -63
  407. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/options_type.h +143 -73
  408. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/options_util.h +2 -2
  409. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/replayer.h +87 -0
  410. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/sim_cache.h +2 -2
  411. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/stackable_db.h +43 -5
  412. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/table_properties_collectors.h +18 -23
  413. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/transaction.h +26 -0
  414. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/transaction_db.h +32 -6
  415. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/transaction_db_mutex.h +1 -2
  416. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/write_batch_with_index.h +20 -1
  417. package/deps/rocksdb/rocksdb/include/rocksdb/version.h +30 -3
  418. package/deps/rocksdb/rocksdb/include/rocksdb/wal_filter.h +11 -2
  419. package/deps/rocksdb/rocksdb/include/rocksdb/write_batch.h +89 -11
  420. package/deps/rocksdb/rocksdb/include/rocksdb/write_batch_base.h +11 -0
  421. package/deps/rocksdb/rocksdb/include/rocksdb/write_buffer_manager.h +108 -38
  422. package/deps/rocksdb/rocksdb/logging/auto_roll_logger.cc +40 -23
  423. package/deps/rocksdb/rocksdb/logging/auto_roll_logger.h +12 -5
  424. package/deps/rocksdb/rocksdb/logging/auto_roll_logger_test.cc +100 -49
  425. package/deps/rocksdb/rocksdb/logging/env_logger.h +7 -5
  426. package/deps/rocksdb/rocksdb/logging/env_logger_test.cc +0 -1
  427. package/deps/rocksdb/rocksdb/logging/posix_logger.h +3 -9
  428. package/deps/rocksdb/rocksdb/memory/arena.cc +3 -1
  429. package/deps/rocksdb/rocksdb/memory/arena.h +1 -1
  430. package/deps/rocksdb/rocksdb/memory/jemalloc_nodump_allocator.cc +171 -106
  431. package/deps/rocksdb/rocksdb/memory/jemalloc_nodump_allocator.h +31 -15
  432. package/deps/rocksdb/rocksdb/memory/memkind_kmem_allocator.cc +15 -4
  433. package/deps/rocksdb/rocksdb/memory/memkind_kmem_allocator.h +24 -8
  434. package/deps/rocksdb/rocksdb/memory/memory_allocator.cc +91 -0
  435. package/deps/rocksdb/rocksdb/memory/memory_allocator_test.cc +239 -0
  436. package/deps/rocksdb/rocksdb/memory/memory_usage.h +14 -1
  437. package/deps/rocksdb/rocksdb/memtable/hash_linklist_rep.cc +72 -9
  438. package/deps/rocksdb/rocksdb/memtable/hash_skiplist_rep.cc +52 -6
  439. package/deps/rocksdb/rocksdb/memtable/inlineskiplist.h +53 -0
  440. package/deps/rocksdb/rocksdb/memtable/inlineskiplist_test.cc +5 -5
  441. package/deps/rocksdb/rocksdb/memtable/memtablerep_bench.cc +17 -5
  442. package/deps/rocksdb/rocksdb/memtable/skiplist_test.cc +1 -1
  443. package/deps/rocksdb/rocksdb/memtable/skiplistrep.cc +87 -0
  444. package/deps/rocksdb/rocksdb/memtable/vectorrep.cc +20 -10
  445. package/deps/rocksdb/rocksdb/memtable/write_buffer_manager.cc +148 -94
  446. package/deps/rocksdb/rocksdb/memtable/write_buffer_manager_test.cc +160 -62
  447. package/deps/rocksdb/rocksdb/microbench/CMakeLists.txt +17 -0
  448. package/deps/rocksdb/rocksdb/microbench/db_basic_bench.cc +1360 -0
  449. package/deps/rocksdb/rocksdb/microbench/ribbon_bench.cc +153 -0
  450. package/deps/rocksdb/rocksdb/monitoring/histogram.cc +8 -15
  451. package/deps/rocksdb/rocksdb/monitoring/histogram.h +0 -1
  452. package/deps/rocksdb/rocksdb/monitoring/histogram_test.cc +18 -16
  453. package/deps/rocksdb/rocksdb/monitoring/histogram_windowing.cc +9 -7
  454. package/deps/rocksdb/rocksdb/monitoring/histogram_windowing.h +5 -3
  455. package/deps/rocksdb/rocksdb/monitoring/instrumented_mutex.cc +7 -5
  456. package/deps/rocksdb/rocksdb/monitoring/instrumented_mutex.h +37 -12
  457. package/deps/rocksdb/rocksdb/monitoring/iostats_context.cc +26 -6
  458. package/deps/rocksdb/rocksdb/monitoring/iostats_context_imp.h +6 -10
  459. package/deps/rocksdb/rocksdb/monitoring/perf_context.cc +14 -13
  460. package/deps/rocksdb/rocksdb/monitoring/perf_context_imp.h +19 -20
  461. package/deps/rocksdb/rocksdb/monitoring/perf_step_timer.h +18 -18
  462. package/deps/rocksdb/rocksdb/monitoring/statistics.cc +84 -2
  463. package/deps/rocksdb/rocksdb/monitoring/statistics.h +6 -0
  464. package/deps/rocksdb/rocksdb/monitoring/statistics_test.cc +47 -2
  465. package/deps/rocksdb/rocksdb/monitoring/stats_history_test.cc +67 -54
  466. package/deps/rocksdb/rocksdb/monitoring/thread_status_updater.cc +4 -1
  467. package/deps/rocksdb/rocksdb/monitoring/thread_status_util.cc +2 -1
  468. package/deps/rocksdb/rocksdb/monitoring/thread_status_util_debug.cc +2 -2
  469. package/deps/rocksdb/rocksdb/options/cf_options.cc +280 -212
  470. package/deps/rocksdb/rocksdb/options/cf_options.h +51 -57
  471. package/deps/rocksdb/rocksdb/options/configurable.cc +242 -138
  472. package/deps/rocksdb/rocksdb/options/configurable_helper.h +4 -68
  473. package/deps/rocksdb/rocksdb/options/configurable_test.cc +144 -21
  474. package/deps/rocksdb/rocksdb/options/configurable_test.h +2 -3
  475. package/deps/rocksdb/rocksdb/options/customizable.cc +67 -7
  476. package/deps/rocksdb/rocksdb/options/customizable_test.cc +1773 -151
  477. package/deps/rocksdb/rocksdb/options/db_options.cc +275 -47
  478. package/deps/rocksdb/rocksdb/options/db_options.h +36 -7
  479. package/deps/rocksdb/rocksdb/options/options.cc +49 -17
  480. package/deps/rocksdb/rocksdb/options/options_helper.cc +369 -352
  481. package/deps/rocksdb/rocksdb/options/options_helper.h +23 -23
  482. package/deps/rocksdb/rocksdb/options/options_parser.cc +18 -13
  483. package/deps/rocksdb/rocksdb/options/options_settable_test.cc +67 -54
  484. package/deps/rocksdb/rocksdb/options/options_test.cc +1162 -187
  485. package/deps/rocksdb/rocksdb/port/jemalloc_helper.h +1 -1
  486. package/deps/rocksdb/rocksdb/port/lang.h +52 -0
  487. package/deps/rocksdb/rocksdb/port/port_example.h +1 -1
  488. package/deps/rocksdb/rocksdb/port/port_posix.cc +31 -2
  489. package/deps/rocksdb/rocksdb/port/port_posix.h +20 -2
  490. package/deps/rocksdb/rocksdb/port/stack_trace.cc +20 -4
  491. package/deps/rocksdb/rocksdb/port/sys_time.h +2 -2
  492. package/deps/rocksdb/rocksdb/port/win/env_default.cc +7 -7
  493. package/deps/rocksdb/rocksdb/port/win/env_win.cc +44 -74
  494. package/deps/rocksdb/rocksdb/port/win/env_win.h +25 -23
  495. package/deps/rocksdb/rocksdb/port/win/io_win.cc +32 -34
  496. package/deps/rocksdb/rocksdb/port/win/io_win.h +12 -6
  497. package/deps/rocksdb/rocksdb/port/win/port_win.cc +55 -35
  498. package/deps/rocksdb/rocksdb/port/win/port_win.h +22 -5
  499. package/deps/rocksdb/rocksdb/port/win/win_logger.cc +3 -3
  500. package/deps/rocksdb/rocksdb/port/win/win_logger.h +3 -5
  501. package/deps/rocksdb/rocksdb/port/win/win_thread.cc +7 -1
  502. package/deps/rocksdb/rocksdb/port/win/win_thread.h +12 -17
  503. package/deps/rocksdb/rocksdb/python.mk +9 -0
  504. package/deps/rocksdb/rocksdb/src.mk +82 -34
  505. package/deps/rocksdb/rocksdb/table/adaptive/adaptive_table_factory.cc +3 -4
  506. package/deps/rocksdb/rocksdb/table/adaptive/adaptive_table_factory.h +1 -1
  507. package/deps/rocksdb/rocksdb/table/block_based/block.cc +158 -80
  508. package/deps/rocksdb/rocksdb/table/block_based/block.h +64 -36
  509. package/deps/rocksdb/rocksdb/table/block_based/block_based_filter_block.cc +23 -14
  510. package/deps/rocksdb/rocksdb/table/block_based/block_based_filter_block.h +13 -5
  511. package/deps/rocksdb/rocksdb/table/block_based/block_based_filter_block_test.cc +3 -218
  512. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_builder.cc +603 -328
  513. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_builder.h +28 -22
  514. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_factory.cc +220 -82
  515. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_factory.h +8 -2
  516. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_iterator.cc +3 -4
  517. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_iterator.h +28 -4
  518. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_reader.cc +598 -492
  519. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_reader.h +151 -96
  520. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_reader_impl.h +31 -58
  521. package/deps/rocksdb/rocksdb/table/block_based/block_based_table_reader_test.cc +330 -92
  522. package/deps/rocksdb/rocksdb/table/block_based/block_builder.cc +50 -19
  523. package/deps/rocksdb/rocksdb/table/block_based/block_builder.h +23 -0
  524. package/deps/rocksdb/rocksdb/table/block_based/block_like_traits.h +226 -0
  525. package/deps/rocksdb/rocksdb/table/block_based/block_prefetcher.cc +56 -22
  526. package/deps/rocksdb/rocksdb/table/block_based/block_prefetcher.h +42 -4
  527. package/deps/rocksdb/rocksdb/table/block_based/block_test.cc +5 -2
  528. package/deps/rocksdb/rocksdb/table/block_based/block_type.h +2 -0
  529. package/deps/rocksdb/rocksdb/table/block_based/cachable_entry.h +34 -20
  530. package/deps/rocksdb/rocksdb/table/block_based/data_block_hash_index_test.cc +9 -10
  531. package/deps/rocksdb/rocksdb/table/block_based/filter_block.h +26 -3
  532. package/deps/rocksdb/rocksdb/table/block_based/filter_block_reader_common.cc +2 -1
  533. package/deps/rocksdb/rocksdb/table/block_based/filter_policy.cc +844 -202
  534. package/deps/rocksdb/rocksdb/table/block_based/filter_policy_internal.h +281 -81
  535. package/deps/rocksdb/rocksdb/table/block_based/flush_block_policy.cc +62 -2
  536. package/deps/rocksdb/rocksdb/table/block_based/flush_block_policy.h +2 -3
  537. package/deps/rocksdb/rocksdb/table/block_based/full_filter_block.cc +28 -7
  538. package/deps/rocksdb/rocksdb/table/block_based/full_filter_block.h +22 -6
  539. package/deps/rocksdb/rocksdb/table/block_based/full_filter_block_test.cc +28 -26
  540. package/deps/rocksdb/rocksdb/table/block_based/hash_index_reader.cc +1 -1
  541. package/deps/rocksdb/rocksdb/table/block_based/index_builder.cc +1 -2
  542. package/deps/rocksdb/rocksdb/table/block_based/index_reader_common.cc +2 -1
  543. package/deps/rocksdb/rocksdb/table/block_based/mock_block_based_table.h +11 -4
  544. package/deps/rocksdb/rocksdb/table/block_based/parsed_full_filter_block.cc +2 -1
  545. package/deps/rocksdb/rocksdb/table/block_based/parsed_full_filter_block.h +2 -0
  546. package/deps/rocksdb/rocksdb/table/block_based/partitioned_filter_block.cc +68 -26
  547. package/deps/rocksdb/rocksdb/table/block_based/partitioned_filter_block.h +44 -9
  548. package/deps/rocksdb/rocksdb/table/block_based/partitioned_filter_block_test.cc +12 -10
  549. package/deps/rocksdb/rocksdb/table/block_based/partitioned_index_iterator.cc +3 -4
  550. package/deps/rocksdb/rocksdb/table/block_based/partitioned_index_iterator.h +23 -4
  551. package/deps/rocksdb/rocksdb/table/block_based/partitioned_index_reader.cc +44 -19
  552. package/deps/rocksdb/rocksdb/table/block_based/partitioned_index_reader.h +5 -1
  553. package/deps/rocksdb/rocksdb/table/block_based/reader_common.cc +16 -28
  554. package/deps/rocksdb/rocksdb/table/block_based/uncompression_dict_reader.cc +7 -4
  555. package/deps/rocksdb/rocksdb/table/block_based/uncompression_dict_reader.h +2 -2
  556. package/deps/rocksdb/rocksdb/table/block_fetcher.cc +77 -57
  557. package/deps/rocksdb/rocksdb/table/block_fetcher.h +23 -12
  558. package/deps/rocksdb/rocksdb/table/block_fetcher_test.cc +43 -56
  559. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_builder.cc +8 -8
  560. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_builder.h +2 -1
  561. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_builder_test.cc +52 -70
  562. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_factory.cc +5 -8
  563. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_factory.h +1 -1
  564. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_reader.cc +17 -11
  565. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_reader.h +2 -3
  566. package/deps/rocksdb/rocksdb/table/cuckoo/cuckoo_table_reader_test.cc +42 -51
  567. package/deps/rocksdb/rocksdb/table/format.cc +258 -104
  568. package/deps/rocksdb/rocksdb/table/format.h +120 -109
  569. package/deps/rocksdb/rocksdb/table/get_context.cc +97 -65
  570. package/deps/rocksdb/rocksdb/table/get_context.h +19 -12
  571. package/deps/rocksdb/rocksdb/table/internal_iterator.h +14 -0
  572. package/deps/rocksdb/rocksdb/table/iterator_wrapper.h +8 -0
  573. package/deps/rocksdb/rocksdb/table/merger_test.cc +3 -2
  574. package/deps/rocksdb/rocksdb/table/merging_iterator.cc +11 -21
  575. package/deps/rocksdb/rocksdb/table/merging_iterator.h +3 -3
  576. package/deps/rocksdb/rocksdb/table/meta_blocks.cc +176 -171
  577. package/deps/rocksdb/rocksdb/table/meta_blocks.h +47 -33
  578. package/deps/rocksdb/rocksdb/table/mock_table.cc +7 -9
  579. package/deps/rocksdb/rocksdb/table/mock_table.h +3 -2
  580. package/deps/rocksdb/rocksdb/table/multiget_context.h +15 -8
  581. package/deps/rocksdb/rocksdb/table/persistent_cache_helper.cc +22 -29
  582. package/deps/rocksdb/rocksdb/table/persistent_cache_options.h +6 -3
  583. package/deps/rocksdb/rocksdb/table/plain/plain_table_bloom.h +5 -8
  584. package/deps/rocksdb/rocksdb/table/plain/plain_table_builder.cc +29 -26
  585. package/deps/rocksdb/rocksdb/table/plain/plain_table_builder.h +12 -16
  586. package/deps/rocksdb/rocksdb/table/plain/plain_table_factory.cc +145 -69
  587. package/deps/rocksdb/rocksdb/table/plain/plain_table_factory.h +1 -1
  588. package/deps/rocksdb/rocksdb/table/plain/plain_table_index.cc +7 -6
  589. package/deps/rocksdb/rocksdb/table/plain/plain_table_index.h +3 -4
  590. package/deps/rocksdb/rocksdb/table/plain/plain_table_key_coding.cc +3 -1
  591. package/deps/rocksdb/rocksdb/table/plain/plain_table_key_coding.h +1 -1
  592. package/deps/rocksdb/rocksdb/table/plain/plain_table_reader.cc +13 -18
  593. package/deps/rocksdb/rocksdb/table/plain/plain_table_reader.h +4 -9
  594. package/deps/rocksdb/rocksdb/table/sst_file_dumper.cc +55 -37
  595. package/deps/rocksdb/rocksdb/table/sst_file_dumper.h +10 -5
  596. package/deps/rocksdb/rocksdb/table/sst_file_reader.cc +11 -8
  597. package/deps/rocksdb/rocksdb/table/sst_file_reader_test.cc +222 -16
  598. package/deps/rocksdb/rocksdb/table/sst_file_writer.cc +106 -58
  599. package/deps/rocksdb/rocksdb/table/sst_file_writer_collectors.h +6 -5
  600. package/deps/rocksdb/rocksdb/table/table_builder.h +68 -44
  601. package/deps/rocksdb/rocksdb/table/table_factory.cc +37 -10
  602. package/deps/rocksdb/rocksdb/table/table_properties.cc +109 -54
  603. package/deps/rocksdb/rocksdb/table/table_properties_internal.h +4 -20
  604. package/deps/rocksdb/rocksdb/table/table_reader_bench.cc +33 -32
  605. package/deps/rocksdb/rocksdb/table/table_reader_caller.h +2 -0
  606. package/deps/rocksdb/rocksdb/table/table_test.cc +989 -326
  607. package/deps/rocksdb/rocksdb/table/two_level_iterator.cc +4 -0
  608. package/deps/rocksdb/rocksdb/table/unique_id.cc +166 -0
  609. package/deps/rocksdb/rocksdb/table/unique_id_impl.h +59 -0
  610. package/deps/rocksdb/rocksdb/test_util/mock_time_env.cc +1 -1
  611. package/deps/rocksdb/rocksdb/test_util/mock_time_env.h +13 -10
  612. package/deps/rocksdb/rocksdb/test_util/sync_point.cc +1 -2
  613. package/deps/rocksdb/rocksdb/test_util/sync_point.h +35 -16
  614. package/deps/rocksdb/rocksdb/test_util/sync_point_impl.cc +32 -10
  615. package/deps/rocksdb/rocksdb/test_util/sync_point_impl.h +31 -4
  616. package/deps/rocksdb/rocksdb/test_util/testharness.cc +53 -1
  617. package/deps/rocksdb/rocksdb/test_util/testharness.h +67 -3
  618. package/deps/rocksdb/rocksdb/test_util/testutil.cc +236 -66
  619. package/deps/rocksdb/rocksdb/test_util/testutil.h +63 -100
  620. package/deps/rocksdb/rocksdb/test_util/transaction_test_util.cc +12 -1
  621. package/deps/rocksdb/rocksdb/tools/blob_dump.cc +2 -2
  622. package/deps/rocksdb/rocksdb/tools/block_cache_analyzer/block_cache_trace_analyzer.cc +6 -3
  623. package/deps/rocksdb/rocksdb/tools/block_cache_analyzer/block_cache_trace_analyzer.h +1 -0
  624. package/deps/rocksdb/rocksdb/tools/block_cache_analyzer/block_cache_trace_analyzer_test.cc +9 -3
  625. package/deps/rocksdb/rocksdb/tools/db_bench.cc +1 -1
  626. package/deps/rocksdb/rocksdb/tools/db_bench_tool.cc +1420 -611
  627. package/deps/rocksdb/rocksdb/tools/db_bench_tool_test.cc +11 -8
  628. package/deps/rocksdb/rocksdb/tools/db_repl_stress.cc +11 -1
  629. package/deps/rocksdb/rocksdb/tools/io_tracer_parser_test.cc +4 -2
  630. package/deps/rocksdb/rocksdb/tools/io_tracer_parser_tool.cc +46 -22
  631. package/deps/rocksdb/rocksdb/tools/ldb_cmd.cc +655 -179
  632. package/deps/rocksdb/rocksdb/tools/ldb_cmd_impl.h +58 -6
  633. package/deps/rocksdb/rocksdb/tools/ldb_cmd_test.cc +472 -29
  634. package/deps/rocksdb/rocksdb/tools/ldb_tool.cc +23 -2
  635. package/deps/rocksdb/rocksdb/tools/reduce_levels_test.cc +2 -2
  636. package/deps/rocksdb/rocksdb/tools/simulated_hybrid_file_system.cc +246 -0
  637. package/deps/rocksdb/rocksdb/tools/simulated_hybrid_file_system.h +126 -0
  638. package/deps/rocksdb/rocksdb/tools/sst_dump_test.cc +83 -29
  639. package/deps/rocksdb/rocksdb/tools/sst_dump_tool.cc +38 -17
  640. package/deps/rocksdb/rocksdb/tools/trace_analyzer_test.cc +191 -55
  641. package/deps/rocksdb/rocksdb/tools/trace_analyzer_tool.cc +219 -296
  642. package/deps/rocksdb/rocksdb/tools/trace_analyzer_tool.h +87 -53
  643. package/deps/rocksdb/rocksdb/tools/write_stress.cc +8 -7
  644. package/deps/rocksdb/rocksdb/trace_replay/block_cache_tracer.cc +6 -5
  645. package/deps/rocksdb/rocksdb/trace_replay/block_cache_tracer.h +5 -4
  646. package/deps/rocksdb/rocksdb/trace_replay/block_cache_tracer_test.cc +14 -9
  647. package/deps/rocksdb/rocksdb/trace_replay/io_tracer.cc +134 -60
  648. package/deps/rocksdb/rocksdb/trace_replay/io_tracer.h +49 -38
  649. package/deps/rocksdb/rocksdb/trace_replay/io_tracer_test.cc +152 -15
  650. package/deps/rocksdb/rocksdb/trace_replay/trace_record.cc +206 -0
  651. package/deps/rocksdb/rocksdb/trace_replay/trace_record_handler.cc +190 -0
  652. package/deps/rocksdb/rocksdb/trace_replay/trace_record_handler.h +46 -0
  653. package/deps/rocksdb/rocksdb/trace_replay/trace_record_result.cc +146 -0
  654. package/deps/rocksdb/rocksdb/trace_replay/trace_replay.cc +475 -344
  655. package/deps/rocksdb/rocksdb/trace_replay/trace_replay.h +83 -95
  656. package/deps/rocksdb/rocksdb/util/autovector.h +38 -18
  657. package/deps/rocksdb/rocksdb/util/autovector_test.cc +1 -1
  658. package/deps/rocksdb/rocksdb/util/bloom_impl.h +4 -0
  659. package/deps/rocksdb/rocksdb/util/bloom_test.cc +276 -94
  660. package/deps/rocksdb/rocksdb/util/build_version.cc.in +81 -4
  661. package/deps/rocksdb/rocksdb/util/cast_util.h +22 -0
  662. package/deps/rocksdb/rocksdb/util/channel.h +2 -0
  663. package/deps/rocksdb/rocksdb/util/coding.h +1 -33
  664. package/deps/rocksdb/rocksdb/util/compaction_job_stats_impl.cc +8 -0
  665. package/deps/rocksdb/rocksdb/util/comparator.cc +163 -3
  666. package/deps/rocksdb/rocksdb/util/compression.cc +122 -0
  667. package/deps/rocksdb/rocksdb/util/compression.h +212 -7
  668. package/deps/rocksdb/rocksdb/util/compression_context_cache.cc +1 -3
  669. package/deps/rocksdb/rocksdb/util/crc32c.cc +165 -2
  670. package/deps/rocksdb/rocksdb/util/crc32c.h +6 -0
  671. package/deps/rocksdb/rocksdb/util/crc32c_arm64.cc +14 -0
  672. package/deps/rocksdb/rocksdb/util/crc32c_ppc.h +3 -0
  673. package/deps/rocksdb/rocksdb/util/crc32c_test.cc +47 -0
  674. package/deps/rocksdb/rocksdb/util/defer.h +30 -1
  675. package/deps/rocksdb/rocksdb/util/defer_test.cc +11 -0
  676. package/deps/rocksdb/rocksdb/util/duplicate_detector.h +3 -1
  677. package/deps/rocksdb/rocksdb/util/dynamic_bloom.h +3 -3
  678. package/deps/rocksdb/rocksdb/util/dynamic_bloom_test.cc +5 -4
  679. package/deps/rocksdb/rocksdb/util/fastrange.h +2 -0
  680. package/deps/rocksdb/rocksdb/util/file_checksum_helper.cc +36 -0
  681. package/deps/rocksdb/rocksdb/util/file_checksum_helper.h +3 -1
  682. package/deps/rocksdb/rocksdb/util/file_reader_writer_test.cc +512 -52
  683. package/deps/rocksdb/rocksdb/util/filter_bench.cc +65 -10
  684. package/deps/rocksdb/rocksdb/util/gflags_compat.h +6 -1
  685. package/deps/rocksdb/rocksdb/util/hash.cc +121 -3
  686. package/deps/rocksdb/rocksdb/util/hash.h +31 -1
  687. package/deps/rocksdb/rocksdb/util/hash128.h +26 -0
  688. package/deps/rocksdb/rocksdb/util/hash_containers.h +51 -0
  689. package/deps/rocksdb/rocksdb/util/hash_test.cc +194 -2
  690. package/deps/rocksdb/rocksdb/util/heap.h +6 -1
  691. package/deps/rocksdb/rocksdb/util/kv_map.h +1 -1
  692. package/deps/rocksdb/rocksdb/util/log_write_bench.cc +8 -6
  693. package/deps/rocksdb/rocksdb/util/math.h +74 -7
  694. package/deps/rocksdb/rocksdb/util/math128.h +13 -1
  695. package/deps/rocksdb/rocksdb/util/murmurhash.h +3 -3
  696. package/deps/rocksdb/rocksdb/util/random.cc +9 -0
  697. package/deps/rocksdb/rocksdb/util/random.h +6 -0
  698. package/deps/rocksdb/rocksdb/util/rate_limiter.cc +298 -144
  699. package/deps/rocksdb/rocksdb/util/rate_limiter.h +68 -19
  700. package/deps/rocksdb/rocksdb/util/rate_limiter_test.cc +335 -23
  701. package/deps/rocksdb/rocksdb/util/repeatable_thread.h +10 -12
  702. package/deps/rocksdb/rocksdb/util/repeatable_thread_test.cc +18 -15
  703. package/deps/rocksdb/rocksdb/util/ribbon_alg.h +98 -74
  704. package/deps/rocksdb/rocksdb/util/ribbon_config.cc +506 -0
  705. package/deps/rocksdb/rocksdb/util/ribbon_config.h +182 -0
  706. package/deps/rocksdb/rocksdb/util/ribbon_impl.h +154 -79
  707. package/deps/rocksdb/rocksdb/util/ribbon_test.cc +742 -365
  708. package/deps/rocksdb/rocksdb/util/set_comparator.h +2 -0
  709. package/deps/rocksdb/rocksdb/util/slice.cc +198 -35
  710. package/deps/rocksdb/rocksdb/util/slice_test.cc +30 -1
  711. package/deps/rocksdb/rocksdb/util/status.cc +32 -29
  712. package/deps/rocksdb/rocksdb/util/stop_watch.h +18 -18
  713. package/deps/rocksdb/rocksdb/util/string_util.cc +85 -6
  714. package/deps/rocksdb/rocksdb/util/string_util.h +47 -2
  715. package/deps/rocksdb/rocksdb/util/thread_guard.h +41 -0
  716. package/deps/rocksdb/rocksdb/util/thread_local.h +2 -2
  717. package/deps/rocksdb/rocksdb/util/thread_local_test.cc +22 -24
  718. package/deps/rocksdb/rocksdb/util/threadpool_imp.cc +7 -6
  719. package/deps/rocksdb/rocksdb/util/timer.h +55 -46
  720. package/deps/rocksdb/rocksdb/util/timer_test.cc +50 -48
  721. package/deps/rocksdb/rocksdb/util/user_comparator_wrapper.h +4 -0
  722. package/deps/rocksdb/rocksdb/util/vector_iterator.h +31 -15
  723. package/deps/rocksdb/rocksdb/util/work_queue.h +2 -0
  724. package/deps/rocksdb/rocksdb/util/xxhash.cc +35 -1144
  725. package/deps/rocksdb/rocksdb/util/xxhash.h +5117 -373
  726. package/deps/rocksdb/rocksdb/util/xxph3.h +1762 -0
  727. package/deps/rocksdb/rocksdb/utilities/agg_merge/agg_merge.cc +238 -0
  728. package/deps/rocksdb/rocksdb/utilities/agg_merge/agg_merge.h +49 -0
  729. package/deps/rocksdb/rocksdb/utilities/agg_merge/agg_merge_test.cc +134 -0
  730. package/deps/rocksdb/rocksdb/utilities/agg_merge/test_agg_merge.cc +104 -0
  731. package/deps/rocksdb/rocksdb/utilities/agg_merge/test_agg_merge.h +47 -0
  732. package/deps/rocksdb/rocksdb/utilities/backup/backup_engine.cc +3164 -0
  733. package/deps/rocksdb/rocksdb/utilities/backup/backup_engine_impl.h +29 -0
  734. package/deps/rocksdb/rocksdb/utilities/{backupable/backupable_db_test.cc → backup/backup_engine_test.cc} +1679 -485
  735. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_compaction_filter.cc +6 -4
  736. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_compaction_filter.h +14 -9
  737. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db.cc +2 -0
  738. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db.h +1 -0
  739. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_gc_stats.h +4 -0
  740. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_impl.cc +37 -27
  741. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_impl.h +8 -4
  742. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_impl_filesnapshot.cc +1 -1
  743. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_iterator.h +13 -10
  744. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_listener.h +5 -0
  745. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_db_test.cc +44 -25
  746. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_dump_tool.cc +3 -4
  747. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_file.cc +27 -19
  748. package/deps/rocksdb/rocksdb/utilities/blob_db/blob_file.h +4 -2
  749. package/deps/rocksdb/rocksdb/utilities/cache_dump_load.cc +69 -0
  750. package/deps/rocksdb/rocksdb/utilities/cache_dump_load_impl.cc +489 -0
  751. package/deps/rocksdb/rocksdb/utilities/cache_dump_load_impl.h +366 -0
  752. package/deps/rocksdb/rocksdb/utilities/cassandra/cassandra_compaction_filter.cc +67 -4
  753. package/deps/rocksdb/rocksdb/utilities/cassandra/cassandra_compaction_filter.h +21 -6
  754. package/deps/rocksdb/rocksdb/utilities/cassandra/cassandra_functional_test.cc +107 -7
  755. package/deps/rocksdb/rocksdb/utilities/cassandra/cassandra_options.h +43 -0
  756. package/deps/rocksdb/rocksdb/utilities/cassandra/format.h +1 -1
  757. package/deps/rocksdb/rocksdb/utilities/cassandra/merge_operator.cc +24 -8
  758. package/deps/rocksdb/rocksdb/utilities/cassandra/merge_operator.h +7 -7
  759. package/deps/rocksdb/rocksdb/utilities/cassandra/serialize.h +5 -0
  760. package/deps/rocksdb/rocksdb/utilities/checkpoint/checkpoint_impl.cc +99 -218
  761. package/deps/rocksdb/rocksdb/utilities/checkpoint/checkpoint_impl.h +8 -24
  762. package/deps/rocksdb/rocksdb/utilities/checkpoint/checkpoint_test.cc +114 -1
  763. package/deps/rocksdb/rocksdb/utilities/compaction_filters/layered_compaction_filter_base.h +6 -2
  764. package/deps/rocksdb/rocksdb/utilities/compaction_filters/remove_emptyvalue_compactionfilter.cc +0 -4
  765. package/deps/rocksdb/rocksdb/utilities/compaction_filters/remove_emptyvalue_compactionfilter.h +7 -6
  766. package/deps/rocksdb/rocksdb/utilities/compaction_filters.cc +56 -0
  767. package/deps/rocksdb/rocksdb/utilities/convenience/info_log_finder.cc +2 -2
  768. package/deps/rocksdb/rocksdb/utilities/counted_fs.cc +355 -0
  769. package/deps/rocksdb/rocksdb/utilities/counted_fs.h +152 -0
  770. package/deps/rocksdb/rocksdb/utilities/env_mirror.cc +13 -0
  771. package/deps/rocksdb/rocksdb/utilities/env_timed.cc +164 -122
  772. package/deps/rocksdb/rocksdb/utilities/env_timed.h +97 -0
  773. package/deps/rocksdb/rocksdb/utilities/fault_injection_env.cc +75 -17
  774. package/deps/rocksdb/rocksdb/utilities/fault_injection_env.h +19 -3
  775. package/deps/rocksdb/rocksdb/utilities/fault_injection_fs.cc +539 -126
  776. package/deps/rocksdb/rocksdb/utilities/fault_injection_fs.h +162 -17
  777. package/deps/rocksdb/rocksdb/utilities/fault_injection_secondary_cache.cc +110 -0
  778. package/deps/rocksdb/rocksdb/utilities/fault_injection_secondary_cache.h +94 -0
  779. package/deps/rocksdb/rocksdb/utilities/memory/memory_test.cc +5 -2
  780. package/deps/rocksdb/rocksdb/utilities/memory_allocators.h +104 -0
  781. package/deps/rocksdb/rocksdb/utilities/merge_operators/bytesxor.h +5 -3
  782. package/deps/rocksdb/rocksdb/utilities/merge_operators/max.cc +4 -1
  783. package/deps/rocksdb/rocksdb/utilities/merge_operators/put.cc +11 -3
  784. package/deps/rocksdb/rocksdb/utilities/merge_operators/sortlist.cc +0 -2
  785. package/deps/rocksdb/rocksdb/utilities/merge_operators/sortlist.h +5 -1
  786. package/deps/rocksdb/rocksdb/utilities/merge_operators/string_append/stringappend.cc +29 -10
  787. package/deps/rocksdb/rocksdb/utilities/merge_operators/string_append/stringappend.h +6 -3
  788. package/deps/rocksdb/rocksdb/utilities/merge_operators/string_append/stringappend2.cc +29 -14
  789. package/deps/rocksdb/rocksdb/utilities/merge_operators/string_append/stringappend2.h +6 -3
  790. package/deps/rocksdb/rocksdb/utilities/merge_operators/string_append/stringappend_test.cc +71 -18
  791. package/deps/rocksdb/rocksdb/utilities/merge_operators/uint64add.cc +15 -9
  792. package/deps/rocksdb/rocksdb/utilities/merge_operators.cc +120 -0
  793. package/deps/rocksdb/rocksdb/utilities/merge_operators.h +3 -23
  794. package/deps/rocksdb/rocksdb/utilities/object_registry.cc +267 -42
  795. package/deps/rocksdb/rocksdb/utilities/object_registry_test.cc +702 -76
  796. package/deps/rocksdb/rocksdb/utilities/option_change_migration/option_change_migration.cc +1 -1
  797. package/deps/rocksdb/rocksdb/utilities/option_change_migration/option_change_migration_test.cc +26 -5
  798. package/deps/rocksdb/rocksdb/utilities/options/options_util.cc +1 -1
  799. package/deps/rocksdb/rocksdb/utilities/options/options_util_test.cc +124 -1
  800. package/deps/rocksdb/rocksdb/utilities/persistent_cache/block_cache_tier.cc +2 -3
  801. package/deps/rocksdb/rocksdb/utilities/persistent_cache/block_cache_tier.h +8 -9
  802. package/deps/rocksdb/rocksdb/utilities/persistent_cache/block_cache_tier_file.cc +15 -13
  803. package/deps/rocksdb/rocksdb/utilities/persistent_cache/block_cache_tier_file.h +1 -1
  804. package/deps/rocksdb/rocksdb/utilities/persistent_cache/block_cache_tier_metadata.h +4 -4
  805. package/deps/rocksdb/rocksdb/utilities/persistent_cache/hash_table_evictable.h +2 -2
  806. package/deps/rocksdb/rocksdb/utilities/persistent_cache/persistent_cache_bench.cc +8 -9
  807. package/deps/rocksdb/rocksdb/utilities/persistent_cache/persistent_cache_test.cc +1 -1
  808. package/deps/rocksdb/rocksdb/utilities/persistent_cache/persistent_cache_tier.h +6 -3
  809. package/deps/rocksdb/rocksdb/utilities/persistent_cache/volatile_tier_impl.h +2 -2
  810. package/deps/rocksdb/rocksdb/utilities/simulator_cache/cache_simulator.cc +3 -0
  811. package/deps/rocksdb/rocksdb/utilities/simulator_cache/cache_simulator_test.cc +2 -0
  812. package/deps/rocksdb/rocksdb/utilities/simulator_cache/sim_cache.cc +43 -35
  813. package/deps/rocksdb/rocksdb/utilities/simulator_cache/sim_cache_test.cc +20 -18
  814. package/deps/rocksdb/rocksdb/utilities/table_properties_collectors/compact_on_deletion_collector.cc +107 -2
  815. package/deps/rocksdb/rocksdb/utilities/trace/file_trace_reader_writer.cc +23 -15
  816. package/deps/rocksdb/rocksdb/utilities/trace/file_trace_reader_writer.h +2 -2
  817. package/deps/rocksdb/rocksdb/utilities/trace/replayer_impl.cc +316 -0
  818. package/deps/rocksdb/rocksdb/utilities/trace/replayer_impl.h +86 -0
  819. package/deps/rocksdb/rocksdb/utilities/transactions/lock/point/point_lock_manager.cc +4 -5
  820. package/deps/rocksdb/rocksdb/utilities/transactions/lock/point/point_lock_manager.h +4 -3
  821. package/deps/rocksdb/rocksdb/utilities/transactions/lock/point/point_lock_manager_test.h +1 -1
  822. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_locking_test.cc +119 -3
  823. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/lib/locktree/locktree.cc +20 -3
  824. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/lib/locktree/locktree.h +20 -0
  825. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/lib/portability/toku_external_pthread.h +3 -2
  826. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/lib/portability/toku_time.h +4 -0
  827. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/range_tree_lock_manager.cc +38 -14
  828. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/range_tree_lock_manager.h +17 -10
  829. package/deps/rocksdb/rocksdb/utilities/transactions/optimistic_transaction_db_impl.h +1 -0
  830. package/deps/rocksdb/rocksdb/utilities/transactions/optimistic_transaction_test.cc +1 -2
  831. package/deps/rocksdb/rocksdb/utilities/transactions/pessimistic_transaction.cc +423 -34
  832. package/deps/rocksdb/rocksdb/utilities/transactions/pessimistic_transaction.h +82 -2
  833. package/deps/rocksdb/rocksdb/utilities/transactions/pessimistic_transaction_db.cc +72 -40
  834. package/deps/rocksdb/rocksdb/utilities/transactions/pessimistic_transaction_db.h +32 -1
  835. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_base.cc +13 -5
  836. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_base.h +7 -3
  837. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_test.cc +207 -43
  838. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_test.h +50 -7
  839. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_util.cc +28 -10
  840. package/deps/rocksdb/rocksdb/utilities/transactions/transaction_util.h +11 -6
  841. package/deps/rocksdb/rocksdb/utilities/transactions/write_committed_transaction_ts_test.cc +516 -0
  842. package/deps/rocksdb/rocksdb/utilities/transactions/write_prepared_transaction_test.cc +506 -15
  843. package/deps/rocksdb/rocksdb/utilities/transactions/write_prepared_txn.cc +27 -13
  844. package/deps/rocksdb/rocksdb/utilities/transactions/write_prepared_txn_db.cc +14 -14
  845. package/deps/rocksdb/rocksdb/utilities/transactions/write_prepared_txn_db.h +3 -0
  846. package/deps/rocksdb/rocksdb/utilities/transactions/write_unprepared_transaction_test.cc +2 -2
  847. package/deps/rocksdb/rocksdb/utilities/transactions/write_unprepared_txn.cc +14 -5
  848. package/deps/rocksdb/rocksdb/utilities/ttl/db_ttl_impl.cc +305 -27
  849. package/deps/rocksdb/rocksdb/utilities/ttl/db_ttl_impl.h +55 -159
  850. package/deps/rocksdb/rocksdb/utilities/ttl/ttl_test.cc +209 -2
  851. package/deps/rocksdb/rocksdb/utilities/wal_filter.cc +23 -0
  852. package/deps/rocksdb/rocksdb/utilities/write_batch_with_index/write_batch_with_index.cc +157 -88
  853. package/deps/rocksdb/rocksdb/utilities/write_batch_with_index/write_batch_with_index_internal.cc +501 -114
  854. package/deps/rocksdb/rocksdb/utilities/write_batch_with_index/write_batch_with_index_internal.h +91 -316
  855. package/deps/rocksdb/rocksdb/utilities/write_batch_with_index/write_batch_with_index_test.cc +1212 -672
  856. package/deps/rocksdb/rocksdb.gyp +425 -446
  857. package/index.js +5 -87
  858. package/package-lock.json +23687 -0
  859. package/package.json +8 -9
  860. package/prebuilds/darwin-arm64/node.napi.node +0 -0
  861. package/prebuilds/darwin-x64/node.napi.node +0 -0
  862. package/prebuilds/{darwin-x64+arm64 → linux-x64}/node.napi.node +0 -0
  863. package/deps/rocksdb/rocksdb/README.md +0 -32
  864. package/deps/rocksdb/rocksdb/env/env_hdfs.cc +0 -648
  865. package/deps/rocksdb/rocksdb/hdfs/README +0 -23
  866. package/deps/rocksdb/rocksdb/hdfs/env_hdfs.h +0 -386
  867. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/backupable_db.h +0 -535
  868. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/env_librados.h +0 -175
  869. package/deps/rocksdb/rocksdb/include/rocksdb/utilities/utility_db.h +0 -34
  870. package/deps/rocksdb/rocksdb/memory/memkind_kmem_allocator_test.cc +0 -102
  871. package/deps/rocksdb/rocksdb/memtable/hash_linklist_rep.h +0 -49
  872. package/deps/rocksdb/rocksdb/memtable/hash_skiplist_rep.h +0 -44
  873. package/deps/rocksdb/rocksdb/options/customizable_helper.h +0 -216
  874. package/deps/rocksdb/rocksdb/port/README +0 -10
  875. package/deps/rocksdb/rocksdb/third-party/folly/folly/CPortability.h +0 -27
  876. package/deps/rocksdb/rocksdb/third-party/folly/folly/ConstexprMath.h +0 -45
  877. package/deps/rocksdb/rocksdb/third-party/folly/folly/Indestructible.h +0 -166
  878. package/deps/rocksdb/rocksdb/third-party/folly/folly/Optional.h +0 -570
  879. package/deps/rocksdb/rocksdb/third-party/folly/folly/Portability.h +0 -92
  880. package/deps/rocksdb/rocksdb/third-party/folly/folly/ScopeGuard.h +0 -54
  881. package/deps/rocksdb/rocksdb/third-party/folly/folly/Traits.h +0 -152
  882. package/deps/rocksdb/rocksdb/third-party/folly/folly/Unit.h +0 -59
  883. package/deps/rocksdb/rocksdb/third-party/folly/folly/Utility.h +0 -141
  884. package/deps/rocksdb/rocksdb/third-party/folly/folly/chrono/Hardware.h +0 -33
  885. package/deps/rocksdb/rocksdb/third-party/folly/folly/container/Array.h +0 -74
  886. package/deps/rocksdb/rocksdb/third-party/folly/folly/detail/Futex-inl.h +0 -117
  887. package/deps/rocksdb/rocksdb/third-party/folly/folly/detail/Futex.cpp +0 -263
  888. package/deps/rocksdb/rocksdb/third-party/folly/folly/detail/Futex.h +0 -96
  889. package/deps/rocksdb/rocksdb/third-party/folly/folly/functional/Invoke.h +0 -40
  890. package/deps/rocksdb/rocksdb/third-party/folly/folly/hash/Hash.h +0 -29
  891. package/deps/rocksdb/rocksdb/third-party/folly/folly/lang/Align.h +0 -144
  892. package/deps/rocksdb/rocksdb/third-party/folly/folly/lang/Bits.h +0 -30
  893. package/deps/rocksdb/rocksdb/third-party/folly/folly/lang/Launder.h +0 -51
  894. package/deps/rocksdb/rocksdb/third-party/folly/folly/portability/Asm.h +0 -28
  895. package/deps/rocksdb/rocksdb/third-party/folly/folly/portability/SysSyscall.h +0 -10
  896. package/deps/rocksdb/rocksdb/third-party/folly/folly/portability/SysTypes.h +0 -26
  897. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/AtomicNotification-inl.h +0 -138
  898. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/AtomicNotification.cpp +0 -23
  899. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/AtomicNotification.h +0 -57
  900. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/AtomicUtil-inl.h +0 -260
  901. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/AtomicUtil.h +0 -52
  902. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/Baton.h +0 -328
  903. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/DistributedMutex-inl.h +0 -1703
  904. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/DistributedMutex.cpp +0 -16
  905. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/DistributedMutex.h +0 -304
  906. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/DistributedMutexSpecializations.h +0 -39
  907. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/ParkingLot.cpp +0 -26
  908. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/ParkingLot.h +0 -318
  909. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/WaitOptions.h +0 -57
  910. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/detail/InlineFunctionRef.h +0 -219
  911. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/detail/ProxyLockable-inl.h +0 -207
  912. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/detail/ProxyLockable.h +0 -164
  913. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/detail/Sleeper.h +0 -57
  914. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/detail/Spin.h +0 -77
  915. package/deps/rocksdb/rocksdb/third-party/folly/folly/synchronization/test/DistributedMutexTest.cpp +0 -1145
  916. package/deps/rocksdb/rocksdb/util/build_version.h +0 -15
  917. package/deps/rocksdb/rocksdb/util/xxh3p.h +0 -1392
  918. package/deps/rocksdb/rocksdb/utilities/backupable/backupable_db.cc +0 -2354
  919. package/deps/rocksdb/rocksdb/utilities/env_librados.cc +0 -1497
  920. package/deps/rocksdb/rocksdb/utilities/env_librados_test.cc +0 -1146
  921. package/deps/rocksdb/rocksdb/utilities/transactions/lock/range/range_tree/lib/README +0 -13
  922. package/deps/snappy/snappy-1.1.7/README.md +0 -149
  923. package/prebuilds/linux-x64/node.napi.glibc.node +0 -0
@@ -0,0 +1,3164 @@
1
+ // Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
2
+ // This source code is licensed under both the GPLv2 (found in the
3
+ // COPYING file in the root directory) and Apache 2.0 License
4
+ // (found in the LICENSE.Apache file in the root directory).
5
+ //
6
+ // Copyright (c) 2011 The LevelDB Authors. All rights reserved.
7
+ // Use of this source code is governed by a BSD-style license that can be
8
+ // found in the LICENSE file. See the AUTHORS file for names of contributors.
9
+
10
+ #ifndef ROCKSDB_LITE
11
+
12
+ #include <algorithm>
13
+ #include <atomic>
14
+ #include <cinttypes>
15
+ #include <cstdlib>
16
+ #include <functional>
17
+ #include <future>
18
+ #include <limits>
19
+ #include <map>
20
+ #include <mutex>
21
+ #include <sstream>
22
+ #include <string>
23
+ #include <thread>
24
+ #include <unordered_map>
25
+ #include <unordered_set>
26
+ #include <vector>
27
+
28
+ #include "env/composite_env_wrapper.h"
29
+ #include "env/fs_readonly.h"
30
+ #include "env/fs_remap.h"
31
+ #include "file/filename.h"
32
+ #include "file/line_file_reader.h"
33
+ #include "file/sequence_file_reader.h"
34
+ #include "file/writable_file_writer.h"
35
+ #include "logging/logging.h"
36
+ #include "monitoring/iostats_context_imp.h"
37
+ #include "options/options_helper.h"
38
+ #include "port/port.h"
39
+ #include "rocksdb/advanced_options.h"
40
+ #include "rocksdb/env.h"
41
+ #include "rocksdb/rate_limiter.h"
42
+ #include "rocksdb/statistics.h"
43
+ #include "rocksdb/transaction_log.h"
44
+ #include "table/sst_file_dumper.h"
45
+ #include "test_util/sync_point.h"
46
+ #include "util/cast_util.h"
47
+ #include "util/channel.h"
48
+ #include "util/coding.h"
49
+ #include "util/crc32c.h"
50
+ #include "util/math.h"
51
+ #include "util/string_util.h"
52
+ #include "utilities/backup/backup_engine_impl.h"
53
+ #include "utilities/checkpoint/checkpoint_impl.h"
54
+
55
+ namespace ROCKSDB_NAMESPACE {
56
+
57
+ namespace {
58
+ using ShareFilesNaming = BackupEngineOptions::ShareFilesNaming;
59
+
60
+ constexpr BackupID kLatestBackupIDMarker = static_cast<BackupID>(-2);
61
+
62
+ inline uint32_t ChecksumHexToInt32(const std::string& checksum_hex) {
63
+ std::string checksum_str;
64
+ Slice(checksum_hex).DecodeHex(&checksum_str);
65
+ return EndianSwapValue(DecodeFixed32(checksum_str.c_str()));
66
+ }
67
+ inline std::string ChecksumStrToHex(const std::string& checksum_str) {
68
+ return Slice(checksum_str).ToString(true);
69
+ }
70
+ inline std::string ChecksumInt32ToHex(const uint32_t& checksum_value) {
71
+ std::string checksum_str;
72
+ PutFixed32(&checksum_str, EndianSwapValue(checksum_value));
73
+ return ChecksumStrToHex(checksum_str);
74
+ }
75
+
76
// Names of the sub-directories used inside a backup directory. Each name is
// immediately followed by its "<name>/" variant, which is built from it.
const std::string kPrivateDirName = "private";
const std::string kPrivateDirSlash = kPrivateDirName + "/";

const std::string kMetaDirName = "meta";
const std::string kMetaDirSlash = kMetaDirName + "/";

const std::string kSharedDirName = "shared";
const std::string kSharedDirSlash = kSharedDirName + "/";

const std::string kSharedChecksumDirName = "shared_checksum";
const std::string kSharedChecksumDirSlash = kSharedChecksumDirName + "/";
84
+
85
+ } // namespace
86
+
87
+ void BackupStatistics::IncrementNumberSuccessBackup() {
88
+ number_success_backup++;
89
+ }
90
+ void BackupStatistics::IncrementNumberFailBackup() {
91
+ number_fail_backup++;
92
+ }
93
+
94
+ uint32_t BackupStatistics::GetNumberSuccessBackup() const {
95
+ return number_success_backup;
96
+ }
97
+ uint32_t BackupStatistics::GetNumberFailBackup() const {
98
+ return number_fail_backup;
99
+ }
100
+
101
+ std::string BackupStatistics::ToString() const {
102
+ char result[50];
103
+ snprintf(result, sizeof(result), "# success backup: %u, # fail backup: %u",
104
+ GetNumberSuccessBackup(), GetNumberFailBackup());
105
+ return result;
106
+ }
107
+
108
+ void BackupEngineOptions::Dump(Logger* logger) const {
109
+ ROCKS_LOG_INFO(logger, " Options.backup_dir: %s",
110
+ backup_dir.c_str());
111
+ ROCKS_LOG_INFO(logger, " Options.backup_env: %p", backup_env);
112
+ ROCKS_LOG_INFO(logger, " Options.share_table_files: %d",
113
+ static_cast<int>(share_table_files));
114
+ ROCKS_LOG_INFO(logger, " Options.info_log: %p", info_log);
115
+ ROCKS_LOG_INFO(logger, " Options.sync: %d",
116
+ static_cast<int>(sync));
117
+ ROCKS_LOG_INFO(logger, " Options.destroy_old_data: %d",
118
+ static_cast<int>(destroy_old_data));
119
+ ROCKS_LOG_INFO(logger, " Options.backup_log_files: %d",
120
+ static_cast<int>(backup_log_files));
121
+ ROCKS_LOG_INFO(logger, " Options.backup_rate_limit: %" PRIu64,
122
+ backup_rate_limit);
123
+ ROCKS_LOG_INFO(logger, " Options.restore_rate_limit: %" PRIu64,
124
+ restore_rate_limit);
125
+ ROCKS_LOG_INFO(logger, "Options.max_background_operations: %d",
126
+ max_background_operations);
127
+ }
128
+
129
+ namespace {
130
+ // -------- BackupEngineImpl class ---------
131
+ class BackupEngineImpl {
132
+ public:
133
+ BackupEngineImpl(const BackupEngineOptions& options, Env* db_env,
134
+ bool read_only = false);
135
+ ~BackupEngineImpl();
136
+
137
+ IOStatus CreateNewBackupWithMetadata(const CreateBackupOptions& options,
138
+ DB* db, const std::string& app_metadata,
139
+ BackupID* new_backup_id_ptr);
140
+
141
+ IOStatus PurgeOldBackups(uint32_t num_backups_to_keep);
142
+
143
+ IOStatus DeleteBackup(BackupID backup_id);
144
+
145
+ void StopBackup() { stop_backup_.store(true, std::memory_order_release); }
146
+
147
+ IOStatus GarbageCollect();
148
+
149
+ // The returned BackupInfos are in chronological order, which means the
150
+ // latest backup comes last.
151
+ void GetBackupInfo(std::vector<BackupInfo>* backup_info,
152
+ bool include_file_details) const;
153
+
154
+ Status GetBackupInfo(BackupID backup_id, BackupInfo* backup_info,
155
+ bool include_file_details = false) const;
156
+
157
+ void GetCorruptedBackups(std::vector<BackupID>* corrupt_backup_ids) const;
158
+
159
+ IOStatus RestoreDBFromBackup(const RestoreOptions& options,
160
+ BackupID backup_id, const std::string& db_dir,
161
+ const std::string& wal_dir) const;
162
+
163
+ IOStatus RestoreDBFromLatestBackup(const RestoreOptions& options,
164
+ const std::string& db_dir,
165
+ const std::string& wal_dir) const {
166
+ // Note: don't read latest_valid_backup_id_ outside of lock
167
+ return RestoreDBFromBackup(options, kLatestBackupIDMarker, db_dir, wal_dir);
168
+ }
169
+
170
+ IOStatus VerifyBackup(BackupID backup_id,
171
+ bool verify_with_checksum = false) const;
172
+
173
+ IOStatus Initialize();
174
+
175
+ ShareFilesNaming GetNamingNoFlags() const {
176
+ return options_.share_files_with_checksum_naming &
177
+ BackupEngineOptions::kMaskNoNamingFlags;
178
+ }
179
+ ShareFilesNaming GetNamingFlags() const {
180
+ return options_.share_files_with_checksum_naming &
181
+ BackupEngineOptions::kMaskNamingFlags;
182
+ }
183
+
184
+ private:
185
+ void DeleteChildren(const std::string& dir,
186
+ uint32_t file_type_filter = 0) const;
187
+ IOStatus DeleteBackupNoGC(BackupID backup_id);
188
+
189
+ // Extends the "result" map with pathname->size mappings for the contents of
190
+ // "dir" in "env". Pathnames are prefixed with "dir".
191
+ IOStatus ReadChildFileCurrentSizes(
192
+ const std::string& dir, const std::shared_ptr<FileSystem>&,
193
+ std::unordered_map<std::string, uint64_t>* result) const;
194
+
195
+ struct FileInfo {
196
+ FileInfo(const std::string& fname, uint64_t sz, const std::string& checksum,
197
+ const std::string& id, const std::string& sid, Temperature _temp)
198
+ : refs(0),
199
+ filename(fname),
200
+ size(sz),
201
+ checksum_hex(checksum),
202
+ db_id(id),
203
+ db_session_id(sid),
204
+ temp(_temp) {}
205
+
206
+ FileInfo(const FileInfo&) = delete;
207
+ FileInfo& operator=(const FileInfo&) = delete;
208
+
209
+ int refs;
210
+ const std::string filename;
211
+ const uint64_t size;
212
+ // crc32c checksum as hex. empty == unknown / unavailable
213
+ std::string checksum_hex;
214
+ // DB identities
215
+ // db_id is obtained for potential usage in the future but not used
216
+ // currently
217
+ const std::string db_id;
218
+ // db_session_id appears in the backup SST filename if the table naming
219
+ // option is kUseDbSessionId
220
+ const std::string db_session_id;
221
+ Temperature temp;
222
+
223
+ std::string GetDbFileName() {
224
+ std::string rv;
225
+ // extract the filename part
226
+ size_t slash = filename.find_last_of('/');
227
+ // file will either be shared/<file>, shared_checksum/<file_crc32c_size>,
228
+ // shared_checksum/<file_session>, shared_checksum/<file_crc32c_session>,
229
+ // or private/<number>/<file>
230
+ assert(slash != std::string::npos);
231
+ rv = filename.substr(slash + 1);
232
+
233
+ // if the file was in shared_checksum, extract the real file name
234
+ // in this case the file is <number>_<checksum>_<size>.<type>,
235
+ // <number>_<session>.<type>, or <number>_<checksum>_<session>.<type>
236
+ if (filename.substr(0, slash) == kSharedChecksumDirName) {
237
+ rv = GetFileFromChecksumFile(rv);
238
+ }
239
+ return rv;
240
+ }
241
+ };
242
+
243
+ static void LoopRateLimitRequestHelper(const size_t total_bytes_to_request,
244
+ RateLimiter* rate_limiter,
245
+ const Env::IOPriority pri,
246
+ Statistics* stats,
247
+ const RateLimiter::OpType op_type);
248
+
249
// Returns `path` with a single trailing '/' removed, or `path` unchanged if
// it is empty or does not end in '/'.
static inline std::string WithoutTrailingSlash(const std::string& path) {
  if (path.empty() || path.back() != '/') {
    return path;
  }
  // Keep everything before the final character. The previous
  // substr(path.size() - 1) returned only the trailing "/" itself.
  return path.substr(0, path.size() - 1);
}
256
+
257
// Returns `path` guaranteed to end in '/': a slash is appended unless the
// path already ends with one. An empty path yields "/".
static inline std::string WithTrailingSlash(const std::string& path) {
  const bool already_terminated = !path.empty() && path.back() == '/';
  if (already_terminated) {
    return path;
  }
  std::string with_slash = path;
  with_slash.push_back('/');
  return with_slash;
}
264
+
265
+ // A filesystem wrapper that makes shared backup files appear to be in the
266
+ // private backup directory (dst_dir), so that the private backup dir can
267
+ // be opened as a read-only DB.
268
+ class RemapSharedFileSystem : public RemapFileSystem {
269
+ public:
270
+ RemapSharedFileSystem(const std::shared_ptr<FileSystem>& base,
271
+ const std::string& dst_dir,
272
+ const std::string& src_base_dir,
273
+ const std::vector<std::shared_ptr<FileInfo>>& files)
274
+ : RemapFileSystem(base),
275
+ dst_dir_(WithoutTrailingSlash(dst_dir)),
276
+ dst_dir_slash_(WithTrailingSlash(dst_dir)),
277
+ src_base_dir_(WithTrailingSlash(src_base_dir)) {
278
+ for (auto& info : files) {
279
+ if (!StartsWith(info->filename, kPrivateDirSlash)) {
280
+ assert(StartsWith(info->filename, kSharedDirSlash) ||
281
+ StartsWith(info->filename, kSharedChecksumDirSlash));
282
+ remaps_[info->GetDbFileName()] = info;
283
+ }
284
+ }
285
+ }
286
+
287
+ const char* Name() const override {
288
+ return "BackupEngineImpl::RemapSharedFileSystem";
289
+ }
290
+
291
+ // Sometimes a directory listing is required in opening a DB
292
+ IOStatus GetChildren(const std::string& dir, const IOOptions& options,
293
+ std::vector<std::string>* result,
294
+ IODebugContext* dbg) override {
295
+ IOStatus s = RemapFileSystem::GetChildren(dir, options, result, dbg);
296
+ if (s.ok() && (dir == dst_dir_ || dir == dst_dir_slash_)) {
297
+ // Assume remapped files exist
298
+ for (auto& r : remaps_) {
299
+ result->push_back(r.first);
300
+ }
301
+ }
302
+ return s;
303
+ }
304
+
305
+ // Sometimes a directory listing is required in opening a DB
306
+ IOStatus GetChildrenFileAttributes(const std::string& dir,
307
+ const IOOptions& options,
308
+ std::vector<FileAttributes>* result,
309
+ IODebugContext* dbg) override {
310
+ IOStatus s =
311
+ RemapFileSystem::GetChildrenFileAttributes(dir, options, result, dbg);
312
+ if (s.ok() && (dir == dst_dir_ || dir == dst_dir_slash_)) {
313
+ // Assume remapped files exist with recorded size
314
+ for (auto& r : remaps_) {
315
+ result->emplace_back(); // clean up with C++20
316
+ FileAttributes& attr = result->back();
317
+ attr.name = r.first;
318
+ attr.size_bytes = r.second->size;
319
+ }
320
+ }
321
+ return s;
322
+ }
323
+
324
+ protected:
325
+ // When a file in dst_dir is requested, see if we need to remap to shared
326
+ // file path.
327
+ std::pair<IOStatus, std::string> EncodePath(
328
+ const std::string& path) override {
329
+ if (path.empty() || path[0] != '/') {
330
+ return {IOStatus::InvalidArgument(path, "Not an absolute path"), ""};
331
+ }
332
+ std::pair<IOStatus, std::string> rv{IOStatus(), path};
333
+ if (StartsWith(path, dst_dir_slash_)) {
334
+ std::string relative = path.substr(dst_dir_slash_.size());
335
+ auto it = remaps_.find(relative);
336
+ if (it != remaps_.end()) {
337
+ rv.second = src_base_dir_ + it->second->filename;
338
+ }
339
+ }
340
+ return rv;
341
+ }
342
+
343
+ private:
344
+ // Absolute path to a directory that some extra files will be mapped into.
345
+ const std::string dst_dir_;
346
+ // Includes a trailing slash.
347
+ const std::string dst_dir_slash_;
348
+ // Absolute path to a directory containing some files to be mapped into
349
+ // dst_dir_. Includes a trailing slash.
350
+ const std::string src_base_dir_;
351
+ // If remaps_[x] exists, attempt to read dst_dir_ / x should instead read
352
+ // src_base_dir_ / remaps_[x]->filename. FileInfo is used to maximize
353
+ // sharing with other backup data in memory.
354
+ std::unordered_map<std::string, std::shared_ptr<FileInfo>> remaps_;
355
+ };
356
+
357
+ class BackupMeta {
358
+ public:
359
+ BackupMeta(
360
+ const std::string& meta_filename, const std::string& meta_tmp_filename,
361
+ std::unordered_map<std::string, std::shared_ptr<FileInfo>>* file_infos,
362
+ Env* env, const std::shared_ptr<FileSystem>& fs)
363
+ : timestamp_(0),
364
+ sequence_number_(0),
365
+ size_(0),
366
+ meta_filename_(meta_filename),
367
+ meta_tmp_filename_(meta_tmp_filename),
368
+ file_infos_(file_infos),
369
+ env_(env),
370
+ fs_(fs) {}
371
+
372
+ BackupMeta(const BackupMeta&) = delete;
373
+ BackupMeta& operator=(const BackupMeta&) = delete;
374
+
375
+ ~BackupMeta() {}
376
+
377
+ void RecordTimestamp() {
378
+ // Best effort
379
+ Status s = env_->GetCurrentTime(&timestamp_);
380
+ if (!s.ok()) {
381
+ timestamp_ = /* something clearly fabricated */ 1;
382
+ }
383
+ }
384
+ int64_t GetTimestamp() const {
385
+ return timestamp_;
386
+ }
387
+ uint64_t GetSize() const {
388
+ return size_;
389
+ }
390
+ uint32_t GetNumberFiles() const {
391
+ return static_cast<uint32_t>(files_.size());
392
+ }
393
+ void SetSequenceNumber(uint64_t sequence_number) {
394
+ sequence_number_ = sequence_number;
395
+ }
396
+ uint64_t GetSequenceNumber() const { return sequence_number_; }
397
+
398
+ const std::string& GetAppMetadata() const { return app_metadata_; }
399
+
400
+ void SetAppMetadata(const std::string& app_metadata) {
401
+ app_metadata_ = app_metadata;
402
+ }
403
+
404
+ IOStatus AddFile(std::shared_ptr<FileInfo> file_info);
405
+
406
+ IOStatus Delete(bool delete_meta = true);
407
+
408
+ bool Empty() const { return files_.empty(); }
409
+
410
+ std::shared_ptr<FileInfo> GetFile(const std::string& filename) const {
411
+ auto it = file_infos_->find(filename);
412
+ if (it == file_infos_->end()) {
413
+ return nullptr;
414
+ }
415
+ return it->second;
416
+ }
417
+
418
+ const std::vector<std::shared_ptr<FileInfo>>& GetFiles() const {
419
+ return files_;
420
+ }
421
+
422
+ // @param abs_path_to_size Pre-fetched file sizes (bytes).
423
+ IOStatus LoadFromFile(
424
+ const std::string& backup_dir,
425
+ const std::unordered_map<std::string, uint64_t>& abs_path_to_size,
426
+ RateLimiter* rate_limiter, Logger* info_log,
427
+ std::unordered_set<std::string>* reported_ignored_fields);
428
+ IOStatus StoreToFile(
429
+ bool sync, int schema_version,
430
+ const TEST_BackupMetaSchemaOptions* schema_test_options);
431
+
432
+ std::string GetInfoString() {
433
+ std::ostringstream ss;
434
+ ss << "Timestamp: " << timestamp_ << std::endl;
435
+ char human_size[16];
436
+ AppendHumanBytes(size_, human_size, sizeof(human_size));
437
+ ss << "Size: " << human_size << std::endl;
438
+ ss << "Files:" << std::endl;
439
+ for (const auto& file : files_) {
440
+ AppendHumanBytes(file->size, human_size, sizeof(human_size));
441
+ ss << file->filename << ", size " << human_size << ", refs "
442
+ << file->refs << std::endl;
443
+ }
444
+ return ss.str();
445
+ }
446
+
447
+ const std::shared_ptr<Env>& GetEnvForOpen() const {
448
+ if (!env_for_open_) {
449
+ // Lazy initialize
450
+ // Find directories
451
+ std::string dst_dir = meta_filename_;
452
+ auto i = dst_dir.rfind(kMetaDirSlash);
453
+ assert(i != std::string::npos);
454
+ std::string src_base_dir = dst_dir.substr(0, i);
455
+ dst_dir.replace(i, kMetaDirSlash.size(), kPrivateDirSlash);
456
+ // Make the RemapSharedFileSystem
457
+ std::shared_ptr<FileSystem> remap_fs =
458
+ std::make_shared<RemapSharedFileSystem>(fs_, dst_dir, src_base_dir,
459
+ files_);
460
+ // Make it read-only for safety
461
+ remap_fs = std::make_shared<ReadOnlyFileSystem>(remap_fs);
462
+ // Make an Env wrapper
463
+ env_for_open_ = std::make_shared<CompositeEnvWrapper>(env_, remap_fs);
464
+ }
465
+ return env_for_open_;
466
+ }
467
+
468
+ private:
469
+ int64_t timestamp_;
470
+ // sequence number is only approximate, should not be used
471
+ // by clients
472
+ uint64_t sequence_number_;
473
+ uint64_t size_;
474
+ std::string app_metadata_;
475
+ std::string const meta_filename_;
476
+ std::string const meta_tmp_filename_;
477
+ // files with relative paths (without "/" prefix!!)
478
+ std::vector<std::shared_ptr<FileInfo>> files_;
479
+ std::unordered_map<std::string, std::shared_ptr<FileInfo>>* file_infos_;
480
+ Env* env_;
481
+ mutable std::shared_ptr<Env> env_for_open_;
482
+ std::shared_ptr<FileSystem> fs_;
483
+ IOOptions iooptions_ = IOOptions();
484
+ }; // BackupMeta
485
+
486
+ void SetBackupInfoFromBackupMeta(BackupID id, const BackupMeta& meta,
487
+ BackupInfo* backup_info,
488
+ bool include_file_details) const;
489
+
490
+ inline std::string GetAbsolutePath(
491
+ const std::string &relative_path = "") const {
492
+ assert(relative_path.size() == 0 || relative_path[0] != '/');
493
+ return options_.backup_dir + "/" + relative_path;
494
+ }
495
+ inline std::string GetPrivateFileRel(BackupID backup_id,
496
+ bool tmp = false,
497
+ const std::string& file = "") const {
498
+ assert(file.size() == 0 || file[0] != '/');
499
+ return kPrivateDirSlash + ROCKSDB_NAMESPACE::ToString(backup_id) +
500
+ (tmp ? ".tmp" : "") + "/" + file;
501
+ }
502
+ inline std::string GetSharedFileRel(const std::string& file = "",
503
+ bool tmp = false) const {
504
+ assert(file.size() == 0 || file[0] != '/');
505
+ return kSharedDirSlash + std::string(tmp ? "." : "") + file +
506
+ (tmp ? ".tmp" : "");
507
+ }
508
+ inline std::string GetSharedFileWithChecksumRel(const std::string& file = "",
509
+ bool tmp = false) const {
510
+ assert(file.size() == 0 || file[0] != '/');
511
+ return kSharedChecksumDirSlash + std::string(tmp ? "." : "") + file +
512
+ (tmp ? ".tmp" : "");
513
+ }
514
+ inline bool UseLegacyNaming(const std::string& sid) const {
515
+ return GetNamingNoFlags() ==
516
+ BackupEngineOptions::kLegacyCrc32cAndFileSize ||
517
+ sid.empty();
518
+ }
519
+ inline std::string GetSharedFileWithChecksum(
520
+ const std::string& file, const std::string& checksum_hex,
521
+ const uint64_t file_size, const std::string& db_session_id) const {
522
+ assert(file.size() == 0 || file[0] != '/');
523
+ std::string file_copy = file;
524
+ if (UseLegacyNaming(db_session_id)) {
525
+ assert(!checksum_hex.empty());
526
+ file_copy.insert(file_copy.find_last_of('.'),
527
+ "_" + ToString(ChecksumHexToInt32(checksum_hex)) + "_" +
528
+ ToString(file_size));
529
+ } else {
530
+ file_copy.insert(file_copy.find_last_of('.'), "_s" + db_session_id);
531
+ if (GetNamingFlags() & BackupEngineOptions::kFlagIncludeFileSize) {
532
+ file_copy.insert(file_copy.find_last_of('.'),
533
+ "_" + ToString(file_size));
534
+ }
535
+ }
536
+ return file_copy;
537
+ }
538
// Recovers the original file name from a shared_checksum file name by
// removing everything from the first '_' up to (but not including) the last
// '.', e.g. "000010_12345_678.sst" -> "000010.sst".
//
// A name without any '_' carries no decoration and is returned unchanged;
// previously this case reached erase() with npos and threw
// std::out_of_range. `file` must not start with '/'.
static inline std::string GetFileFromChecksumFile(const std::string& file) {
  assert(file.empty() || file.front() != '/');
  const size_t first_underscore = file.find('_');
  if (first_underscore == std::string::npos) {
    return file;
  }
  std::string stripped = file;
  const size_t last_dot = file.rfind('.');
  if (last_dot == std::string::npos || last_dot < first_underscore) {
    // No extension after the decoration: drop everything from the '_' on,
    // which is what the unguarded length arithmetic effectively did.
    stripped.erase(first_underscore);
  } else {
    stripped.erase(first_underscore, last_dot - first_underscore);
  }
  return stripped;
}
545
+ inline std::string GetBackupMetaFile(BackupID backup_id, bool tmp) const {
546
+ return GetAbsolutePath(kMetaDirName) + "/" + (tmp ? "." : "") +
547
+ ROCKSDB_NAMESPACE::ToString(backup_id) + (tmp ? ".tmp" : "");
548
+ }
549
+
550
+ // If size_limit == 0, there is no size limit, copy everything.
551
+ //
552
+ // Exactly one of src and contents must be non-empty.
553
+ //
554
+ // @param src If non-empty, the file is copied from this pathname.
555
+ // @param contents If non-empty, the file will be created with these contents.
556
+ // @param src_temperature Pass in expected temperature of src, return back
557
+ // temperature reported by FileSystem
558
+ IOStatus CopyOrCreateFile(const std::string& src, const std::string& dst,
559
+ const std::string& contents, uint64_t size_limit,
560
+ Env* src_env, Env* dst_env,
561
+ const EnvOptions& src_env_options, bool sync,
562
+ RateLimiter* rate_limiter,
563
+ std::function<void()> progress_callback,
564
+ Temperature* src_temperature,
565
+ Temperature dst_temperature,
566
+ uint64_t* bytes_toward_next_callback,
567
+ uint64_t* size, std::string* checksum_hex);
568
+
569
+ IOStatus ReadFileAndComputeChecksum(const std::string& src,
570
+ const std::shared_ptr<FileSystem>& src_fs,
571
+ const EnvOptions& src_env_options,
572
+ uint64_t size_limit,
573
+ std::string* checksum_hex,
574
+ const Temperature src_temperature) const;
575
+
576
+ // Obtain db_id and db_session_id from the table properties of file_path
577
+ Status GetFileDbIdentities(Env* src_env, const EnvOptions& src_env_options,
578
+ const std::string& file_path,
579
+ Temperature file_temp, RateLimiter* rate_limiter,
580
+ std::string* db_id, std::string* db_session_id);
581
+
582
+ struct CopyOrCreateResult {
583
+ ~CopyOrCreateResult() {
584
+ // The Status needs to be ignored here for two reasons.
585
+ // First, if the BackupEngineImpl shuts down with jobs outstanding, then
586
+ // it is possible that the Status in the future/promise is never read,
587
+ // resulting in an unchecked Status. Second, if there are items in the
588
+ // channel when the BackupEngineImpl is shutdown, these will also have
589
+ // Status that have not been checked. This
590
+ // TODO: Fix those issues so that the Status
591
+ io_status.PermitUncheckedError();
592
+ }
593
+ uint64_t size;
594
+ std::string checksum_hex;
595
+ std::string db_id;
596
+ std::string db_session_id;
597
+ IOStatus io_status;
598
+ Temperature expected_src_temperature = Temperature::kUnknown;
599
+ Temperature current_src_temperature = Temperature::kUnknown;
600
+ };
601
+
602
+ // Exactly one of src_path and contents must be non-empty. If src_path is
603
+ // non-empty, the file is copied from this pathname. Otherwise, if contents is
604
+ // non-empty, the file will be created at dst_path with these contents.
605
+ struct CopyOrCreateWorkItem {
606
+ std::string src_path;
607
+ std::string dst_path;
608
+ Temperature src_temperature;
609
+ Temperature dst_temperature;
610
+ std::string contents;
611
+ Env* src_env;
612
+ Env* dst_env;
613
+ EnvOptions src_env_options;
614
+ bool sync;
615
+ RateLimiter* rate_limiter;
616
+ uint64_t size_limit;
617
+ Statistics* stats;
618
+ std::promise<CopyOrCreateResult> result;
619
+ std::function<void()> progress_callback;
620
+ std::string src_checksum_func_name;
621
+ std::string src_checksum_hex;
622
+ std::string db_id;
623
+ std::string db_session_id;
624
+
625
+ CopyOrCreateWorkItem()
626
+ : src_path(""),
627
+ dst_path(""),
628
+ src_temperature(Temperature::kUnknown),
629
+ dst_temperature(Temperature::kUnknown),
630
+ contents(""),
631
+ src_env(nullptr),
632
+ dst_env(nullptr),
633
+ src_env_options(),
634
+ sync(false),
635
+ rate_limiter(nullptr),
636
+ size_limit(0),
637
+ stats(nullptr),
638
+ src_checksum_func_name(kUnknownFileChecksumFuncName),
639
+ src_checksum_hex(""),
640
+ db_id(""),
641
+ db_session_id("") {}
642
+
643
+ CopyOrCreateWorkItem(const CopyOrCreateWorkItem&) = delete;
644
+ CopyOrCreateWorkItem& operator=(const CopyOrCreateWorkItem&) = delete;
645
+
646
+ CopyOrCreateWorkItem(CopyOrCreateWorkItem&& o) ROCKSDB_NOEXCEPT {
647
+ *this = std::move(o);
648
+ }
649
+
650
+ CopyOrCreateWorkItem& operator=(CopyOrCreateWorkItem&& o) ROCKSDB_NOEXCEPT {
651
+ src_path = std::move(o.src_path);
652
+ dst_path = std::move(o.dst_path);
653
+ src_temperature = std::move(o.src_temperature);
654
+ dst_temperature = std::move(o.dst_temperature);
655
+ contents = std::move(o.contents);
656
+ src_env = o.src_env;
657
+ dst_env = o.dst_env;
658
+ src_env_options = std::move(o.src_env_options);
659
+ sync = o.sync;
660
+ rate_limiter = o.rate_limiter;
661
+ size_limit = o.size_limit;
662
+ stats = o.stats;
663
+ result = std::move(o.result);
664
+ progress_callback = std::move(o.progress_callback);
665
+ src_checksum_func_name = std::move(o.src_checksum_func_name);
666
+ src_checksum_hex = std::move(o.src_checksum_hex);
667
+ db_id = std::move(o.db_id);
668
+ db_session_id = std::move(o.db_session_id);
669
+ src_temperature = o.src_temperature;
670
+ return *this;
671
+ }
672
+
673
+ CopyOrCreateWorkItem(
674
+ std::string _src_path, std::string _dst_path,
675
+ const Temperature _src_temperature, const Temperature _dst_temperature,
676
+ std::string _contents, Env* _src_env, Env* _dst_env,
677
+ EnvOptions _src_env_options, bool _sync, RateLimiter* _rate_limiter,
678
+ uint64_t _size_limit, Statistics* _stats,
679
+ std::function<void()> _progress_callback = []() {},
680
+ const std::string& _src_checksum_func_name =
681
+ kUnknownFileChecksumFuncName,
682
+ const std::string& _src_checksum_hex = "",
683
+ const std::string& _db_id = "", const std::string& _db_session_id = "")
684
+ : src_path(std::move(_src_path)),
685
+ dst_path(std::move(_dst_path)),
686
+ src_temperature(_src_temperature),
687
+ dst_temperature(_dst_temperature),
688
+ contents(std::move(_contents)),
689
+ src_env(_src_env),
690
+ dst_env(_dst_env),
691
+ src_env_options(std::move(_src_env_options)),
692
+ sync(_sync),
693
+ rate_limiter(_rate_limiter),
694
+ size_limit(_size_limit),
695
+ stats(_stats),
696
+ progress_callback(_progress_callback),
697
+ src_checksum_func_name(_src_checksum_func_name),
698
+ src_checksum_hex(_src_checksum_hex),
699
+ db_id(_db_id),
700
+ db_session_id(_db_session_id) {}
701
+ };
702
+
703
// Bookkeeping kept for one queued copy/create job during a backup: the
// future for the job's CopyOrCreateResult plus the flags and paths used
// once that result is available. Only move operations are declared.
+ struct BackupAfterCopyOrCreateWorkItem {
704
+ std::future<CopyOrCreateResult> result;  // outcome of the queued job
705
+ bool shared;
706
+ bool needed_to_copy;
707
+ Env* backup_env;
708
+ std::string dst_path_tmp;
709
+ std::string dst_path;
710
+ std::string dst_relative;
// Default state: both flags false, no Env, empty paths.
711
+ BackupAfterCopyOrCreateWorkItem()
712
+ : shared(false),
713
+ needed_to_copy(false),
714
+ backup_env(nullptr),
715
+ dst_path_tmp(""),
716
+ dst_path(""),
717
+ dst_relative("") {}
718
+
// Move construction is implemented in terms of move assignment below.
719
+ BackupAfterCopyOrCreateWorkItem(BackupAfterCopyOrCreateWorkItem&& o)
720
+ ROCKSDB_NOEXCEPT {
721
+ *this = std::move(o);
722
+ }
723
+
// Transfers every member: the future and strings are moved, the flags and
// the Env pointer are copied.
724
+ BackupAfterCopyOrCreateWorkItem& operator=(
725
+ BackupAfterCopyOrCreateWorkItem&& o) ROCKSDB_NOEXCEPT {
726
+ result = std::move(o.result);
727
+ shared = o.shared;
728
+ needed_to_copy = o.needed_to_copy;
729
+ backup_env = o.backup_env;
730
+ dst_path_tmp = std::move(o.dst_path_tmp);
731
+ dst_path = std::move(o.dst_path);
732
+ dst_relative = std::move(o.dst_relative);
733
+ return *this;
734
+ }
735
+
// Full constructor; takes ownership of the future and of the by-value
// path strings.
736
+ BackupAfterCopyOrCreateWorkItem(std::future<CopyOrCreateResult>&& _result,
737
+ bool _shared, bool _needed_to_copy,
738
+ Env* _backup_env, std::string _dst_path_tmp,
739
+ std::string _dst_path,
740
+ std::string _dst_relative)
741
+ : result(std::move(_result)),
742
+ shared(_shared),
743
+ needed_to_copy(_needed_to_copy),
744
+ backup_env(_backup_env),
745
+ dst_path_tmp(std::move(_dst_path_tmp)),
746
+ dst_path(std::move(_dst_path)),
747
+ dst_relative(std::move(_dst_relative)) {}
748
+ };
749
+
750
// Bookkeeping kept for one queued copy job during a restore: the future for
// the job's CopyOrCreateResult plus the source/destination file names and
// the checksum stored alongside them. Only move operations are declared.
+ struct RestoreAfterCopyOrCreateWorkItem {
751
+ std::future<CopyOrCreateResult> result;
752
+ std::string from_file;
753
+ std::string to_file;
754
+ std::string checksum_hex;
755
+ RestoreAfterCopyOrCreateWorkItem() : checksum_hex("") {}
756
+ RestoreAfterCopyOrCreateWorkItem(std::future<CopyOrCreateResult>&& _result,
757
+ const std::string& _from_file,
758
+ const std::string& _to_file,
759
+ const std::string& _checksum_hex)
760
+ : result(std::move(_result)),
761
+ from_file(_from_file),
762
+ to_file(_to_file),
763
+ checksum_hex(_checksum_hex) {}
// Move construction is implemented in terms of move assignment below.
764
+ RestoreAfterCopyOrCreateWorkItem(RestoreAfterCopyOrCreateWorkItem&& o)
765
+ ROCKSDB_NOEXCEPT {
766
+ *this = std::move(o);
767
+ }
768
+
// Transfers every member. from_file and to_file were previously skipped,
// so any move (for example a container relocating its elements) silently
// blanked them.
769
+ RestoreAfterCopyOrCreateWorkItem& operator=(
770
+ RestoreAfterCopyOrCreateWorkItem&& o) ROCKSDB_NOEXCEPT {
771
+ result = std::move(o.result);
+ from_file = std::move(o.from_file);
+ to_file = std::move(o.to_file);
772
+ checksum_hex = std::move(o.checksum_hex);
773
+ return *this;
774
+ }
775
+ };
776
+
777
+ bool initialized_;
778
+ std::mutex byte_report_mutex_;
779
+ mutable channel<CopyOrCreateWorkItem> files_to_copy_or_create_;
780
+ std::vector<port::Thread> threads_;
781
+ std::atomic<CpuPriority> threads_cpu_priority_;
782
+
783
+ // Certain operations like PurgeOldBackups and DeleteBackup will trigger
784
+ // automatic GarbageCollect (true) unless we've already done one in this
785
+ // session and have not failed to delete backup files since then (false).
786
+ bool might_need_garbage_collect_ = true;
787
+
788
+ // Adds a file to the backup work queue to be copied or created if it doesn't
789
+ // already exist.
790
+ //
791
+ // Exactly one of src_dir and contents must be non-empty.
792
+ //
793
+ // @param src_dir If non-empty, the file in this directory named fname will be
794
+ // copied.
795
+ // @param fname Name of destination file and, in case of copy, source file.
796
+ // @param contents If non-empty, the file will be created with these contents.
797
+ IOStatus AddBackupFileWorkItem(
798
+ std::unordered_set<std::string>& live_dst_paths,
799
+ std::vector<BackupAfterCopyOrCreateWorkItem>& backup_items_to_finish,
800
+ BackupID backup_id, bool shared, const std::string& src_dir,
801
+ const std::string& fname, // starts with "/"
802
+ const EnvOptions& src_env_options, RateLimiter* rate_limiter,
803
+ FileType file_type, uint64_t size_bytes, Statistics* stats,
804
+ uint64_t size_limit = 0, bool shared_checksum = false,
805
+ std::function<void()> progress_callback = []() {},
806
+ const std::string& contents = std::string(),
807
+ const std::string& src_checksum_func_name = kUnknownFileChecksumFuncName,
808
+ const std::string& src_checksum_str = kUnknownFileChecksum,
809
+ const Temperature src_temperature = Temperature::kUnknown);
810
+
811
+ // backup state data
812
+ BackupID latest_backup_id_;
813
+ BackupID latest_valid_backup_id_;
814
+ std::map<BackupID, std::unique_ptr<BackupMeta>> backups_;
815
+ std::map<BackupID, std::pair<IOStatus, std::unique_ptr<BackupMeta>>>
816
+ corrupt_backups_;
817
+ std::unordered_map<std::string,
818
+ std::shared_ptr<FileInfo>> backuped_file_infos_;
819
+ std::atomic<bool> stop_backup_;
820
+
821
+ // options data
822
+ BackupEngineOptions options_;
823
+ Env* db_env_;
824
+ Env* backup_env_;
825
+
826
+ // directories
827
+ std::unique_ptr<FSDirectory> backup_directory_;
828
+ std::unique_ptr<FSDirectory> shared_directory_;
829
+ std::unique_ptr<FSDirectory> meta_directory_;
830
+ std::unique_ptr<FSDirectory> private_directory_;
831
+
832
+ static const size_t kDefaultCopyFileBufferSize = 5 * 1024 * 1024LL; // 5MB
833
+ bool read_only_;
834
+ BackupStatistics backup_statistics_;
835
+ std::unordered_set<std::string> reported_ignored_fields_;
836
+ static const size_t kMaxAppMetaSize = 1024 * 1024; // 1MB
837
+ std::shared_ptr<FileSystem> db_fs_;
838
+ std::shared_ptr<FileSystem> backup_fs_;
839
+ IOOptions io_options_ = IOOptions();
840
+
841
+ public:
842
+ std::unique_ptr<TEST_BackupMetaSchemaOptions> schema_test_options_;
843
+ };
844
+
845
+ // -------- BackupEngineImplThreadSafe class ---------
846
+ // This locking layer for thread safety in the public API is layered on
847
+ // top to prevent accidental recursive locking with RWMutex, which is UB.
848
+ // Note: BackupEngineReadOnlyBase inherited twice, but has no fields
849
// Wrapper that owns a BackupEngineImpl and a reader/writer mutex. Each
// override below takes the lock indicated in its body (or none) and then
// forwards to the same-named call on impl_.
+ class BackupEngineImplThreadSafe : public BackupEngine,
850
+ public BackupEngineReadOnly {
851
+ public:
// Constructs the wrapped implementation in place; read_only defaults to
// false.
852
+ BackupEngineImplThreadSafe(const BackupEngineOptions& options, Env* db_env,
853
+ bool read_only = false)
854
+ : impl_(options, db_env, read_only) {}
855
+ ~BackupEngineImplThreadSafe() override {}
856
+
// --- Operations forwarded under the write lock ---
857
+ using BackupEngine::CreateNewBackupWithMetadata;
858
+ IOStatus CreateNewBackupWithMetadata(const CreateBackupOptions& options,
859
+ DB* db, const std::string& app_metadata,
860
+ BackupID* new_backup_id) override {
861
+ WriteLock lock(&mutex_);
862
+ return impl_.CreateNewBackupWithMetadata(options, db, app_metadata,
863
+ new_backup_id);
864
+ }
865
+
866
+ IOStatus PurgeOldBackups(uint32_t num_backups_to_keep) override {
867
+ WriteLock lock(&mutex_);
868
+ return impl_.PurgeOldBackups(num_backups_to_keep);
869
+ }
870
+
871
+ IOStatus DeleteBackup(BackupID backup_id) override {
872
+ WriteLock lock(&mutex_);
873
+ return impl_.DeleteBackup(backup_id);
874
+ }
875
+
// Forwarded without taking mutex_.
876
+ void StopBackup() override {
877
+ // No locking needed
878
+ impl_.StopBackup();
879
+ }
880
+
881
+ IOStatus GarbageCollect() override {
882
+ WriteLock lock(&mutex_);
883
+ return impl_.GarbageCollect();
884
+ }
885
+
// --- Operations forwarded under the read lock ---
// "Latest" is expressed by passing kLatestBackupIDMarker as the backup id.
886
+ Status GetLatestBackupInfo(BackupInfo* backup_info,
887
+ bool include_file_details = false) const override {
888
+ ReadLock lock(&mutex_);
889
+ return impl_.GetBackupInfo(kLatestBackupIDMarker, backup_info,
890
+ include_file_details);
891
+ }
892
+
893
+ Status GetBackupInfo(BackupID backup_id, BackupInfo* backup_info,
894
+ bool include_file_details = false) const override {
895
+ ReadLock lock(&mutex_);
896
+ return impl_.GetBackupInfo(backup_id, backup_info, include_file_details);
897
+ }
898
+
899
+ void GetBackupInfo(std::vector<BackupInfo>* backup_info,
900
+ bool include_file_details) const override {
901
+ ReadLock lock(&mutex_);
902
+ impl_.GetBackupInfo(backup_info, include_file_details);
903
+ }
904
+
905
+ void GetCorruptedBackups(
906
+ std::vector<BackupID>* corrupt_backup_ids) const override {
907
+ ReadLock lock(&mutex_);
908
+ impl_.GetCorruptedBackups(corrupt_backup_ids);
909
+ }
910
+
911
+ using BackupEngine::RestoreDBFromBackup;
912
+ IOStatus RestoreDBFromBackup(const RestoreOptions& options,
913
+ BackupID backup_id, const std::string& db_dir,
914
+ const std::string& wal_dir) const override {
915
+ ReadLock lock(&mutex_);
916
+ return impl_.RestoreDBFromBackup(options, backup_id, db_dir, wal_dir);
917
+ }
918
+
// Takes no lock itself: it calls this class's RestoreDBFromBackup, which
// acquires the read lock.
919
+ using BackupEngine::RestoreDBFromLatestBackup;
920
+ IOStatus RestoreDBFromLatestBackup(
921
+ const RestoreOptions& options, const std::string& db_dir,
922
+ const std::string& wal_dir) const override {
923
+ // Defer to above function, which locks
924
+ return RestoreDBFromBackup(options, kLatestBackupIDMarker, db_dir, wal_dir);
925
+ }
926
+
927
+ IOStatus VerifyBackup(BackupID backup_id,
928
+ bool verify_with_checksum = false) const override {
929
+ ReadLock lock(&mutex_);
930
+ return impl_.VerifyBackup(backup_id, verify_with_checksum);
931
+ }
932
+
933
+ // Not public API but needed
934
+ IOStatus Initialize() {
935
+ // No locking needed
936
+ return impl_.Initialize();
937
+ }
938
+
// Replaces impl_.schema_test_options_ with a copy of `options`; mutex_ is
// not taken here.
939
+ // Not public API but used in testing
940
+ void TEST_SetBackupMetaSchemaOptions(
941
+ const TEST_BackupMetaSchemaOptions& options) {
942
+ impl_.schema_test_options_.reset(new TEST_BackupMetaSchemaOptions(options));
943
+ }
944
+
945
+ private:
// mutex_ is mutable so the const overrides above can lock it.
946
+ mutable port::RWMutex mutex_;
947
+ BackupEngineImpl impl_;
948
+ };
949
+ } // namespace
950
+
951
// Creates a BackupEngineImplThreadSafe (read_only left at its default) and
// initializes it. On failure *backup_engine_ptr is set to nullptr and the
// error is returned; the engine is destroyed by the unique_ptr. On success
// ownership of the engine is released to *backup_engine_ptr.
+ IOStatus BackupEngine::Open(const BackupEngineOptions& options, Env* env,
952
+ BackupEngine** backup_engine_ptr) {
953
+ std::unique_ptr<BackupEngineImplThreadSafe> backup_engine(
954
+ new BackupEngineImplThreadSafe(options, env));
955
+ auto s = backup_engine->Initialize();
956
+ if (!s.ok()) {
957
+ *backup_engine_ptr = nullptr;
958
+ return s;
959
+ }
960
+ *backup_engine_ptr = backup_engine.release();
961
+ return IOStatus::OK();
962
+ }
963
+
964
+ namespace {
965
// Copies the options and records the Envs; no initialization work is done
// here beyond what the body shows (Initialize() is a separate call).
// backup_env_ falls back to the DB Env when options.backup_env is null.
+ BackupEngineImpl::BackupEngineImpl(const BackupEngineOptions& options,
966
+ Env* db_env, bool read_only)
967
+ : initialized_(false),
968
+ threads_cpu_priority_(),
969
+ latest_backup_id_(0),
970
+ latest_valid_backup_id_(0),
971
+ stop_backup_(false),
972
+ options_(options),
973
+ db_env_(db_env),
974
+ backup_env_(options.backup_env != nullptr ? options.backup_env : db_env_),
975
+ read_only_(read_only) {
// If no limiter object was supplied but a positive numeric limit was,
// build a generic rate limiter from that number (backup, then restore).
976
+ if (options_.backup_rate_limiter == nullptr &&
977
+ options_.backup_rate_limit > 0) {
978
+ options_.backup_rate_limiter.reset(
979
+ NewGenericRateLimiter(options_.backup_rate_limit));
980
+ }
981
+ if (options_.restore_rate_limiter == nullptr &&
982
+ options_.restore_rate_limit > 0) {
983
+ options_.restore_rate_limiter.reset(
984
+ NewGenericRateLimiter(options_.restore_rate_limit));
985
+ }
// Cache the FileSystem of each Env for later use.
986
+ db_fs_ = db_env_->GetFileSystem();
987
+ backup_fs_ = backup_env_->GetFileSystem();
988
+ }
989
+
990
// Sends EOF on the work channel, joins every worker thread, flushes the
// info log, and calls PermitUncheckedError() on the status stored with each
// corrupt backup.
+ BackupEngineImpl::~BackupEngineImpl() {
991
+ files_to_copy_or_create_.sendEof();
992
+ for (auto& t : threads_) {
993
+ t.join();
994
+ }
995
+ LogFlush(options_.info_log);
996
+ for (const auto& it : corrupt_backups_) {
997
+ it.second.first.PermitUncheckedError();
998
+ }
999
+ }
1000
+
1001
// One-time setup; asserts it has not run before. In order:
//  1. When not read-only: force max_valid_backups_to_open to kMaxInt32 and
//     create/open the backup, shared, private and meta directories.
//  2. List the meta directory and register a BackupMeta for every file whose
//     name is exactly the decimal form of a non-zero backup id.
//  3. Either purge everything (destroy_old_data) or load backups from the
//     highest id downward, moving Corruption/NotSupported results to
//     corrupt_backups_ and returning any other error.
//  4. Start max_background_operations worker threads that serve
//     files_to_copy_or_create_.
// Returns the first I/O error encountered, otherwise OK.
+ IOStatus BackupEngineImpl::Initialize() {
1002
+ assert(!initialized_);
1003
+ initialized_ = true;
1004
+ if (read_only_) {
1005
+ ROCKS_LOG_INFO(options_.info_log, "Starting read_only backup engine");
1006
+ }
1007
+ options_.Dump(options_.info_log);
1008
+
1009
+ auto meta_path = GetAbsolutePath(kMetaDirName);
1010
+
1011
+ if (!read_only_) {
1012
+ // we might need to clean up from previous crash or I/O errors
1013
+ might_need_garbage_collect_ = true;
1014
+
1015
+ if (options_.max_valid_backups_to_open != port::kMaxInt32) {
1016
+ options_.max_valid_backups_to_open = port::kMaxInt32;
1017
+ ROCKS_LOG_WARN(
1018
+ options_.info_log,
1019
+ "`max_valid_backups_to_open` is not set to the default value. Ignoring "
1020
+ "its value since BackupEngine is not read-only.");
1021
+ }
1022
+
1023
+ // gather the list of directories that we need to create
1024
+ std::vector<std::pair<std::string, std::unique_ptr<FSDirectory>*>>
1025
+ directories;
1026
+ directories.emplace_back(GetAbsolutePath(), &backup_directory_);
1027
+ if (options_.share_table_files) {
1028
+ if (options_.share_files_with_checksum) {
1029
+ directories.emplace_back(
1030
+ GetAbsolutePath(GetSharedFileWithChecksumRel()),
1031
+ &shared_directory_);
1032
+ } else {
1033
+ directories.emplace_back(GetAbsolutePath(GetSharedFileRel()),
1034
+ &shared_directory_);
1035
+ }
1036
+ }
1037
+ directories.emplace_back(GetAbsolutePath(kPrivateDirName),
1038
+ &private_directory_);
1039
+ directories.emplace_back(meta_path, &meta_directory_);
1040
+ // create all the dirs we need
1041
+ for (const auto& d : directories) {
1042
+ IOStatus io_s =
1043
+ backup_fs_->CreateDirIfMissing(d.first, io_options_, nullptr);
1044
+ if (io_s.ok()) {
1045
+ io_s =
1046
+ backup_fs_->NewDirectory(d.first, io_options_, d.second, nullptr);
1047
+ }
1048
+ if (!io_s.ok()) {
1049
+ return io_s;
1050
+ }
1051
+ }
1052
+ }
1053
+
// List the meta directory; a NotFound result is reported with the path in
// the message, any other failure is returned unchanged.
1054
+ std::vector<std::string> backup_meta_files;
1055
+ {
1056
+ IOStatus io_s = backup_fs_->GetChildren(meta_path, io_options_,
1057
+ &backup_meta_files, nullptr);
1058
+ if (io_s.IsNotFound()) {
1059
+ return IOStatus::NotFound(meta_path + " is missing");
1060
+ } else if (!io_s.ok()) {
1061
+ return io_s;
1062
+ }
1063
+ }
1064
+ // create backups_ structure
1065
+ for (auto& file : backup_meta_files) {
1066
+ ROCKS_LOG_INFO(options_.info_log, "Detected backup %s", file.c_str());
// backup_id stays 0 if sscanf parses nothing; the round-trip comparison
// below also rejects names with extra characters.
1067
+ BackupID backup_id = 0;
1068
+ sscanf(file.c_str(), "%u", &backup_id);
1069
+ if (backup_id == 0 || file != ROCKSDB_NAMESPACE::ToString(backup_id)) {
1070
+ // Invalid file name, will be deleted with auto-GC when user
1071
+ // initiates an append or write operation. (Behave as read-only until
1072
+ // then.)
1073
+ ROCKS_LOG_INFO(options_.info_log, "Skipping unrecognized meta file %s",
1074
+ file.c_str());
1075
+ continue;
1076
+ }
1077
+ assert(backups_.find(backup_id) == backups_.end());
1078
+ // Insert all the (backup_id, BackupMeta) that will be loaded later
1079
+ // The loading performed later will check whether there are corrupt backups
1080
+ // and move the corrupt backups to corrupt_backups_
1081
+ backups_.insert(std::make_pair(
1082
+ backup_id, std::unique_ptr<BackupMeta>(new BackupMeta(
1083
+ GetBackupMetaFile(backup_id, false /* tmp */),
1084
+ GetBackupMetaFile(backup_id, true /* tmp */),
1085
+ &backuped_file_infos_, backup_env_, backup_fs_))));
1086
+ }
1087
+
1088
+ latest_backup_id_ = 0;
1089
+ latest_valid_backup_id_ = 0;
1090
+ if (options_.destroy_old_data) { // Destroy old data
1091
+ assert(!read_only_);
1092
+ ROCKS_LOG_INFO(
1093
+ options_.info_log,
1094
+ "Backup Engine started with destroy_old_data == true, deleting all "
1095
+ "backups");
1096
+ IOStatus io_s = PurgeOldBackups(0);
1097
+ if (io_s.ok()) {
1098
+ io_s = GarbageCollect();
1099
+ }
1100
+ if (!io_s.ok()) {
1101
+ return io_s;
1102
+ }
1103
+ } else { // Load data from storage
1104
+ // abs_path_to_size: maps absolute paths of files in backup directory to
1105
+ // their corresponding sizes
1106
+ std::unordered_map<std::string, uint64_t> abs_path_to_size;
1107
+ // Insert files and their sizes in backup sub-directories (shared and
1108
+ // shared_checksum) to abs_path_to_size
1109
+ for (const auto& rel_dir :
1110
+ {GetSharedFileRel(), GetSharedFileWithChecksumRel()}) {
1111
+ const auto abs_dir = GetAbsolutePath(rel_dir);
1112
+ IOStatus io_s =
1113
+ ReadChildFileCurrentSizes(abs_dir, backup_fs_, &abs_path_to_size);
1114
+ if (!io_s.ok()) {
1115
+ // I/O error likely impacting all backups
1116
+ return io_s;
1117
+ }
1118
+ }
1119
+ // load the backups if any, until valid_backups_to_open of the latest
1120
+ // non-corrupted backups have been successfully opened.
1121
+ int valid_backups_to_open = options_.max_valid_backups_to_open;
// Reverse iteration over the ordered map visits the highest backup id
// first, so the first entry seen becomes latest_backup_id_.
1122
+ for (auto backup_iter = backups_.rbegin();
1123
+ backup_iter != backups_.rend();
1124
+ ++backup_iter) {
1125
+ assert(latest_backup_id_ == 0 || latest_backup_id_ > backup_iter->first);
1126
+ if (latest_backup_id_ == 0) {
1127
+ latest_backup_id_ = backup_iter->first;
1128
+ }
1129
+ if (valid_backups_to_open == 0) {
1130
+ break;
1131
+ }
1132
+
1133
+ // Insert files and their sizes in backup sub-directories
1134
+ // (private/backup_id) to abs_path_to_size
1135
+ IOStatus io_s = ReadChildFileCurrentSizes(
1136
+ GetAbsolutePath(GetPrivateFileRel(backup_iter->first)), backup_fs_,
1137
+ &abs_path_to_size);
1138
+ if (io_s.ok()) {
1139
+ io_s = backup_iter->second->LoadFromFile(
1140
+ options_.backup_dir, abs_path_to_size,
1141
+ options_.backup_rate_limiter.get(), options_.info_log,
1142
+ &reported_ignored_fields_);
1143
+ }
1144
+ if (io_s.IsCorruption() || io_s.IsNotSupported()) {
1145
+ ROCKS_LOG_INFO(options_.info_log, "Backup %u corrupted -- %s",
1146
+ backup_iter->first, io_s.ToString().c_str());
// The BackupMeta is moved out here; the now-empty map entry is erased
// from backups_ after the loop.
1147
+ corrupt_backups_.insert(std::make_pair(
1148
+ backup_iter->first,
1149
+ std::make_pair(io_s, std::move(backup_iter->second))));
1150
+ } else if (!io_s.ok()) {
1151
+ // Distinguish corruption errors from errors in the backup Env.
1152
+ // Errors in the backup Env (i.e., this code path) will cause Open() to
1153
+ // fail, whereas corruption errors would not cause Open() failures.
1154
+ return io_s;
1155
+ } else {
1156
+ ROCKS_LOG_INFO(options_.info_log, "Loading backup %" PRIu32 " OK:\n%s",
1157
+ backup_iter->first,
1158
+ backup_iter->second->GetInfoString().c_str());
1159
+ assert(latest_valid_backup_id_ == 0 ||
1160
+ latest_valid_backup_id_ > backup_iter->first);
1161
+ if (latest_valid_backup_id_ == 0) {
1162
+ latest_valid_backup_id_ = backup_iter->first;
1163
+ }
1164
+ --valid_backups_to_open;
1165
+ }
1166
+ }
1167
+
1168
+ for (const auto& corrupt : corrupt_backups_) {
1169
+ backups_.erase(backups_.find(corrupt.first));
1170
+ }
1171
+ // erase the backups before max_valid_backups_to_open
1172
+ int num_unopened_backups;
1173
+ if (options_.max_valid_backups_to_open == 0) {
1174
+ num_unopened_backups = 0;
1175
+ } else {
1176
+ num_unopened_backups =
1177
+ std::max(0, static_cast<int>(backups_.size()) -
1178
+ options_.max_valid_backups_to_open);
1179
+ }
// Entries are dropped from the front of the ordered map, i.e. lowest
// backup ids first; each is asserted to be Empty().
1180
+ for (int i = 0; i < num_unopened_backups; ++i) {
1181
+ assert(backups_.begin()->second->Empty());
1182
+ backups_.erase(backups_.begin());
1183
+ }
1184
+ }
1185
+
1186
+ ROCKS_LOG_INFO(options_.info_log, "Latest backup is %u", latest_backup_id_);
1187
+ ROCKS_LOG_INFO(options_.info_log, "Latest valid backup is %u",
1188
+ latest_valid_backup_id_);
1189
+
1190
+ // set up threads to perform copies from files_to_copy_or_create_ in the
1191
+ // background
1192
+ threads_cpu_priority_ = CpuPriority::kNormal;
1193
+ threads_.reserve(options_.max_background_operations);
1194
+ for (int t = 0; t < options_.max_background_operations; t++) {
// Each worker captures `this`; the destructor joins the threads.
1195
+ threads_.emplace_back([this]() {
1196
+ #if defined(_GNU_SOURCE) && defined(__GLIBC_PREREQ)
1197
+ #if __GLIBC_PREREQ(2, 12)
1198
+ pthread_setname_np(pthread_self(), "backup_engine");
1199
+ #endif
1200
+ #endif
1201
+ CpuPriority current_priority = CpuPriority::kNormal;
1202
+ CopyOrCreateWorkItem work_item;
1203
+ uint64_t bytes_toward_next_callback = 0;
// The loop ends when read() returns false (presumably after sendEof() in
// the destructor; the channel type is not visible here).
1204
+ while (files_to_copy_or_create_.read(work_item)) {
// Apply a changed threads_cpu_priority_ to this thread before working.
1205
+ CpuPriority priority = threads_cpu_priority_;
1206
+ if (current_priority != priority) {
1207
+ TEST_SYNC_POINT_CALLBACK(
1208
+ "BackupEngineImpl::Initialize:SetCpuPriority", &priority);
1209
+ port::SetCpuPriority(0, priority);
1210
+ current_priority = priority;
1211
+ }
1212
+ // `bytes_read` and `bytes_written` stats are enabled based on
1213
+ // compile-time support and cannot be dynamically toggled. So we do not
1214
+ // need to worry about `PerfLevel` here, unlike many other
1215
+ // `IOStatsContext` / `PerfContext` stats.
1216
+ uint64_t prev_bytes_read = IOSTATS(bytes_read);
1217
+ uint64_t prev_bytes_written = IOSTATS(bytes_written);
1218
+
1219
+ CopyOrCreateResult result;
// `temp` starts as the expected source temperature and is passed by
// pointer to CopyOrCreateFile; its value afterwards is reported as
// current_src_temperature.
1220
+ Temperature temp = work_item.src_temperature;
1221
+ result.io_status = CopyOrCreateFile(
1222
+ work_item.src_path, work_item.dst_path, work_item.contents,
1223
+ work_item.size_limit, work_item.src_env, work_item.dst_env,
1224
+ work_item.src_env_options, work_item.sync, work_item.rate_limiter,
1225
+ work_item.progress_callback, &temp, work_item.dst_temperature,
1226
+ &bytes_toward_next_callback, &result.size, &result.checksum_hex);
1227
+
1228
+ RecordTick(work_item.stats, BACKUP_READ_BYTES,
1229
+ IOSTATS(bytes_read) - prev_bytes_read);
1230
+ RecordTick(work_item.stats, BACKUP_WRITE_BYTES,
1231
+ IOSTATS(bytes_written) - prev_bytes_written);
1232
+
1233
+ result.db_id = work_item.db_id;
1234
+ result.db_session_id = work_item.db_session_id;
1235
+ result.expected_src_temperature = work_item.src_temperature;
1236
+ result.current_src_temperature = temp;
1237
+ if (result.io_status.ok() && !work_item.src_checksum_hex.empty()) {
1238
+ // unknown checksum function name implies no db table file checksum in
1239
+ // db manifest; work_item.src_checksum_hex not empty means
1240
+ // backup engine has calculated its crc32c checksum for the table
1241
+ // file; therefore, we are able to compare the checksums.
1242
+ if (work_item.src_checksum_func_name ==
1243
+ kUnknownFileChecksumFuncName ||
1244
+ work_item.src_checksum_func_name == kDbFileChecksumFuncName) {
1245
+ if (work_item.src_checksum_hex != result.checksum_hex) {
1246
+ std::string checksum_info(
1247
+ "Expected checksum is " + work_item.src_checksum_hex +
1248
+ " while computed checksum is " + result.checksum_hex);
1249
+ result.io_status = IOStatus::Corruption(
1250
+ "Checksum mismatch after copying to " + work_item.dst_path +
1251
+ ": " + checksum_info);
1252
+ }
1253
+ } else {
1254
+ // FIXME(peterd): dead code?
1255
+ std::string checksum_function_info(
1256
+ "Existing checksum function is " +
1257
+ work_item.src_checksum_func_name +
1258
+ " while provided checksum function is " +
1259
+ kBackupFileChecksumFuncName);
1260
+ ROCKS_LOG_INFO(
1261
+ options_.info_log,
1262
+ "Unable to verify checksum after copying to %s: %s\n",
1263
+ work_item.dst_path.c_str(), checksum_function_info.c_str());
1264
+ }
1265
+ }
// Publish the outcome through the work item's `result`.
1266
+ work_item.result.set_value(std::move(result));
1267
+ }
1268
+ });
1269
+ }
1270
+ ROCKS_LOG_INFO(options_.info_log, "Initialized BackupEngine");
1271
+ return IOStatus::OK();
1272
+ }
1273
+
1274
+ IOStatus BackupEngineImpl::CreateNewBackupWithMetadata(
1275
+ const CreateBackupOptions& options, DB* db, const std::string& app_metadata,
1276
+ BackupID* new_backup_id_ptr) {
1277
+ assert(initialized_);
1278
+ assert(!read_only_);
1279
+ if (app_metadata.size() > kMaxAppMetaSize) {
1280
+ return IOStatus::InvalidArgument("App metadata too large");
1281
+ }
1282
+
1283
+ if (options.decrease_background_thread_cpu_priority) {
1284
+ if (options.background_thread_cpu_priority < threads_cpu_priority_) {
1285
+ threads_cpu_priority_.store(options.background_thread_cpu_priority);
1286
+ }
1287
+ }
1288
+
1289
+ BackupID new_backup_id = latest_backup_id_ + 1;
1290
+
1291
+ // `bytes_read` and `bytes_written` stats are enabled based on compile-time
1292
+ // support and cannot be dynamically toggled. So we do not need to worry about
1293
+ // `PerfLevel` here, unlike many other `IOStatsContext` / `PerfContext` stats.
1294
+ uint64_t prev_bytes_read = IOSTATS(bytes_read);
1295
+ uint64_t prev_bytes_written = IOSTATS(bytes_written);
1296
+
1297
+ assert(backups_.find(new_backup_id) == backups_.end());
1298
+
1299
+ auto private_dir = GetAbsolutePath(GetPrivateFileRel(new_backup_id));
1300
+ IOStatus io_s = backup_fs_->FileExists(private_dir, io_options_, nullptr);
1301
+ if (io_s.ok()) {
1302
+ // maybe last backup failed and left partial state behind, clean it up.
1303
+ // need to do this before updating backups_ such that a private dir
1304
+ // named after new_backup_id will be cleaned up.
1305
+ // (If an incomplete new backup is followed by an incomplete delete
1306
+ // of the latest full backup, then there could be more than one next
1307
+ // id with a private dir, the last thing to be deleted in delete
1308
+ // backup, but all will be cleaned up with a GarbageCollect.)
1309
+ io_s = GarbageCollect();
1310
+ } else if (io_s.IsNotFound()) {
1311
+ // normal case, the new backup's private dir doesn't exist yet
1312
+ io_s = IOStatus::OK();
1313
+ }
1314
+
1315
+ auto ret = backups_.insert(std::make_pair(
1316
+ new_backup_id, std::unique_ptr<BackupMeta>(new BackupMeta(
1317
+ GetBackupMetaFile(new_backup_id, false /* tmp */),
1318
+ GetBackupMetaFile(new_backup_id, true /* tmp */),
1319
+ &backuped_file_infos_, backup_env_, backup_fs_))));
1320
+ assert(ret.second == true);
1321
+ auto& new_backup = ret.first->second;
1322
+ new_backup->RecordTimestamp();
1323
+ new_backup->SetAppMetadata(app_metadata);
1324
+
1325
+ auto start_backup = backup_env_->NowMicros();
1326
+
1327
+ ROCKS_LOG_INFO(options_.info_log,
1328
+ "Started the backup process -- creating backup %u",
1329
+ new_backup_id);
1330
+
1331
+ if (options_.share_table_files && !options_.share_files_with_checksum) {
1332
+ ROCKS_LOG_WARN(options_.info_log,
1333
+ "BackupEngineOptions::share_files_with_checksum=false is "
1334
+ "DEPRECATED and could lead to data loss.");
1335
+ }
1336
+
1337
+ if (io_s.ok()) {
1338
+ io_s = backup_fs_->CreateDir(private_dir, io_options_, nullptr);
1339
+ }
1340
+
1341
+ // A set into which we will insert the dst_paths that are calculated for live
1342
+ // files and live WAL files.
1343
+ // This is used to check whether a live file shares a dst_path with another
1344
+ // live file.
1345
+ std::unordered_set<std::string> live_dst_paths;
1346
+
1347
+ std::vector<BackupAfterCopyOrCreateWorkItem> backup_items_to_finish;
1348
+ // Add a CopyOrCreateWorkItem to the channel for each live file
1349
+ Status disabled = db->DisableFileDeletions();
1350
+ DBOptions db_options = db->GetDBOptions();
1351
+ Statistics* stats = db_options.statistics.get();
1352
+ if (io_s.ok()) {
1353
+ CheckpointImpl checkpoint(db);
1354
+ uint64_t sequence_number = 0;
1355
+ FileChecksumGenFactory* db_checksum_factory =
1356
+ db_options.file_checksum_gen_factory.get();
1357
+ const std::string kFileChecksumGenFactoryName =
1358
+ "FileChecksumGenCrc32cFactory";
1359
+ bool compare_checksum =
1360
+ db_checksum_factory != nullptr &&
1361
+ db_checksum_factory->Name() == kFileChecksumGenFactoryName
1362
+ ? true
1363
+ : false;
1364
+ EnvOptions src_raw_env_options(db_options);
1365
+ RateLimiter* rate_limiter = options_.backup_rate_limiter.get();
1366
+ io_s = status_to_io_status(checkpoint.CreateCustomCheckpoint(
1367
+ [&](const std::string& /*src_dirname*/, const std::string& /*fname*/,
1368
+ FileType) {
1369
+ // custom checkpoint will switch to calling copy_file_cb after it sees
1370
+ // NotSupported returned from link_file_cb.
1371
+ return IOStatus::NotSupported();
1372
+ } /* link_file_cb */,
1373
+ [&](const std::string& src_dirname, const std::string& fname,
1374
+ uint64_t size_limit_bytes, FileType type,
1375
+ const std::string& checksum_func_name,
1376
+ const std::string& checksum_val,
1377
+ const Temperature src_temperature) {
1378
+ if (type == kWalFile && !options_.backup_log_files) {
1379
+ return IOStatus::OK();
1380
+ }
1381
+ Log(options_.info_log, "add file for backup %s", fname.c_str());
1382
+ uint64_t size_bytes = 0;
1383
+ IOStatus io_st;
1384
+ if (type == kTableFile || type == kBlobFile) {
1385
+ io_st = db_fs_->GetFileSize(src_dirname + "/" + fname, io_options_,
1386
+ &size_bytes, nullptr);
1387
+ }
1388
+ EnvOptions src_env_options;
1389
+ switch (type) {
1390
+ case kWalFile:
1391
+ src_env_options =
1392
+ db_env_->OptimizeForLogRead(src_raw_env_options);
1393
+ break;
1394
+ case kTableFile:
1395
+ src_env_options = db_env_->OptimizeForCompactionTableRead(
1396
+ src_raw_env_options, ImmutableDBOptions(db_options));
1397
+ break;
1398
+ case kDescriptorFile:
1399
+ src_env_options =
1400
+ db_env_->OptimizeForManifestRead(src_raw_env_options);
1401
+ break;
1402
+ case kBlobFile:
1403
+ src_env_options = db_env_->OptimizeForBlobFileRead(
1404
+ src_raw_env_options, ImmutableDBOptions(db_options));
1405
+ break;
1406
+ default:
1407
+ // Other backed up files (like options file) are not read by live
1408
+ // DB, so don't need to worry about avoiding mixing buffered and
1409
+ // direct I/O. Just use plain defaults.
1410
+ src_env_options = src_raw_env_options;
1411
+ break;
1412
+ }
1413
+ if (io_st.ok()) {
1414
+ io_st = AddBackupFileWorkItem(
1415
+ live_dst_paths, backup_items_to_finish, new_backup_id,
1416
+ options_.share_table_files &&
1417
+ (type == kTableFile || type == kBlobFile),
1418
+ src_dirname, fname, src_env_options, rate_limiter, type,
1419
+ size_bytes, db_options.statistics.get(), size_limit_bytes,
1420
+ options_.share_files_with_checksum &&
1421
+ (type == kTableFile || type == kBlobFile),
1422
+ options.progress_callback, "" /* contents */,
1423
+ checksum_func_name, checksum_val, src_temperature);
1424
+ }
1425
+ return io_st;
1426
+ } /* copy_file_cb */,
1427
+ [&](const std::string& fname, const std::string& contents,
1428
+ FileType type) {
1429
+ Log(options_.info_log, "add file for backup %s", fname.c_str());
1430
+ return AddBackupFileWorkItem(
1431
+ live_dst_paths, backup_items_to_finish, new_backup_id,
1432
+ false /* shared */, "" /* src_dir */, fname,
1433
+ EnvOptions() /* src_env_options */, rate_limiter, type,
1434
+ contents.size(), db_options.statistics.get(), 0 /* size_limit */,
1435
+ false /* shared_checksum */, options.progress_callback, contents);
1436
+ } /* create_file_cb */,
1437
+ &sequence_number, options.flush_before_backup ? 0 : port::kMaxUint64,
1438
+ compare_checksum));
1439
+ if (io_s.ok()) {
1440
+ new_backup->SetSequenceNumber(sequence_number);
1441
+ }
1442
+ }
1443
+ ROCKS_LOG_INFO(options_.info_log, "add files for backup done, wait finish.");
1444
+ IOStatus item_io_status;
1445
+ for (auto& item : backup_items_to_finish) {
1446
+ item.result.wait();
1447
+ auto result = item.result.get();
1448
+ item_io_status = result.io_status;
1449
+ Temperature temp = result.expected_src_temperature;
1450
+ if (result.current_src_temperature != Temperature::kUnknown &&
1451
+ (temp == Temperature::kUnknown ||
1452
+ options_.current_temperatures_override_manifest)) {
1453
+ temp = result.current_src_temperature;
1454
+ }
1455
+ if (item_io_status.ok() && item.shared && item.needed_to_copy) {
1456
+ item_io_status = item.backup_env->GetFileSystem()->RenameFile(
1457
+ item.dst_path_tmp, item.dst_path, io_options_, nullptr);
1458
+ }
1459
+ if (item_io_status.ok()) {
1460
+ item_io_status = new_backup.get()->AddFile(std::make_shared<FileInfo>(
1461
+ item.dst_relative, result.size, result.checksum_hex, result.db_id,
1462
+ result.db_session_id, temp));
1463
+ }
1464
+ if (!item_io_status.ok()) {
1465
+ io_s = item_io_status;
1466
+ }
1467
+ }
1468
+
1469
+ // we copied all the files, enable file deletions
1470
+ if (disabled.ok()) { // If we successfully disabled file deletions
1471
+ db->EnableFileDeletions(false).PermitUncheckedError();
1472
+ }
1473
+ auto backup_time = backup_env_->NowMicros() - start_backup;
1474
+
1475
+ if (io_s.ok()) {
1476
+ // persist the backup metadata on the disk
1477
+ io_s = new_backup->StoreToFile(options_.sync, options_.schema_version,
1478
+ schema_test_options_.get());
1479
+ }
1480
+ if (io_s.ok() && options_.sync) {
1481
+ std::unique_ptr<FSDirectory> backup_private_directory;
1482
+ backup_fs_
1483
+ ->NewDirectory(GetAbsolutePath(GetPrivateFileRel(new_backup_id, false)),
1484
+ io_options_, &backup_private_directory, nullptr)
1485
+ .PermitUncheckedError();
1486
+ if (backup_private_directory != nullptr) {
1487
+ io_s = backup_private_directory->FsyncWithDirOptions(io_options_, nullptr,
1488
+ DirFsyncOptions());
1489
+ }
1490
+ if (io_s.ok() && private_directory_ != nullptr) {
1491
+ io_s = private_directory_->FsyncWithDirOptions(io_options_, nullptr,
1492
+ DirFsyncOptions());
1493
+ }
1494
+ if (io_s.ok() && meta_directory_ != nullptr) {
1495
+ io_s = meta_directory_->FsyncWithDirOptions(io_options_, nullptr,
1496
+ DirFsyncOptions());
1497
+ }
1498
+ if (io_s.ok() && shared_directory_ != nullptr) {
1499
+ io_s = shared_directory_->FsyncWithDirOptions(io_options_, nullptr,
1500
+ DirFsyncOptions());
1501
+ }
1502
+ if (io_s.ok() && backup_directory_ != nullptr) {
1503
+ io_s = backup_directory_->FsyncWithDirOptions(io_options_, nullptr,
1504
+ DirFsyncOptions());
1505
+ }
1506
+ }
1507
+
1508
+ if (io_s.ok()) {
1509
+ backup_statistics_.IncrementNumberSuccessBackup();
1510
+ // here we know that we succeeded and installed the new backup
1511
+ latest_backup_id_ = new_backup_id;
1512
+ latest_valid_backup_id_ = new_backup_id;
1513
+ if (new_backup_id_ptr) {
1514
+ *new_backup_id_ptr = new_backup_id;
1515
+ }
1516
+ ROCKS_LOG_INFO(options_.info_log, "Backup DONE. All is good");
1517
+
1518
+ // backup_speed is in MB/s: bytes per microsecond, scaled by 1.048576
1519
+ double backup_speed = new_backup->GetSize() / (1.048576 * backup_time);
1520
+ ROCKS_LOG_INFO(options_.info_log, "Backup number of files: %u",
1521
+ new_backup->GetNumberFiles());
1522
+ char human_size[16];
1523
+ AppendHumanBytes(new_backup->GetSize(), human_size, sizeof(human_size));
1524
+ ROCKS_LOG_INFO(options_.info_log, "Backup size: %s", human_size);
1525
+ ROCKS_LOG_INFO(options_.info_log, "Backup time: %" PRIu64 " microseconds",
1526
+ backup_time);
1527
+ ROCKS_LOG_INFO(options_.info_log, "Backup speed: %.3f MB/s", backup_speed);
1528
+ ROCKS_LOG_INFO(options_.info_log, "Backup Statistics %s",
1529
+ backup_statistics_.ToString().c_str());
1530
+ } else {
1531
+ backup_statistics_.IncrementNumberFailBackup();
1532
+ // clean all the files we might have created
1533
+ ROCKS_LOG_INFO(options_.info_log, "Backup failed -- %s",
1534
+ io_s.ToString().c_str());
1535
+ ROCKS_LOG_INFO(options_.info_log, "Backup Statistics %s\n",
1536
+ backup_statistics_.ToString().c_str());
1537
+ // delete files that we might have already written
1538
+ might_need_garbage_collect_ = true;
1539
+ DeleteBackup(new_backup_id).PermitUncheckedError();
1540
+ }
1541
+
1542
+ RecordTick(stats, BACKUP_READ_BYTES, IOSTATS(bytes_read) - prev_bytes_read);
1543
+ RecordTick(stats, BACKUP_WRITE_BYTES,
1544
+ IOSTATS(bytes_written) - prev_bytes_written);
1545
+ return io_s;
1546
+ }
1547
+
1548
+ IOStatus BackupEngineImpl::PurgeOldBackups(uint32_t num_backups_to_keep) {
1549
+ assert(initialized_);
1550
+ assert(!read_only_);
1551
+
1552
+ // Best effort deletion even with errors
1553
+ IOStatus overall_status = IOStatus::OK();
1554
+
1555
+ ROCKS_LOG_INFO(options_.info_log, "Purging old backups, keeping %u",
1556
+ num_backups_to_keep);
1557
+ std::vector<BackupID> to_delete;
1558
+ auto itr = backups_.begin();
1559
+ while ((backups_.size() - to_delete.size()) > num_backups_to_keep) {
1560
+ to_delete.push_back(itr->first);
1561
+ itr++;
1562
+ }
1563
+ for (auto backup_id : to_delete) {
1564
+ // Do not GC until end
1565
+ IOStatus io_s = DeleteBackupNoGC(backup_id);
1566
+ if (!io_s.ok()) {
1567
+ overall_status = io_s;
1568
+ }
1569
+ }
1570
+ // Clean up after any incomplete backup deletion, potentially from
1571
+ // earlier session.
1572
+ if (might_need_garbage_collect_) {
1573
+ IOStatus io_s = GarbageCollect();
1574
+ if (!io_s.ok() && overall_status.ok()) {
1575
+ overall_status = io_s;
1576
+ }
1577
+ }
1578
+ return overall_status;
1579
+ }
1580
+
1581
+ IOStatus BackupEngineImpl::DeleteBackup(BackupID backup_id) {
1582
+ IOStatus s1 = DeleteBackupNoGC(backup_id);
1583
+ IOStatus s2 = IOStatus::OK();
1584
+
1585
+ // Clean up after any incomplete backup deletion, potentially from
1586
+ // earlier session.
1587
+ if (might_need_garbage_collect_) {
1588
+ s2 = GarbageCollect();
1589
+ }
1590
+
1591
+ if (!s1.ok()) {
1592
+ // Any failure in the primary objective trumps any failure in the
1593
+ // secondary objective.
1594
+ s2.PermitUncheckedError();
1595
+ return s1;
1596
+ } else {
1597
+ return s2;
1598
+ }
1599
+ }
1600
+
1601
+ // Does not auto-GarbageCollect nor lock
1602
+ IOStatus BackupEngineImpl::DeleteBackupNoGC(BackupID backup_id) {
1603
+ assert(initialized_);
1604
+ assert(!read_only_);
1605
+
1606
+ ROCKS_LOG_INFO(options_.info_log, "Deleting backup %u", backup_id);
1607
+ auto backup = backups_.find(backup_id);
1608
+ if (backup != backups_.end()) {
1609
+ IOStatus io_s = backup->second->Delete();
1610
+ if (!io_s.ok()) {
1611
+ return io_s;
1612
+ }
1613
+ backups_.erase(backup);
1614
+ } else {
1615
+ auto corrupt = corrupt_backups_.find(backup_id);
1616
+ if (corrupt == corrupt_backups_.end()) {
1617
+ return IOStatus::NotFound("Backup not found");
1618
+ }
1619
+ IOStatus io_s = corrupt->second.second->Delete();
1620
+ if (!io_s.ok()) {
1621
+ return io_s;
1622
+ }
1623
+ corrupt->second.first.PermitUncheckedError();
1624
+ corrupt_backups_.erase(corrupt);
1625
+ }
1626
+
1627
+ // After removing meta file, best effort deletion even with errors.
1628
+ // (Don't delete other files if we can't delete the meta file right
1629
+ // now.)
1630
+ std::vector<std::string> to_delete;
1631
+ for (auto& itr : backuped_file_infos_) {
1632
+ if (itr.second->refs == 0) {
1633
+ IOStatus io_s = backup_fs_->DeleteFile(GetAbsolutePath(itr.first),
1634
+ io_options_, nullptr);
1635
+ ROCKS_LOG_INFO(options_.info_log, "Deleting %s -- %s", itr.first.c_str(),
1636
+ io_s.ToString().c_str());
1637
+ to_delete.push_back(itr.first);
1638
+ if (!io_s.ok()) {
1639
+ // Trying again later might work
1640
+ might_need_garbage_collect_ = true;
1641
+ }
1642
+ }
1643
+ }
1644
+ for (auto& td : to_delete) {
1645
+ backuped_file_infos_.erase(td);
1646
+ }
1647
+
1648
+ // take care of private dirs -- GarbageCollect() will take care of them
1649
+ // if they are not empty
1650
+ std::string private_dir = GetPrivateFileRel(backup_id);
1651
+ IOStatus io_s =
1652
+ backup_fs_->DeleteDir(GetAbsolutePath(private_dir), io_options_, nullptr);
1653
+ ROCKS_LOG_INFO(options_.info_log, "Deleting private dir %s -- %s",
1654
+ private_dir.c_str(), io_s.ToString().c_str());
1655
+ if (!io_s.ok()) {
1656
+ // Full gc or trying again later might work
1657
+ might_need_garbage_collect_ = true;
1658
+ }
1659
+ return IOStatus::OK();
1660
+ }
1661
+
1662
+ void BackupEngineImpl::SetBackupInfoFromBackupMeta(
1663
+ BackupID id, const BackupMeta& meta, BackupInfo* backup_info,
1664
+ bool include_file_details) const {
1665
+ *backup_info = BackupInfo(id, meta.GetTimestamp(), meta.GetSize(),
1666
+ meta.GetNumberFiles(), meta.GetAppMetadata());
1667
+ std::string dir = options_.backup_dir + "/" + kPrivateDirSlash +
1668
+ ROCKSDB_NAMESPACE::ToString(id);
1669
+ if (include_file_details) {
1670
+ auto& file_details = backup_info->file_details;
1671
+ file_details.reserve(meta.GetFiles().size());
1672
+ for (auto& file_ptr : meta.GetFiles()) {
1673
+ BackupFileInfo& finfo = *file_details.emplace(file_details.end());
1674
+ finfo.relative_filename = file_ptr->filename;
1675
+ finfo.size = file_ptr->size;
1676
+ finfo.directory = dir;
1677
+ uint64_t number;
1678
+ FileType type;
1679
+ bool ok = ParseFileName(file_ptr->filename, &number, &type);
1680
+ if (ok) {
1681
+ finfo.file_number = number;
1682
+ finfo.file_type = type;
1683
+ }
1684
+ // TODO: temperature, file_checksum, file_checksum_func_name
1685
+ }
1686
+ backup_info->name_for_open = GetAbsolutePath(GetPrivateFileRel(id));
1687
+ backup_info->name_for_open.pop_back(); // remove trailing '/'
1688
+ backup_info->env_for_open = meta.GetEnvForOpen();
1689
+ }
1690
+ }
1691
+
1692
+ Status BackupEngineImpl::GetBackupInfo(BackupID backup_id,
1693
+ BackupInfo* backup_info,
1694
+ bool include_file_details) const {
1695
+ assert(initialized_);
1696
+ if (backup_id == kLatestBackupIDMarker) {
1697
+ // Note: Read latest_valid_backup_id_ inside of lock
1698
+ backup_id = latest_valid_backup_id_;
1699
+ }
1700
+ auto corrupt_itr = corrupt_backups_.find(backup_id);
1701
+ if (corrupt_itr != corrupt_backups_.end()) {
1702
+ return Status::Corruption(corrupt_itr->second.first.ToString());
1703
+ }
1704
+ auto backup_itr = backups_.find(backup_id);
1705
+ if (backup_itr == backups_.end()) {
1706
+ return Status::NotFound("Backup not found");
1707
+ }
1708
+ auto& backup = backup_itr->second;
1709
+ if (backup->Empty()) {
1710
+ return Status::NotFound("Backup not found");
1711
+ }
1712
+
1713
+ SetBackupInfoFromBackupMeta(backup_id, *backup, backup_info,
1714
+ include_file_details);
1715
+ return Status::OK();
1716
+ }
1717
+
1718
+ void BackupEngineImpl::GetBackupInfo(std::vector<BackupInfo>* backup_info,
1719
+ bool include_file_details) const {
1720
+ assert(initialized_);
1721
+ backup_info->resize(backups_.size());
1722
+ size_t i = 0;
1723
+ for (auto& backup : backups_) {
1724
+ const BackupMeta& meta = *backup.second;
1725
+ if (!meta.Empty()) {
1726
+ SetBackupInfoFromBackupMeta(backup.first, meta, &backup_info->at(i++),
1727
+ include_file_details);
1728
+ }
1729
+ }
1730
+ }
1731
+
1732
+ void BackupEngineImpl::GetCorruptedBackups(
1733
+ std::vector<BackupID>* corrupt_backup_ids) const {
1734
+ assert(initialized_);
1735
+ corrupt_backup_ids->reserve(corrupt_backups_.size());
1736
+ for (auto& backup : corrupt_backups_) {
1737
+ corrupt_backup_ids->push_back(backup.first);
1738
+ }
1739
+ }
1740
+
1741
+ IOStatus BackupEngineImpl::RestoreDBFromBackup(
1742
+ const RestoreOptions& options, BackupID backup_id,
1743
+ const std::string& db_dir, const std::string& wal_dir) const {
1744
+ assert(initialized_);
1745
+ if (backup_id == kLatestBackupIDMarker) {
1746
+ // Note: Read latest_valid_backup_id_ inside of lock
1747
+ backup_id = latest_valid_backup_id_;
1748
+ }
1749
+ auto corrupt_itr = corrupt_backups_.find(backup_id);
1750
+ if (corrupt_itr != corrupt_backups_.end()) {
1751
+ return corrupt_itr->second.first;
1752
+ }
1753
+ auto backup_itr = backups_.find(backup_id);
1754
+ if (backup_itr == backups_.end()) {
1755
+ return IOStatus::NotFound("Backup not found");
1756
+ }
1757
+ auto& backup = backup_itr->second;
1758
+ if (backup->Empty()) {
1759
+ return IOStatus::NotFound("Backup not found");
1760
+ }
1761
+
1762
+ ROCKS_LOG_INFO(options_.info_log, "Restoring backup id %u\n", backup_id);
1763
+ ROCKS_LOG_INFO(options_.info_log, "keep_log_files: %d\n",
1764
+ static_cast<int>(options.keep_log_files));
1765
+
1766
+ // just in case. Ignore errors
1767
+ db_fs_->CreateDirIfMissing(db_dir, io_options_, nullptr)
1768
+ .PermitUncheckedError();
1769
+ db_fs_->CreateDirIfMissing(wal_dir, io_options_, nullptr)
1770
+ .PermitUncheckedError();
1771
+
1772
+ if (options.keep_log_files) {
1773
+ // delete files in db_dir, but keep all the log files
1774
+ DeleteChildren(db_dir, 1 << kWalFile);
1775
+ // move all the files from archive dir to wal_dir
1776
+ std::string archive_dir = ArchivalDirectory(wal_dir);
1777
+ std::vector<std::string> archive_files;
1778
+ db_fs_->GetChildren(archive_dir, io_options_, &archive_files, nullptr)
1779
+ .PermitUncheckedError(); // ignore errors
1780
+ for (const auto& f : archive_files) {
1781
+ uint64_t number;
1782
+ FileType type;
1783
+ bool ok = ParseFileName(f, &number, &type);
1784
+ if (ok && type == kWalFile) {
1785
+ ROCKS_LOG_INFO(options_.info_log,
1786
+ "Moving log file from archive/ to wal_dir: %s",
1787
+ f.c_str());
1788
+ IOStatus io_s = db_fs_->RenameFile(
1789
+ archive_dir + "/" + f, wal_dir + "/" + f, io_options_, nullptr);
1790
+ if (!io_s.ok()) {
1791
+ // if we can't move log file from archive_dir to wal_dir,
1792
+ // we should fail, since it might mean data loss
1793
+ return io_s;
1794
+ }
1795
+ }
1796
+ }
1797
+ } else {
1798
+ DeleteChildren(wal_dir);
1799
+ DeleteChildren(ArchivalDirectory(wal_dir));
1800
+ DeleteChildren(db_dir);
1801
+ }
1802
+
1803
+ IOStatus io_s;
1804
+ std::vector<RestoreAfterCopyOrCreateWorkItem> restore_items_to_finish;
1805
+ std::string temporary_current_file;
1806
+ std::string final_current_file;
1807
+ std::unique_ptr<FSDirectory> db_dir_for_fsync;
1808
+ std::unique_ptr<FSDirectory> wal_dir_for_fsync;
1809
+
1810
+ for (const auto& file_info : backup->GetFiles()) {
1811
+ const std::string& file = file_info->filename;
1812
+ // 1. get DB filename
1813
+ std::string dst = file_info->GetDbFileName();
1814
+
1815
+ // 2. find the filetype
1816
+ uint64_t number;
1817
+ FileType type;
1818
+ bool ok = ParseFileName(dst, &number, &type);
1819
+ if (!ok) {
1820
+ return IOStatus::Corruption("Backup corrupted: Fail to parse filename " +
1821
+ dst);
1822
+ }
1823
+ // 3. Construct the final path
1824
+ // kWalFile lives in wal_dir and all the rest live in db_dir
1825
+ if (type == kWalFile) {
1826
+ dst = wal_dir + "/" + dst;
1827
+ if (options_.sync && !wal_dir_for_fsync) {
1828
+ io_s = db_fs_->NewDirectory(wal_dir, io_options_, &wal_dir_for_fsync,
1829
+ nullptr);
1830
+ if (!io_s.ok()) {
1831
+ return io_s;
1832
+ }
1833
+ }
1834
+ } else {
1835
+ dst = db_dir + "/" + dst;
1836
+ if (options_.sync && !db_dir_for_fsync) {
1837
+ io_s = db_fs_->NewDirectory(db_dir, io_options_, &db_dir_for_fsync,
1838
+ nullptr);
1839
+ if (!io_s.ok()) {
1840
+ return io_s;
1841
+ }
1842
+ }
1843
+ }
1844
+ // For atomicity, initially restore CURRENT file to a temporary name.
1845
+ // This is useful even without options_.sync e.g. in case the restore
1846
+ // process is interrupted.
1847
+ if (type == kCurrentFile) {
1848
+ final_current_file = dst;
1849
+ dst = temporary_current_file = dst + ".tmp";
1850
+ }
1851
+
1852
+ ROCKS_LOG_INFO(options_.info_log, "Restoring %s to %s\n", file.c_str(),
1853
+ dst.c_str());
1854
+ CopyOrCreateWorkItem copy_or_create_work_item(
1855
+ GetAbsolutePath(file), dst, Temperature::kUnknown /* src_temp */,
1856
+ file_info->temp, "" /* contents */, backup_env_, db_env_,
1857
+ EnvOptions() /* src_env_options */, options_.sync,
1858
+ options_.restore_rate_limiter.get(), 0 /* size_limit */,
1859
+ nullptr /* stats */);
1860
+ RestoreAfterCopyOrCreateWorkItem after_copy_or_create_work_item(
1861
+ copy_or_create_work_item.result.get_future(), file, dst,
1862
+ file_info->checksum_hex);
1863
+ files_to_copy_or_create_.write(std::move(copy_or_create_work_item));
1864
+ restore_items_to_finish.push_back(
1865
+ std::move(after_copy_or_create_work_item));
1866
+ }
1867
+ IOStatus item_io_status;
1868
+ for (auto& item : restore_items_to_finish) {
1869
+ item.result.wait();
1870
+ auto result = item.result.get();
1871
+ item_io_status = result.io_status;
1872
+ // Note: It is possible that both of the following bad-status cases occur
1873
+ // during copying. But, we only return one status.
1874
+ if (!item_io_status.ok()) {
1875
+ io_s = item_io_status;
1876
+ break;
1877
+ } else if (!item.checksum_hex.empty() &&
1878
+ item.checksum_hex != result.checksum_hex) {
1879
+ io_s = IOStatus::Corruption(
1880
+ "While restoring " + item.from_file + " -> " + item.to_file +
1881
+ ": expected checksum is " + item.checksum_hex +
1882
+ " while computed checksum is " + result.checksum_hex);
1883
+ break;
1884
+ }
1885
+ }
1886
+
1887
+ // When enabled, the first FsyncWithDirOptions is to ensure all files are
1888
+ // fully persisted before renaming CURRENT.tmp
1889
+ if (io_s.ok() && db_dir_for_fsync) {
1890
+ ROCKS_LOG_INFO(options_.info_log, "Restore: fsync\n");
1891
+ io_s = db_dir_for_fsync->FsyncWithDirOptions(io_options_, nullptr,
1892
+ DirFsyncOptions());
1893
+ }
1894
+
1895
+ if (io_s.ok() && wal_dir_for_fsync) {
1896
+ io_s = wal_dir_for_fsync->FsyncWithDirOptions(io_options_, nullptr,
1897
+ DirFsyncOptions());
1898
+ }
1899
+
1900
+ if (io_s.ok() && !temporary_current_file.empty()) {
1901
+ ROCKS_LOG_INFO(options_.info_log, "Restore: atomic rename CURRENT.tmp\n");
1902
+ assert(!final_current_file.empty());
1903
+ io_s = db_fs_->RenameFile(temporary_current_file, final_current_file,
1904
+ io_options_, nullptr);
1905
+ }
1906
+
1907
+ if (io_s.ok() && db_dir_for_fsync && !temporary_current_file.empty()) {
1908
+ // Second FsyncWithDirOptions is to ensure the final atomic rename of DB
1909
+ // restore is fully persisted even if power goes out right after restore
1910
+ // operation returns success
1911
+ assert(db_dir_for_fsync);
1912
+ io_s = db_dir_for_fsync->FsyncWithDirOptions(
1913
+ io_options_, nullptr, DirFsyncOptions(final_current_file));
1914
+ }
1915
+
1916
+ ROCKS_LOG_INFO(options_.info_log, "Restoring done -- %s\n",
1917
+ io_s.ToString().c_str());
1918
+ return io_s;
1919
+ }
1920
+
1921
+ IOStatus BackupEngineImpl::VerifyBackup(BackupID backup_id,
1922
+ bool verify_with_checksum) const {
1923
+ assert(initialized_);
1924
+ // Check if backup_id is corrupted, or valid and registered
1925
+ auto corrupt_itr = corrupt_backups_.find(backup_id);
1926
+ if (corrupt_itr != corrupt_backups_.end()) {
1927
+ return corrupt_itr->second.first;
1928
+ }
1929
+
1930
+ auto backup_itr = backups_.find(backup_id);
1931
+ if (backup_itr == backups_.end()) {
1932
+ return IOStatus::NotFound();
1933
+ }
1934
+
1935
+ auto& backup = backup_itr->second;
1936
+ if (backup->Empty()) {
1937
+ return IOStatus::NotFound();
1938
+ }
1939
+
1940
+ ROCKS_LOG_INFO(options_.info_log, "Verifying backup id %u\n", backup_id);
1941
+
1942
+ // Find all existing backup files belong to backup_id
1943
+ std::unordered_map<std::string, uint64_t> curr_abs_path_to_size;
1944
+ for (const auto& rel_dir : {GetPrivateFileRel(backup_id), GetSharedFileRel(),
1945
+ GetSharedFileWithChecksumRel()}) {
1946
+ const auto abs_dir = GetAbsolutePath(rel_dir);
1947
+ // Shared directories allowed to be missing in some cases. Expected but
1948
+ // missing files will be reported a few lines down.
1949
+ ReadChildFileCurrentSizes(abs_dir, backup_fs_, &curr_abs_path_to_size)
1950
+ .PermitUncheckedError();
1951
+ }
1952
+
1953
+ // For all files registered in backup
1954
+ for (const auto& file_info : backup->GetFiles()) {
1955
+ const auto abs_path = GetAbsolutePath(file_info->filename);
1956
+ // check existence of the file
1957
+ if (curr_abs_path_to_size.find(abs_path) == curr_abs_path_to_size.end()) {
1958
+ return IOStatus::NotFound("File missing: " + abs_path);
1959
+ }
1960
+ // verify file size
1961
+ if (file_info->size != curr_abs_path_to_size[abs_path]) {
1962
+ std::string size_info("Expected file size is " +
1963
+ ToString(file_info->size) +
1964
+ " while found file size is " +
1965
+ ToString(curr_abs_path_to_size[abs_path]));
1966
+ return IOStatus::Corruption("File corrupted: File size mismatch for " +
1967
+ abs_path + ": " + size_info);
1968
+ }
1969
+ if (verify_with_checksum && !file_info->checksum_hex.empty()) {
1970
+ // verify file checksum
1971
+ std::string checksum_hex;
1972
+ ROCKS_LOG_INFO(options_.info_log, "Verifying %s checksum...\n",
1973
+ abs_path.c_str());
1974
+ IOStatus io_s = ReadFileAndComputeChecksum(
1975
+ abs_path, backup_fs_, EnvOptions(), 0 /* size_limit */, &checksum_hex,
1976
+ Temperature::kUnknown);
1977
+ if (!io_s.ok()) {
1978
+ return io_s;
1979
+ } else if (file_info->checksum_hex != checksum_hex) {
1980
+ std::string checksum_info(
1981
+ "Expected checksum is " + file_info->checksum_hex +
1982
+ " while computed checksum is " + checksum_hex);
1983
+ return IOStatus::Corruption("File corrupted: Checksum mismatch for " +
1984
+ abs_path + ": " + checksum_info);
1985
+ }
1986
+ }
1987
+ }
1988
+ return IOStatus::OK();
1989
+ }
1990
+
1991
+ IOStatus BackupEngineImpl::CopyOrCreateFile(
1992
+ const std::string& src, const std::string& dst, const std::string& contents,
1993
+ uint64_t size_limit, Env* src_env, Env* dst_env,
1994
+ const EnvOptions& src_env_options, bool sync, RateLimiter* rate_limiter,
1995
+ std::function<void()> progress_callback, Temperature* src_temperature,
1996
+ Temperature dst_temperature, uint64_t* bytes_toward_next_callback,
1997
+ uint64_t* size, std::string* checksum_hex) {
1998
+ assert(src.empty() != contents.empty());
1999
+ IOStatus io_s;
2000
+ std::unique_ptr<FSWritableFile> dst_file;
2001
+ std::unique_ptr<FSSequentialFile> src_file;
2002
+ FileOptions dst_file_options;
2003
+ dst_file_options.use_mmap_writes = false;
2004
+ dst_file_options.temperature = dst_temperature;
2005
+ // TODO:(gzh) maybe use direct reads/writes here if possible
2006
+ if (size != nullptr) {
2007
+ *size = 0;
2008
+ }
2009
+ uint32_t checksum_value = 0;
2010
+
2011
+ // Check if size limit is set. if not, set it to very big number
2012
+ if (size_limit == 0) {
2013
+ size_limit = std::numeric_limits<uint64_t>::max();
2014
+ }
2015
+
2016
+ io_s = dst_env->GetFileSystem()->NewWritableFile(dst, dst_file_options,
2017
+ &dst_file, nullptr);
2018
+ if (io_s.ok() && !src.empty()) {
2019
+ auto src_file_options = FileOptions(src_env_options);
2020
+ src_file_options.temperature = *src_temperature;
2021
+ io_s = src_env->GetFileSystem()->NewSequentialFile(src, src_file_options,
2022
+ &src_file, nullptr);
2023
+ }
2024
+ if (!io_s.ok()) {
2025
+ return io_s;
2026
+ }
2027
+
2028
+ size_t buf_size =
2029
+ rate_limiter ? static_cast<size_t>(rate_limiter->GetSingleBurstBytes())
2030
+ : kDefaultCopyFileBufferSize;
2031
+
2032
+ std::unique_ptr<WritableFileWriter> dest_writer(
2033
+ new WritableFileWriter(std::move(dst_file), dst, dst_file_options));
2034
+ std::unique_ptr<SequentialFileReader> src_reader;
2035
+ std::unique_ptr<char[]> buf;
2036
+ if (!src.empty()) {
2037
+ // Return back current temperature in FileSystem
2038
+ *src_temperature = src_file->GetTemperature();
2039
+
2040
+ src_reader.reset(new SequentialFileReader(std::move(src_file), src));
2041
+ buf.reset(new char[buf_size]);
2042
+ }
2043
+
2044
+ Slice data;
2045
+ do {
2046
+ if (stop_backup_.load(std::memory_order_acquire)) {
2047
+ return status_to_io_status(Status::Incomplete("Backup stopped"));
2048
+ }
2049
+ if (!src.empty()) {
2050
+ size_t buffer_to_read =
2051
+ (buf_size < size_limit) ? buf_size : static_cast<size_t>(size_limit);
2052
+ io_s = src_reader->Read(buffer_to_read, &data, buf.get());
2053
+ if (rate_limiter != nullptr) {
2054
+ rate_limiter->Request(data.size(), Env::IO_LOW, nullptr /* stats */,
2055
+ RateLimiter::OpType::kRead);
2056
+ }
2057
+ *bytes_toward_next_callback += data.size();
2058
+ } else {
2059
+ data = contents;
2060
+ }
2061
+ size_limit -= data.size();
2062
+ TEST_SYNC_POINT_CALLBACK(
2063
+ "BackupEngineImpl::CopyOrCreateFile:CorruptionDuringBackup",
2064
+ (src.length() > 4 && src.rfind(".sst") == src.length() - 4) ? &data
2065
+ : nullptr);
2066
+
2067
+ if (!io_s.ok()) {
2068
+ return io_s;
2069
+ }
2070
+
2071
+ if (size != nullptr) {
2072
+ *size += data.size();
2073
+ }
2074
+ if (checksum_hex != nullptr) {
2075
+ checksum_value = crc32c::Extend(checksum_value, data.data(), data.size());
2076
+ }
2077
+ io_s = dest_writer->Append(data);
2078
+
2079
+ if (rate_limiter != nullptr) {
2080
+ if (!src.empty()) {
2081
+ rate_limiter->Request(data.size(), Env::IO_LOW, nullptr /* stats */,
2082
+ RateLimiter::OpType::kWrite);
2083
+ } else {
2084
+ LoopRateLimitRequestHelper(data.size(), rate_limiter, Env::IO_LOW,
2085
+ nullptr /* stats */,
2086
+ RateLimiter::OpType::kWrite);
2087
+ }
2088
+ }
2089
+ while (*bytes_toward_next_callback >=
2090
+ options_.callback_trigger_interval_size) {
2091
+ *bytes_toward_next_callback -= options_.callback_trigger_interval_size;
2092
+ std::lock_guard<std::mutex> lock(byte_report_mutex_);
2093
+ progress_callback();
2094
+ }
2095
+ } while (io_s.ok() && contents.empty() && data.size() > 0 && size_limit > 0);
2096
+
2097
+ // Convert uint32_t checksum to hex checksum
2098
+ if (checksum_hex != nullptr) {
2099
+ checksum_hex->assign(ChecksumInt32ToHex(checksum_value));
2100
+ }
2101
+
2102
+ if (io_s.ok() && sync) {
2103
+ io_s = dest_writer->Sync(false);
2104
+ }
2105
+ if (io_s.ok()) {
2106
+ io_s = dest_writer->Close();
2107
+ }
2108
+ return io_s;
2109
+ }
2110
+
2111
+ // fname will always start with "/"
2112
+ IOStatus BackupEngineImpl::AddBackupFileWorkItem(
2113
+ std::unordered_set<std::string>& live_dst_paths,
2114
+ std::vector<BackupAfterCopyOrCreateWorkItem>& backup_items_to_finish,
2115
+ BackupID backup_id, bool shared, const std::string& src_dir,
2116
+ const std::string& fname, const EnvOptions& src_env_options,
2117
+ RateLimiter* rate_limiter, FileType file_type, uint64_t size_bytes,
2118
+ Statistics* stats, uint64_t size_limit, bool shared_checksum,
2119
+ std::function<void()> progress_callback, const std::string& contents,
2120
+ const std::string& src_checksum_func_name,
2121
+ const std::string& src_checksum_str, const Temperature src_temperature) {
2122
+ assert(contents.empty() != src_dir.empty());
2123
+
2124
+ std::string src_path = src_dir + "/" + fname;
2125
+ std::string dst_relative;
2126
+ std::string dst_relative_tmp;
2127
+ std::string db_id;
2128
+ std::string db_session_id;
2129
+ // crc32c checksum in hex. empty == unavailable / unknown
2130
+ std::string checksum_hex;
2131
+
2132
+ // Whenever a default checksum function name is passed in, we will compare
2133
+ // the corresponding checksum values after copying. Note that only table and
2134
+ // blob files may have a known checksum function name passed in.
2135
+ //
2136
+ // If no default checksum function name is passed in and db session id is not
2137
+ // available, we will calculate the checksum *before* copying in two cases
2138
+ // (we always calculate checksums when copying or creating for any file types):
2139
+ // a) share_files_with_checksum is true and file type is table;
2140
+ // b) share_table_files is true and the file exists already.
2141
+ //
2142
+ // Step 0: Check if default checksum function name is passed in
2143
+ if (kDbFileChecksumFuncName == src_checksum_func_name) {
2144
+ if (src_checksum_str == kUnknownFileChecksum) {
2145
+ return status_to_io_status(
2146
+ Status::Aborted("Unknown checksum value for " + fname));
2147
+ }
2148
+ checksum_hex = ChecksumStrToHex(src_checksum_str);
2149
+ }
2150
+
2151
+ // Step 1: Prepare the relative path to destination
2152
+ if (shared && shared_checksum) {
2153
+ if (GetNamingNoFlags() != BackupEngineOptions::kLegacyCrc32cAndFileSize &&
2154
+ file_type != kBlobFile) {
2155
+ // Prepare db_session_id to add to the file name
2156
+ // Ignore the returned status
2157
+ // In the failed cases, db_id and db_session_id will be empty
2158
+ GetFileDbIdentities(db_env_, src_env_options, src_path, src_temperature,
2159
+ rate_limiter, &db_id, &db_session_id)
2160
+ .PermitUncheckedError();
2161
+ }
2162
+ // Calculate checksum if checksum and db session id are not available.
2163
+ // If db session id is available, we will not calculate the checksum
2164
+ // since the session id should suffice to avoid file name collision in
2165
+ // the shared_checksum directory.
2166
+ if (checksum_hex.empty() && db_session_id.empty()) {
2167
+ IOStatus io_s = ReadFileAndComputeChecksum(
2168
+ src_path, db_fs_, src_env_options, size_limit, &checksum_hex,
2169
+ src_temperature);
2170
+ if (!io_s.ok()) {
2171
+ return io_s;
2172
+ }
2173
+ }
2174
+ if (size_bytes == port::kMaxUint64) {
2175
+ return IOStatus::NotFound("File missing: " + src_path);
2176
+ }
2177
+ // dst_relative depends on the following conditions:
2178
+ // 1) the naming scheme is kUseDbSessionId,
2179
+ // 2) db_session_id is not empty,
2180
+ // 3) checksum is available in the DB manifest.
2181
+ // If 1,2,3) are satisfied, then dst_relative will be of the form:
2182
+ // shared_checksum/<file_number>_<checksum>_<db_session_id>.sst
2183
+ // If 1,2) are satisfied, then dst_relative will be of the form:
2184
+ // shared_checksum/<file_number>_<db_session_id>.sst
2185
+ // Otherwise, dst_relative is of the form
2186
+ // shared_checksum/<file_number>_<checksum>_<size>.sst
2187
+ //
2188
+ // For blob files, db_session_id is not supported with the blob file format.
2189
+ // It uses original/legacy naming scheme.
2190
+ // dst_relative will be of the form:
2191
+ // shared_checksum/<file_number>_<checksum>_<size>.blob
2192
+ dst_relative = GetSharedFileWithChecksum(fname, checksum_hex, size_bytes,
2193
+ db_session_id);
2194
+ dst_relative_tmp = GetSharedFileWithChecksumRel(dst_relative, true);
2195
+ dst_relative = GetSharedFileWithChecksumRel(dst_relative, false);
2196
+ } else if (shared) {
2197
+ dst_relative_tmp = GetSharedFileRel(fname, true);
2198
+ dst_relative = GetSharedFileRel(fname, false);
2199
+ } else {
2200
+ dst_relative = GetPrivateFileRel(backup_id, false, fname);
2201
+ }
2202
+
2203
+ // We copy into `temp_dest_path` and, once finished, rename it to
2204
+ // `final_dest_path`. This allows files to atomically appear at
2205
+ // `final_dest_path`. We can copy directly to the final path when atomicity
2206
+ // is unnecessary, like for files in private backup directories.
2207
+ const std::string* copy_dest_path;
2208
+ std::string temp_dest_path;
2209
+ std::string final_dest_path = GetAbsolutePath(dst_relative);
2210
+ if (!dst_relative_tmp.empty()) {
2211
+ temp_dest_path = GetAbsolutePath(dst_relative_tmp);
2212
+ copy_dest_path = &temp_dest_path;
2213
+ } else {
2214
+ copy_dest_path = &final_dest_path;
2215
+ }
2216
+
2217
+ // Step 2: Determine whether to copy or not
2218
+ // if it's shared, we also need to check if it exists -- if it does, no need
2219
+ // to copy it again.
2220
+ bool need_to_copy = true;
2221
+ // true if final_dest_path is the same path as another live file
2222
+ const bool same_path =
2223
+ live_dst_paths.find(final_dest_path) != live_dst_paths.end();
2224
+
2225
+ bool file_exists = false;
2226
+ if (shared && !same_path) {
2227
+ // Should be in shared directory but not a live path, check existence in
2228
+ // shared directory
2229
+ IOStatus exist =
2230
+ backup_fs_->FileExists(final_dest_path, io_options_, nullptr);
2231
+ if (exist.ok()) {
2232
+ file_exists = true;
2233
+ } else if (exist.IsNotFound()) {
2234
+ file_exists = false;
2235
+ } else {
2236
+ return exist;
2237
+ }
2238
+ }
2239
+
2240
+ if (!contents.empty()) {
2241
+ need_to_copy = false;
2242
+ } else if (shared && (same_path || file_exists)) {
2243
+ need_to_copy = false;
2244
+ auto find_result = backuped_file_infos_.find(dst_relative);
2245
+ if (find_result == backuped_file_infos_.end() && !same_path) {
2246
+ // file exists but not referenced
2247
+ ROCKS_LOG_INFO(
2248
+ options_.info_log,
2249
+ "%s already present, but not referenced by any backup. We will "
2250
+ "overwrite the file.",
2251
+ fname.c_str());
2252
+ need_to_copy = true;
2253
+ // Defer any failure reporting to when we try to write the file
2254
+ backup_fs_->DeleteFile(final_dest_path, io_options_, nullptr)
2255
+ .PermitUncheckedError();
2256
+ } else {
2257
+ // file exists and referenced
2258
+ if (checksum_hex.empty()) {
2259
+ // same_path should not happen for a standard DB, so OK to
2260
+ // read file contents to check for checksum mismatch between
2261
+ // two files from same DB getting same name.
2262
+ // For compatibility with future meta file that might not have
2263
+ // crc32c checksum available, consider it might be empty, but
2264
+ // we don't currently generate meta file without crc32c checksum.
2265
+ // Therefore we have to read & compute it if we don't have it.
2266
+ if (!same_path && !find_result->second->checksum_hex.empty()) {
2267
+ assert(find_result != backuped_file_infos_.end());
2268
+ // Note: to save I/O on incremental backups, we copy prior known
2269
+ // checksum of the file instead of reading entire file contents
2270
+ // to recompute it.
2271
+ checksum_hex = find_result->second->checksum_hex;
2272
+ // Regarding corruption detection, consider:
2273
+ // (a) the DB file is corrupt (since previous backup) and the backup
2274
+ // file is OK: we failed to detect, but the backup is safe. DB can
2275
+ // be repaired/restored once its corruption is detected.
2276
+ // (b) the backup file is corrupt (since previous backup) and the
2277
+ // db file is OK: we failed to detect, but the backup is corrupt.
2278
+ // CreateNewBackup should support fast incremental backups and
2279
+ // there's no way to support that without reading all the files.
2280
+ // We might add an option for extra checks on incremental backup,
2281
+ // but until then, use VerifyBackups to check existing backup data.
2282
+ // (c) file name collision with legitimately different content.
2283
+ // This is almost inconceivable with a well-generated DB session
2284
+ // ID, but even in that case, we double check the file sizes in
2285
+ // BackupMeta::AddFile.
2286
+ } else {
2287
+ IOStatus io_s = ReadFileAndComputeChecksum(
2288
+ src_path, db_fs_, src_env_options, size_limit, &checksum_hex,
2289
+ src_temperature);
2290
+ if (!io_s.ok()) {
2291
+ return io_s;
2292
+ }
2293
+ }
2294
+ }
2295
+ if (!db_session_id.empty()) {
2296
+ ROCKS_LOG_INFO(options_.info_log,
2297
+ "%s already present, with checksum %s, size %" PRIu64
2298
+ " and DB session identity %s",
2299
+ fname.c_str(), checksum_hex.c_str(), size_bytes,
2300
+ db_session_id.c_str());
2301
+ } else {
2302
+ ROCKS_LOG_INFO(options_.info_log,
2303
+ "%s already present, with checksum %s and size %" PRIu64,
2304
+ fname.c_str(), checksum_hex.c_str(), size_bytes);
2305
+ }
2306
+ }
2307
+ }
2308
+ live_dst_paths.insert(final_dest_path);
2309
+
2310
+ // Step 3: Add work item
2311
+ if (!contents.empty() || need_to_copy) {
2312
+ ROCKS_LOG_INFO(options_.info_log, "Copying %s to %s", fname.c_str(),
2313
+ copy_dest_path->c_str());
2314
+ CopyOrCreateWorkItem copy_or_create_work_item(
2315
+ src_dir.empty() ? "" : src_path, *copy_dest_path, src_temperature,
2316
+ Temperature::kUnknown /*dst_temp*/, contents, db_env_, backup_env_,
2317
+ src_env_options, options_.sync, rate_limiter, size_limit, stats,
2318
+ progress_callback, src_checksum_func_name, checksum_hex, db_id,
2319
+ db_session_id);
2320
+ BackupAfterCopyOrCreateWorkItem after_copy_or_create_work_item(
2321
+ copy_or_create_work_item.result.get_future(), shared, need_to_copy,
2322
+ backup_env_, temp_dest_path, final_dest_path, dst_relative);
2323
+ files_to_copy_or_create_.write(std::move(copy_or_create_work_item));
2324
+ backup_items_to_finish.push_back(std::move(after_copy_or_create_work_item));
2325
+ } else {
2326
+ std::promise<CopyOrCreateResult> promise_result;
2327
+ BackupAfterCopyOrCreateWorkItem after_copy_or_create_work_item(
2328
+ promise_result.get_future(), shared, need_to_copy, backup_env_,
2329
+ temp_dest_path, final_dest_path, dst_relative);
2330
+ backup_items_to_finish.push_back(std::move(after_copy_or_create_work_item));
2331
+ CopyOrCreateResult result;
2332
+ result.io_status = IOStatus::OK();
2333
+ result.size = size_bytes;
2334
+ result.checksum_hex = std::move(checksum_hex);
2335
+ result.db_id = std::move(db_id);
2336
+ result.db_session_id = std::move(db_session_id);
2337
+ promise_result.set_value(std::move(result));
2338
+ }
2339
+ return IOStatus::OK();
2340
+ }
2341
+
2342
+ IOStatus BackupEngineImpl::ReadFileAndComputeChecksum(
2343
+ const std::string& src, const std::shared_ptr<FileSystem>& src_fs,
2344
+ const EnvOptions& src_env_options, uint64_t size_limit,
2345
+ std::string* checksum_hex, const Temperature src_temperature) const {
2346
+ if (checksum_hex == nullptr) {
2347
+ return status_to_io_status(Status::Aborted("Checksum pointer is null"));
2348
+ }
2349
+ uint32_t checksum_value = 0;
2350
+ if (size_limit == 0) {
2351
+ size_limit = std::numeric_limits<uint64_t>::max();
2352
+ }
2353
+
2354
+ std::unique_ptr<SequentialFileReader> src_reader;
2355
+ auto file_options = FileOptions(src_env_options);
2356
+ file_options.temperature = src_temperature;
2357
+ IOStatus io_s = SequentialFileReader::Create(src_fs, src, file_options,
2358
+ &src_reader, nullptr);
2359
+ if (!io_s.ok()) {
2360
+ return io_s;
2361
+ }
2362
+
2363
+ RateLimiter* rate_limiter = options_.backup_rate_limiter.get();
2364
+ size_t buf_size =
2365
+ rate_limiter ? static_cast<size_t>(rate_limiter->GetSingleBurstBytes())
2366
+ : kDefaultCopyFileBufferSize;
2367
+ std::unique_ptr<char[]> buf(new char[buf_size]);
2368
+ Slice data;
2369
+
2370
+ do {
2371
+ if (stop_backup_.load(std::memory_order_acquire)) {
2372
+ return status_to_io_status(Status::Incomplete("Backup stopped"));
2373
+ }
2374
+ size_t buffer_to_read =
2375
+ (buf_size < size_limit) ? buf_size : static_cast<size_t>(size_limit);
2376
+ io_s = src_reader->Read(buffer_to_read, &data, buf.get());
2377
+ if (rate_limiter != nullptr) {
2378
+ rate_limiter->Request(data.size(), Env::IO_LOW, nullptr /* stats */,
2379
+ RateLimiter::OpType::kRead);
2380
+ }
2381
+ if (!io_s.ok()) {
2382
+ return io_s;
2383
+ }
2384
+
2385
+ size_limit -= data.size();
2386
+ checksum_value = crc32c::Extend(checksum_value, data.data(), data.size());
2387
+ } while (data.size() > 0 && size_limit > 0);
2388
+
2389
+ checksum_hex->assign(ChecksumInt32ToHex(checksum_value));
2390
+
2391
+ return io_s;
2392
+ }
2393
+
2394
+ Status BackupEngineImpl::GetFileDbIdentities(
2395
+ Env* src_env, const EnvOptions& src_env_options,
2396
+ const std::string& file_path, Temperature file_temp,
2397
+ RateLimiter* rate_limiter, std::string* db_id, std::string* db_session_id) {
2398
+ assert(db_id != nullptr || db_session_id != nullptr);
2399
+
2400
+ Options options;
2401
+ options.env = src_env;
2402
+ SstFileDumper sst_reader(options, file_path, file_temp,
2403
+ 2 * 1024 * 1024
2404
+ /* readahead_size */,
2405
+ false /* verify_checksum */, false /* output_hex */,
2406
+ false /* decode_blob_index */, src_env_options,
2407
+ true /* silent */);
2408
+
2409
+ const TableProperties* table_properties = nullptr;
2410
+ std::shared_ptr<const TableProperties> tp;
2411
+ Status s = sst_reader.getStatus();
2412
+
2413
+ if (s.ok()) {
2414
+ // Try to get table properties from the table reader of sst_reader
2415
+ if (!sst_reader.ReadTableProperties(&tp).ok()) {
2416
+ // Try to use table properites from the initialization of sst_reader
2417
+ table_properties = sst_reader.GetInitTableProperties();
2418
+ } else {
2419
+ table_properties = tp.get();
2420
+ if (table_properties != nullptr && rate_limiter != nullptr) {
2421
+ // sizeof(*table_properties) is a sufficent but far-from-exact
2422
+ // approximation of read bytes due to metaindex block, std::string
2423
+ // properties and varint compression
2424
+ LoopRateLimitRequestHelper(sizeof(*table_properties), rate_limiter,
2425
+ Env::IO_LOW, nullptr /* stats */,
2426
+ RateLimiter::OpType::kRead);
2427
+ }
2428
+ }
2429
+ } else {
2430
+ ROCKS_LOG_INFO(options_.info_log, "Failed to read %s: %s",
2431
+ file_path.c_str(), s.ToString().c_str());
2432
+ return s;
2433
+ }
2434
+
2435
+ if (table_properties != nullptr) {
2436
+ if (db_id != nullptr) {
2437
+ db_id->assign(table_properties->db_id);
2438
+ }
2439
+ if (db_session_id != nullptr) {
2440
+ db_session_id->assign(table_properties->db_session_id);
2441
+ if (db_session_id->empty()) {
2442
+ s = Status::NotFound("DB session identity not found in " + file_path);
2443
+ ROCKS_LOG_INFO(options_.info_log, "%s", s.ToString().c_str());
2444
+ return s;
2445
+ }
2446
+ }
2447
+ return Status::OK();
2448
+ } else {
2449
+ s = Status::Corruption("Table properties missing in " + file_path);
2450
+ ROCKS_LOG_INFO(options_.info_log, "%s", s.ToString().c_str());
2451
+ return s;
2452
+ }
2453
+ }
2454
+
2455
+ void BackupEngineImpl::LoopRateLimitRequestHelper(
2456
+ const size_t total_bytes_to_request, RateLimiter* rate_limiter,
2457
+ const Env::IOPriority pri, Statistics* stats,
2458
+ const RateLimiter::OpType op_type) {
2459
+ assert(rate_limiter != nullptr);
2460
+ size_t remaining_bytes = total_bytes_to_request;
2461
+ size_t request_bytes = 0;
2462
+ while (remaining_bytes > 0) {
2463
+ request_bytes =
2464
+ std::min(static_cast<size_t>(rate_limiter->GetSingleBurstBytes()),
2465
+ remaining_bytes);
2466
+ rate_limiter->Request(request_bytes, pri, stats, op_type);
2467
+ remaining_bytes -= request_bytes;
2468
+ }
2469
+ }
2470
+
2471
+ void BackupEngineImpl::DeleteChildren(const std::string& dir,
2472
+ uint32_t file_type_filter) const {
2473
+ std::vector<std::string> children;
2474
+ db_fs_->GetChildren(dir, io_options_, &children, nullptr)
2475
+ .PermitUncheckedError(); // ignore errors
2476
+
2477
+ for (const auto& f : children) {
2478
+ uint64_t number;
2479
+ FileType type;
2480
+ bool ok = ParseFileName(f, &number, &type);
2481
+ if (ok && (file_type_filter & (1 << type))) {
2482
+ // don't delete this file
2483
+ continue;
2484
+ }
2485
+ db_fs_->DeleteFile(dir + "/" + f, io_options_, nullptr)
2486
+ .PermitUncheckedError(); // ignore errors
2487
+ }
2488
+ }
2489
+
2490
+ IOStatus BackupEngineImpl::ReadChildFileCurrentSizes(
2491
+ const std::string& dir, const std::shared_ptr<FileSystem>& fs,
2492
+ std::unordered_map<std::string, uint64_t>* result) const {
2493
+ assert(result != nullptr);
2494
+ std::vector<Env::FileAttributes> files_attrs;
2495
+ IOStatus io_status = fs->FileExists(dir, io_options_, nullptr);
2496
+ if (io_status.ok()) {
2497
+ io_status =
2498
+ fs->GetChildrenFileAttributes(dir, io_options_, &files_attrs, nullptr);
2499
+ } else if (io_status.IsNotFound()) {
2500
+ // Insert no entries can be considered success
2501
+ io_status = IOStatus::OK();
2502
+ }
2503
+ const bool slash_needed = dir.empty() || dir.back() != '/';
2504
+ for (const auto& file_attrs : files_attrs) {
2505
+ result->emplace(dir + (slash_needed ? "/" : "") + file_attrs.name,
2506
+ file_attrs.size_bytes);
2507
+ }
2508
+ return io_status;
2509
+ }
2510
+
2511
+ IOStatus BackupEngineImpl::GarbageCollect() {
2512
+ assert(!read_only_);
2513
+
2514
+ // We will make a best effort to remove all garbage even in the presence
2515
+ // of inconsistencies or I/O failures that inhibit finding garbage.
2516
+ IOStatus overall_status = IOStatus::OK();
2517
+ // If all goes well, we don't need another auto-GC this session
2518
+ might_need_garbage_collect_ = false;
2519
+
2520
+ ROCKS_LOG_INFO(options_.info_log, "Starting garbage collection");
2521
+
2522
+ // delete obsolete shared files
2523
+ for (bool with_checksum : {false, true}) {
2524
+ std::vector<std::string> shared_children;
2525
+ {
2526
+ std::string shared_path;
2527
+ if (with_checksum) {
2528
+ shared_path = GetAbsolutePath(GetSharedFileWithChecksumRel());
2529
+ } else {
2530
+ shared_path = GetAbsolutePath(GetSharedFileRel());
2531
+ }
2532
+ IOStatus io_s = backup_fs_->FileExists(shared_path, io_options_, nullptr);
2533
+ if (io_s.ok()) {
2534
+ io_s = backup_fs_->GetChildren(shared_path, io_options_,
2535
+ &shared_children, nullptr);
2536
+ } else if (io_s.IsNotFound()) {
2537
+ io_s = IOStatus::OK();
2538
+ }
2539
+ if (!io_s.ok()) {
2540
+ overall_status = io_s;
2541
+ // Trying again later might work
2542
+ might_need_garbage_collect_ = true;
2543
+ }
2544
+ }
2545
+ for (auto& child : shared_children) {
2546
+ std::string rel_fname;
2547
+ if (with_checksum) {
2548
+ rel_fname = GetSharedFileWithChecksumRel(child);
2549
+ } else {
2550
+ rel_fname = GetSharedFileRel(child);
2551
+ }
2552
+ auto child_itr = backuped_file_infos_.find(rel_fname);
2553
+ // if it's not refcounted, delete it
2554
+ if (child_itr == backuped_file_infos_.end() ||
2555
+ child_itr->second->refs == 0) {
2556
+ // this might be a directory, but DeleteFile will just fail in that
2557
+ // case, so we're good
2558
+ IOStatus io_s = backup_fs_->DeleteFile(GetAbsolutePath(rel_fname),
2559
+ io_options_, nullptr);
2560
+ ROCKS_LOG_INFO(options_.info_log, "Deleting %s -- %s",
2561
+ rel_fname.c_str(), io_s.ToString().c_str());
2562
+ backuped_file_infos_.erase(rel_fname);
2563
+ if (!io_s.ok()) {
2564
+ // Trying again later might work
2565
+ might_need_garbage_collect_ = true;
2566
+ }
2567
+ }
2568
+ }
2569
+ }
2570
+
2571
+ // delete obsolete private files
2572
+ std::vector<std::string> private_children;
2573
+ {
2574
+ IOStatus io_s =
2575
+ backup_fs_->GetChildren(GetAbsolutePath(kPrivateDirName), io_options_,
2576
+ &private_children, nullptr);
2577
+ if (!io_s.ok()) {
2578
+ overall_status = io_s;
2579
+ // Trying again later might work
2580
+ might_need_garbage_collect_ = true;
2581
+ }
2582
+ }
2583
+ for (auto& child : private_children) {
2584
+ BackupID backup_id = 0;
2585
+ bool tmp_dir = child.find(".tmp") != std::string::npos;
2586
+ sscanf(child.c_str(), "%u", &backup_id);
2587
+ if (!tmp_dir && // if it's tmp_dir, delete it
2588
+ (backup_id == 0 || backups_.find(backup_id) != backups_.end())) {
2589
+ // it's either not a number or it's still alive. continue
2590
+ continue;
2591
+ }
2592
+ // here we have to delete the dir and all its children
2593
+ std::string full_private_path =
2594
+ GetAbsolutePath(GetPrivateFileRel(backup_id));
2595
+ std::vector<std::string> subchildren;
2596
+ if (backup_fs_
2597
+ ->GetChildren(full_private_path, io_options_, &subchildren, nullptr)
2598
+ .ok()) {
2599
+ for (auto& subchild : subchildren) {
2600
+ IOStatus io_s = backup_fs_->DeleteFile(full_private_path + subchild,
2601
+ io_options_, nullptr);
2602
+ ROCKS_LOG_INFO(options_.info_log, "Deleting %s -- %s",
2603
+ (full_private_path + subchild).c_str(),
2604
+ io_s.ToString().c_str());
2605
+ if (!io_s.ok()) {
2606
+ // Trying again later might work
2607
+ might_need_garbage_collect_ = true;
2608
+ }
2609
+ }
2610
+ }
2611
+ // finally delete the private dir
2612
+ IOStatus io_s =
2613
+ backup_fs_->DeleteDir(full_private_path, io_options_, nullptr);
2614
+ ROCKS_LOG_INFO(options_.info_log, "Deleting dir %s -- %s",
2615
+ full_private_path.c_str(), io_s.ToString().c_str());
2616
+ if (!io_s.ok()) {
2617
+ // Trying again later might work
2618
+ might_need_garbage_collect_ = true;
2619
+ }
2620
+ }
2621
+
2622
+ assert(overall_status.ok() || might_need_garbage_collect_);
2623
+ return overall_status;
2624
+ }
2625
+
2626
+ // ------- BackupMeta class --------
2627
+
2628
+ IOStatus BackupEngineImpl::BackupMeta::AddFile(
2629
+ std::shared_ptr<FileInfo> file_info) {
2630
+ auto itr = file_infos_->find(file_info->filename);
2631
+ if (itr == file_infos_->end()) {
2632
+ auto ret = file_infos_->insert({file_info->filename, file_info});
2633
+ if (ret.second) {
2634
+ itr = ret.first;
2635
+ itr->second->refs = 1;
2636
+ } else {
2637
+ // if this happens, something is seriously wrong
2638
+ return IOStatus::Corruption("In memory metadata insertion error");
2639
+ }
2640
+ } else {
2641
+ // Compare sizes, because we scanned that off the filesystem on both
2642
+ // ends. This is like a check in VerifyBackup.
2643
+ if (itr->second->size != file_info->size) {
2644
+ std::string msg = "Size mismatch for existing backup file: ";
2645
+ msg.append(file_info->filename);
2646
+ msg.append(" Size in backup is " + ToString(itr->second->size) +
2647
+ " while size in DB is " + ToString(file_info->size));
2648
+ msg.append(
2649
+ " If this DB file checks as not corrupt, try deleting old"
2650
+ " backups or backing up to a different backup directory.");
2651
+ return IOStatus::Corruption(msg);
2652
+ }
2653
+ if (file_info->checksum_hex.empty()) {
2654
+ // No checksum available to check
2655
+ } else if (itr->second->checksum_hex.empty()) {
2656
+ // Remember checksum if newly acquired
2657
+ itr->second->checksum_hex = file_info->checksum_hex;
2658
+ } else if (itr->second->checksum_hex != file_info->checksum_hex) {
2659
+ // Note: to save I/O, these will be equal trivially on already backed
2660
+ // up files that don't have the checksum in their name. And it should
2661
+ // never fail for files that do have checksum in their name.
2662
+
2663
+ // Should never reach here, but produce an appropriate corruption
2664
+ // message in case we do in a release build.
2665
+ assert(false);
2666
+ std::string msg = "Checksum mismatch for existing backup file: ";
2667
+ msg.append(file_info->filename);
2668
+ msg.append(" Expected checksum is " + itr->second->checksum_hex +
2669
+ " while computed checksum is " + file_info->checksum_hex);
2670
+ msg.append(
2671
+ " If this DB file checks as not corrupt, try deleting old"
2672
+ " backups or backing up to a different backup directory.");
2673
+ return IOStatus::Corruption(msg);
2674
+ }
2675
+ ++itr->second->refs; // increase refcount if already present
2676
+ }
2677
+
2678
+ size_ += file_info->size;
2679
+ files_.push_back(itr->second);
2680
+
2681
+ return IOStatus::OK();
2682
+ }
2683
+
2684
+ IOStatus BackupEngineImpl::BackupMeta::Delete(bool delete_meta) {
2685
+ IOStatus io_s;
2686
+ for (const auto& file : files_) {
2687
+ --file->refs; // decrease refcount
2688
+ }
2689
+ files_.clear();
2690
+ // delete meta file
2691
+ if (delete_meta) {
2692
+ io_s = fs_->FileExists(meta_filename_, iooptions_, nullptr);
2693
+ if (io_s.ok()) {
2694
+ io_s = fs_->DeleteFile(meta_filename_, iooptions_, nullptr);
2695
+ } else if (io_s.IsNotFound()) {
2696
+ io_s = IOStatus::OK(); // nothing to delete
2697
+ }
2698
+ }
2699
+ timestamp_ = 0;
2700
+ return io_s;
2701
+ }
2702
+
2703
// String constants of the backup meta file schema (see LoadFromFile).

// Prefix of the optional first line that declares the schema version.
const std::string kSchemaVersionPrefix = "schema_version ";
// Line that separates the file entries from the footer fields.
const std::string kFooterMarker = "// FOOTER";

// Top-level meta field holding the hex-encoded application metadata.
const std::string kAppMetaDataFieldName = "metadata";

// Per-file field names.
// WART: The checksums are crc32c but named "crc32"
const std::string kFileCrc32cFieldName = "crc32";
const std::string kFileSizeFieldName = "size";
const std::string kTemperatureFieldName = "temp";

// Marks a (future) field that should cause failure if not recognized.
// Other fields are assumed to be ignorable. For example, in the future
// we might add
//   ni::file_name_escape uri_percent
// to indicate all file names have had spaces and special characters
// escaped using a URI percent encoding.
const std::string kNonIgnorableFieldPrefix = "ni::";
2721
+
2722
+ // Each backup meta file is of the format (schema version 1):
2723
+ //----------------------------------------------------------
2724
+ // <timestamp>
2725
+ // <seq number>
2726
+ // metadata <metadata> (optional)
2727
+ // <number of files>
2728
+ // <file1> crc32 <crc32c_as_unsigned_decimal>
2729
+ // <file2> crc32 <crc32c_as_unsigned_decimal>
2730
+ // ...
2731
+ //----------------------------------------------------------
2732
+ //
2733
+ // For schema version 2.x (not in public APIs, but
2734
+ // forward-compatibility started):
2735
+ //----------------------------------------------------------
2736
+ // schema_version <ver>
2737
+ // <timestamp>
2738
+ // <seq number>
2739
+ // [<field name> <field data>]
2740
+ // ...
2741
+ // <number of files>
2742
+ // <file1>( <field name> <field data no spaces>)*
2743
+ // <file2>( <field name> <field data no spaces>)*
2744
+ // ...
2745
+ // [// FOOTER]
2746
+ // [<field name> <field data>]
2747
+ // ...
2748
+ //----------------------------------------------------------
2749
+ // where
2750
+ // <ver> ::= [0-9]+([.][0-9]+)?
2751
+ // <field name> ::= [A-Za-z_][A-Za-z_0-9.]+
2752
+ // <field data> is anything but newline
2753
+ // <field data no spaces> is anything but space and newline
2754
+ // Although "// FOOTER" wouldn't strictly be required as a delimiter
2755
+ // given the number of files is included, it is there for parsing
2756
+ // sanity in case of corruption. It is only required if followed
2757
+ // by footer fields, such as a checksum of the meta file (so far).
2758
+ // Unrecognized fields are ignored, to support schema evolution on
2759
+ // non-critical features with forward compatibility. Update schema
2760
+ // major version for breaking changes. Schema minor versions are indicated
2761
+ // only for diagnostic/debugging purposes.
2762
+ //
2763
+ // Fields in schema version 2.0:
2764
+ // * Top-level meta fields:
2765
+ // * Only "metadata" as in schema version 1
2766
+ // * File meta fields:
2767
+ // * "crc32" - a crc32c checksum as in schema version 1
2768
+ // * "size" - the size of the file (new)
2769
+ // * Footer meta fields:
2770
+ // * None yet (future use for meta file checksum anticipated)
2771
+ //
2772
+ IOStatus BackupEngineImpl::BackupMeta::LoadFromFile(
2773
+ const std::string& backup_dir,
2774
+ const std::unordered_map<std::string, uint64_t>& abs_path_to_size,
2775
+ RateLimiter* rate_limiter, Logger* info_log,
2776
+ std::unordered_set<std::string>* reported_ignored_fields) {
2777
+ assert(reported_ignored_fields);
2778
+ assert(Empty());
2779
+
2780
+ std::unique_ptr<LineFileReader> backup_meta_reader;
2781
+ {
2782
+ IOStatus io_s = LineFileReader::Create(fs_, meta_filename_, FileOptions(),
2783
+ &backup_meta_reader, nullptr);
2784
+ if (!io_s.ok()) {
2785
+ return io_s;
2786
+ }
2787
+ }
2788
+
2789
+ // If we don't read an explicit schema_version, that implies version 1,
2790
+ // which is what we call the original backup meta schema.
2791
+ int schema_major_version = 1;
2792
+
2793
+ // Failures handled at the end
2794
+ std::string line;
2795
+ if (backup_meta_reader->ReadLine(&line)) {
2796
+ if (rate_limiter != nullptr) {
2797
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2798
+ nullptr /* stats */,
2799
+ RateLimiter::OpType::kRead);
2800
+ }
2801
+ if (StartsWith(line, kSchemaVersionPrefix)) {
2802
+ std::string ver = line.substr(kSchemaVersionPrefix.size());
2803
+ if (ver == "2" || StartsWith(ver, "2.")) {
2804
+ schema_major_version = 2;
2805
+ } else {
2806
+ return IOStatus::NotSupported(
2807
+ "Unsupported/unrecognized schema version: " + ver);
2808
+ }
2809
+ line.clear();
2810
+ } else if (line.empty()) {
2811
+ return IOStatus::Corruption("Unexpected empty line");
2812
+ }
2813
+ }
2814
+ if (!line.empty()) {
2815
+ timestamp_ = std::strtoull(line.c_str(), nullptr, /*base*/ 10);
2816
+ } else if (backup_meta_reader->ReadLine(&line)) {
2817
+ if (rate_limiter != nullptr) {
2818
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2819
+ nullptr /* stats */,
2820
+ RateLimiter::OpType::kRead);
2821
+ }
2822
+ timestamp_ = std::strtoull(line.c_str(), nullptr, /*base*/ 10);
2823
+ }
2824
+ if (backup_meta_reader->ReadLine(&line)) {
2825
+ if (rate_limiter != nullptr) {
2826
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2827
+ nullptr /* stats */,
2828
+ RateLimiter::OpType::kRead);
2829
+ }
2830
+ sequence_number_ = std::strtoull(line.c_str(), nullptr, /*base*/ 10);
2831
+ }
2832
+ uint32_t num_files = UINT32_MAX;
2833
+ while (backup_meta_reader->ReadLine(&line)) {
2834
+ if (rate_limiter != nullptr) {
2835
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2836
+ nullptr /* stats */,
2837
+ RateLimiter::OpType::kRead);
2838
+ }
2839
+ if (line.empty()) {
2840
+ return IOStatus::Corruption("Unexpected empty line");
2841
+ }
2842
+ // Number -> number of files -> exit loop reading optional meta fields
2843
+ if (line[0] >= '0' && line[0] <= '9') {
2844
+ num_files = static_cast<uint32_t>(strtoul(line.c_str(), nullptr, 10));
2845
+ break;
2846
+ }
2847
+ // else, must be a meta field assignment
2848
+ auto space_pos = line.find_first_of(' ');
2849
+ if (space_pos == std::string::npos) {
2850
+ return IOStatus::Corruption("Expected number of files or meta field");
2851
+ }
2852
+ std::string field_name = line.substr(0, space_pos);
2853
+ std::string field_data = line.substr(space_pos + 1);
2854
+ if (field_name == kAppMetaDataFieldName) {
2855
+ // app metadata present
2856
+ bool decode_success = Slice(field_data).DecodeHex(&app_metadata_);
2857
+ if (!decode_success) {
2858
+ return IOStatus::Corruption(
2859
+ "Failed to decode stored hex encoded app metadata");
2860
+ }
2861
+ } else if (schema_major_version < 2) {
2862
+ return IOStatus::Corruption("Expected number of files or \"" +
2863
+ kAppMetaDataFieldName + "\" field");
2864
+ } else if (StartsWith(field_name, kNonIgnorableFieldPrefix)) {
2865
+ return IOStatus::NotSupported("Unrecognized non-ignorable meta field " +
2866
+ field_name + " (from future version?)");
2867
+ } else {
2868
+ // Warn the first time we see any particular unrecognized meta field
2869
+ if (reported_ignored_fields->insert("meta:" + field_name).second) {
2870
+ ROCKS_LOG_WARN(info_log, "Ignoring unrecognized backup meta field %s",
2871
+ field_name.c_str());
2872
+ }
2873
+ }
2874
+ }
2875
+ std::vector<std::shared_ptr<FileInfo>> files;
2876
+ bool footer_present = false;
2877
+ while (backup_meta_reader->ReadLine(&line)) {
2878
+ if (rate_limiter != nullptr) {
2879
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2880
+ nullptr /* stats */,
2881
+ RateLimiter::OpType::kRead);
2882
+ }
2883
+ std::vector<std::string> components = StringSplit(line, ' ');
2884
+
2885
+ if (components.size() < 1) {
2886
+ return IOStatus::Corruption("Empty line instead of file entry.");
2887
+ }
2888
+ if (schema_major_version >= 2 && components.size() == 2 &&
2889
+ line == kFooterMarker) {
2890
+ footer_present = true;
2891
+ break;
2892
+ }
2893
+
2894
+ const std::string& filename = components[0];
2895
+
2896
+ uint64_t actual_size;
2897
+ const std::shared_ptr<FileInfo> file_info = GetFile(filename);
2898
+ if (file_info) {
2899
+ actual_size = file_info->size;
2900
+ } else {
2901
+ std::string abs_path = backup_dir + "/" + filename;
2902
+ auto e = abs_path_to_size.find(abs_path);
2903
+ if (e == abs_path_to_size.end()) {
2904
+ return IOStatus::Corruption(
2905
+ "Pathname in meta file not found on disk: " + abs_path);
2906
+ }
2907
+ actual_size = e->second;
2908
+ }
2909
+
2910
+ if (schema_major_version >= 2) {
2911
+ if (components.size() % 2 != 1) {
2912
+ return IOStatus::Corruption(
2913
+ "Bad number of line components for file entry.");
2914
+ }
2915
+ } else {
2916
+ // Check restricted original schema
2917
+ if (components.size() < 3) {
2918
+ return IOStatus::Corruption("File checksum is missing for " + filename +
2919
+ " in " + meta_filename_);
2920
+ }
2921
+ if (components[1] != kFileCrc32cFieldName) {
2922
+ return IOStatus::Corruption("Unknown checksum type for " + filename +
2923
+ " in " + meta_filename_);
2924
+ }
2925
+ if (components.size() > 3) {
2926
+ return IOStatus::Corruption("Extra data for entry " + filename +
2927
+ " in " + meta_filename_);
2928
+ }
2929
+ }
2930
+
2931
+ std::string checksum_hex;
2932
+ Temperature temp = Temperature::kUnknown;
2933
+ for (unsigned i = 1; i < components.size(); i += 2) {
2934
+ const std::string& field_name = components[i];
2935
+ const std::string& field_data = components[i + 1];
2936
+
2937
+ if (field_name == kFileCrc32cFieldName) {
2938
+ uint32_t checksum_value =
2939
+ static_cast<uint32_t>(strtoul(field_data.c_str(), nullptr, 10));
2940
+ if (field_data != ROCKSDB_NAMESPACE::ToString(checksum_value)) {
2941
+ return IOStatus::Corruption("Invalid checksum value for " + filename +
2942
+ " in " + meta_filename_);
2943
+ }
2944
+ checksum_hex = ChecksumInt32ToHex(checksum_value);
2945
+ } else if (field_name == kFileSizeFieldName) {
2946
+ uint64_t ex_size =
2947
+ std::strtoull(field_data.c_str(), nullptr, /*base*/ 10);
2948
+ if (ex_size != actual_size) {
2949
+ return IOStatus::Corruption(
2950
+ "For file " + filename + " expected size " + ToString(ex_size) +
2951
+ " but found size" + ToString(actual_size));
2952
+ }
2953
+ } else if (field_name == kTemperatureFieldName) {
2954
+ auto iter = temperature_string_map.find(field_data);
2955
+ if (iter != temperature_string_map.end()) {
2956
+ temp = iter->second;
2957
+ } else {
2958
+ // Could report corruption, but in case of new temperatures added
2959
+ // in future, letting those map to kUnknown which should generally
2960
+ // be safe.
2961
+ temp = Temperature::kUnknown;
2962
+ }
2963
+ } else if (StartsWith(field_name, kNonIgnorableFieldPrefix)) {
2964
+ return IOStatus::NotSupported("Unrecognized non-ignorable file field " +
2965
+ field_name + " (from future version?)");
2966
+ } else {
2967
+ // Warn the first time we see any particular unrecognized file field
2968
+ if (reported_ignored_fields->insert("file:" + field_name).second) {
2969
+ ROCKS_LOG_WARN(info_log, "Ignoring unrecognized backup file field %s",
2970
+ field_name.c_str());
2971
+ }
2972
+ }
2973
+ }
2974
+
2975
+ files.emplace_back(new FileInfo(filename, actual_size, checksum_hex,
2976
+ /*id*/ "", /*sid*/ "", temp));
2977
+ }
2978
+
2979
+ if (footer_present) {
2980
+ assert(schema_major_version >= 2);
2981
+ while (backup_meta_reader->ReadLine(&line)) {
2982
+ if (rate_limiter != nullptr) {
2983
+ LoopRateLimitRequestHelper(line.size(), rate_limiter, Env::IO_LOW,
2984
+ nullptr /* stats */,
2985
+ RateLimiter::OpType::kRead);
2986
+ }
2987
+ if (line.empty()) {
2988
+ return IOStatus::Corruption("Unexpected empty line");
2989
+ }
2990
+ auto space_pos = line.find_first_of(' ');
2991
+ if (space_pos == std::string::npos) {
2992
+ return IOStatus::Corruption("Expected footer field");
2993
+ }
2994
+ std::string field_name = line.substr(0, space_pos);
2995
+ std::string field_data = line.substr(space_pos + 1);
2996
+ if (StartsWith(field_name, kNonIgnorableFieldPrefix)) {
2997
+ return IOStatus::NotSupported("Unrecognized non-ignorable field " +
2998
+ field_name + " (from future version?)");
2999
+ } else if (reported_ignored_fields->insert("footer:" + field_name)
3000
+ .second) {
3001
+ // Warn the first time we see any particular unrecognized footer field
3002
+ ROCKS_LOG_WARN(info_log,
3003
+ "Ignoring unrecognized backup meta footer field %s",
3004
+ field_name.c_str());
3005
+ }
3006
+ }
3007
+ }
3008
+
3009
+ {
3010
+ IOStatus io_s = backup_meta_reader->GetStatus();
3011
+ if (!io_s.ok()) {
3012
+ return io_s;
3013
+ }
3014
+ }
3015
+
3016
+ if (num_files != files.size()) {
3017
+ return IOStatus::Corruption(
3018
+ "Inconsistent number of files or missing/incomplete header in " +
3019
+ meta_filename_);
3020
+ }
3021
+
3022
+ files_.reserve(files.size());
3023
+ for (const auto& file_info : files) {
3024
+ IOStatus io_s = AddFile(file_info);
3025
+ if (!io_s.ok()) {
3026
+ return io_s;
3027
+ }
3028
+ }
3029
+
3030
+ return IOStatus::OK();
3031
+ }
3032
+
3033
// Full version string written for each schema major version, indexed by
// major version. An empty string means no schema_version line is written.
const std::vector<std::string> minor_version_strings = {
    std::string(),  // invalid major version 0
    std::string(),  // implicit major version 1
    std::string("2.0"),
};
3038
+
3039
+ IOStatus BackupEngineImpl::BackupMeta::StoreToFile(
3040
+ bool sync, int schema_version,
3041
+ const TEST_BackupMetaSchemaOptions* schema_test_options) {
3042
+ if (schema_version < 1) {
3043
+ return IOStatus::InvalidArgument(
3044
+ "BackupEngineOptions::schema_version must be >= 1");
3045
+ }
3046
+ if (schema_version > static_cast<int>(minor_version_strings.size() - 1)) {
3047
+ return IOStatus::NotSupported(
3048
+ "Only BackupEngineOptions::schema_version <= " +
3049
+ ToString(minor_version_strings.size() - 1) + " is supported");
3050
+ }
3051
+ std::string ver = minor_version_strings[schema_version];
3052
+
3053
+ // Need schema_version >= 2 for TEST_BackupMetaSchemaOptions
3054
+ assert(schema_version >= 2 || schema_test_options == nullptr);
3055
+
3056
+ IOStatus io_s;
3057
+ std::unique_ptr<FSWritableFile> backup_meta_file;
3058
+ FileOptions file_options;
3059
+ file_options.use_mmap_writes = false;
3060
+ file_options.use_direct_writes = false;
3061
+ io_s = fs_->NewWritableFile(meta_tmp_filename_, file_options,
3062
+ &backup_meta_file, nullptr);
3063
+ if (!io_s.ok()) {
3064
+ return io_s;
3065
+ }
3066
+
3067
+ std::ostringstream buf;
3068
+ if (schema_test_options) {
3069
+ // override for testing
3070
+ ver = schema_test_options->version;
3071
+ }
3072
+ if (!ver.empty()) {
3073
+ assert(schema_version >= 2);
3074
+ buf << kSchemaVersionPrefix << ver << "\n";
3075
+ }
3076
+ buf << static_cast<unsigned long long>(timestamp_) << "\n";
3077
+ buf << sequence_number_ << "\n";
3078
+
3079
+ if (!app_metadata_.empty()) {
3080
+ std::string hex_encoded_metadata =
3081
+ Slice(app_metadata_).ToString(/* hex */ true);
3082
+ buf << kAppMetaDataFieldName << " " << hex_encoded_metadata << "\n";
3083
+ }
3084
+ if (schema_test_options) {
3085
+ for (auto& e : schema_test_options->meta_fields) {
3086
+ buf << e.first << " " << e.second << "\n";
3087
+ }
3088
+ }
3089
+ buf << files_.size() << "\n";
3090
+
3091
+ for (const auto& file : files_) {
3092
+ buf << file->filename;
3093
+ if (schema_test_options == nullptr ||
3094
+ schema_test_options->crc32c_checksums) {
3095
+ // use crc32c for now, switch to something else if needed
3096
+ buf << " " << kFileCrc32cFieldName << " "
3097
+ << ChecksumHexToInt32(file->checksum_hex);
3098
+ }
3099
+ if (schema_version >= 2 && file->temp != Temperature::kUnknown) {
3100
+ buf << " " << kTemperatureFieldName << " "
3101
+ << temperature_to_string[file->temp];
3102
+ }
3103
+ if (schema_test_options && schema_test_options->file_sizes) {
3104
+ buf << " " << kFileSizeFieldName << " " << ToString(file->size);
3105
+ }
3106
+ if (schema_test_options) {
3107
+ for (auto& e : schema_test_options->file_fields) {
3108
+ buf << " " << e.first << " " << e.second;
3109
+ }
3110
+ }
3111
+ buf << "\n";
3112
+ }
3113
+
3114
+ if (schema_test_options && !schema_test_options->footer_fields.empty()) {
3115
+ buf << kFooterMarker << "\n";
3116
+ for (auto& e : schema_test_options->footer_fields) {
3117
+ buf << e.first << " " << e.second << "\n";
3118
+ }
3119
+ }
3120
+
3121
+ io_s = backup_meta_file->Append(Slice(buf.str()), iooptions_, nullptr);
3122
+ IOSTATS_ADD(bytes_written, buf.str().size());
3123
+ if (io_s.ok() && sync) {
3124
+ io_s = backup_meta_file->Sync(iooptions_, nullptr);
3125
+ }
3126
+ if (io_s.ok()) {
3127
+ io_s = backup_meta_file->Close(iooptions_, nullptr);
3128
+ }
3129
+ if (io_s.ok()) {
3130
+ io_s = fs_->RenameFile(meta_tmp_filename_, meta_filename_, iooptions_,
3131
+ nullptr);
3132
+ }
3133
+ return io_s;
3134
+ }
3135
+ } // namespace
3136
+
3137
+ IOStatus BackupEngineReadOnly::Open(const BackupEngineOptions& options,
3138
+ Env* env,
3139
+ BackupEngineReadOnly** backup_engine_ptr) {
3140
+ if (options.destroy_old_data) {
3141
+ return IOStatus::InvalidArgument(
3142
+ "Can't destroy old data with ReadOnly BackupEngine");
3143
+ }
3144
+ std::unique_ptr<BackupEngineImplThreadSafe> backup_engine(
3145
+ new BackupEngineImplThreadSafe(options, env, true /*read_only*/));
3146
+ auto s = backup_engine->Initialize();
3147
+ if (!s.ok()) {
3148
+ *backup_engine_ptr = nullptr;
3149
+ return s;
3150
+ }
3151
+ *backup_engine_ptr = backup_engine.release();
3152
+ return IOStatus::OK();
3153
+ }
3154
+
3155
+ void TEST_SetBackupMetaSchemaOptions(
3156
+ BackupEngine* engine, const TEST_BackupMetaSchemaOptions& options) {
3157
+ BackupEngineImplThreadSafe* impl =
3158
+ static_cast_with_check<BackupEngineImplThreadSafe>(engine);
3159
+ impl->TEST_SetBackupMetaSchemaOptions(options);
3160
+ }
3161
+
3162
+ } // namespace ROCKSDB_NAMESPACE
3163
+
3164
+ #endif // ROCKSDB_LITE