tigerbeetle 0.0.34 → 0.0.37

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (249) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +10 -0
  3. data/ext/tb_client/extconf.rb +13 -13
  4. data/ext/tb_client/tigerbeetle/LICENSE +177 -0
  5. data/ext/tb_client/tigerbeetle/build.zig +2327 -0
  6. data/ext/tb_client/tigerbeetle/src/aof.zig +1000 -0
  7. data/ext/tb_client/tigerbeetle/src/build_multiversion.zig +808 -0
  8. data/ext/tb_client/tigerbeetle/src/cdc/amqp/protocol.zig +1283 -0
  9. data/ext/tb_client/tigerbeetle/src/cdc/amqp/spec.zig +1704 -0
  10. data/ext/tb_client/tigerbeetle/src/cdc/amqp/types.zig +341 -0
  11. data/ext/tb_client/tigerbeetle/src/cdc/amqp.zig +1450 -0
  12. data/ext/tb_client/tigerbeetle/src/cdc/runner.zig +1659 -0
  13. data/ext/tb_client/tigerbeetle/src/clients/c/samples/main.c +406 -0
  14. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client/context.zig +1084 -0
  15. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client/echo_client.zig +286 -0
  16. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client/packet.zig +158 -0
  17. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client/signal.zig +229 -0
  18. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client/signal_fuzz.zig +110 -0
  19. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client.h +386 -0
  20. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client.zig +34 -0
  21. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client_exports.zig +281 -0
  22. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client_header.zig +312 -0
  23. data/ext/tb_client/tigerbeetle/src/clients/c/tb_client_header_test.zig +138 -0
  24. data/ext/tb_client/tigerbeetle/src/clients/c/test.zig +466 -0
  25. data/ext/tb_client/tigerbeetle/src/clients/docs_samples.zig +157 -0
  26. data/ext/tb_client/tigerbeetle/src/clients/docs_types.zig +90 -0
  27. data/ext/tb_client/tigerbeetle/src/clients/dotnet/ci.zig +203 -0
  28. data/ext/tb_client/tigerbeetle/src/clients/dotnet/docs.zig +79 -0
  29. data/ext/tb_client/tigerbeetle/src/clients/dotnet/dotnet_bindings.zig +542 -0
  30. data/ext/tb_client/tigerbeetle/src/clients/go/ci.zig +109 -0
  31. data/ext/tb_client/tigerbeetle/src/clients/go/docs.zig +86 -0
  32. data/ext/tb_client/tigerbeetle/src/clients/go/go_bindings.zig +370 -0
  33. data/ext/tb_client/tigerbeetle/src/clients/go/pkg/native/tb_client.h +386 -0
  34. data/ext/tb_client/tigerbeetle/src/clients/java/ci.zig +167 -0
  35. data/ext/tb_client/tigerbeetle/src/clients/java/docs.zig +126 -0
  36. data/ext/tb_client/tigerbeetle/src/clients/java/java_bindings.zig +996 -0
  37. data/ext/tb_client/tigerbeetle/src/clients/java/src/client.zig +748 -0
  38. data/ext/tb_client/tigerbeetle/src/clients/java/src/jni.zig +3238 -0
  39. data/ext/tb_client/tigerbeetle/src/clients/java/src/jni_tests.zig +1718 -0
  40. data/ext/tb_client/tigerbeetle/src/clients/java/src/jni_thread_cleaner.zig +190 -0
  41. data/ext/tb_client/tigerbeetle/src/clients/node/ci.zig +104 -0
  42. data/ext/tb_client/tigerbeetle/src/clients/node/docs.zig +75 -0
  43. data/ext/tb_client/tigerbeetle/src/clients/node/node.zig +522 -0
  44. data/ext/tb_client/tigerbeetle/src/clients/node/node_bindings.zig +267 -0
  45. data/ext/tb_client/tigerbeetle/src/clients/node/src/c.zig +3 -0
  46. data/ext/tb_client/tigerbeetle/src/clients/node/src/translate.zig +379 -0
  47. data/ext/tb_client/tigerbeetle/src/clients/python/ci.zig +131 -0
  48. data/ext/tb_client/tigerbeetle/src/clients/python/docs.zig +63 -0
  49. data/ext/tb_client/tigerbeetle/src/clients/python/python_bindings.zig +588 -0
  50. data/ext/tb_client/tigerbeetle/src/clients/rust/assets/tb_client.h +386 -0
  51. data/ext/tb_client/tigerbeetle/src/clients/rust/ci.zig +73 -0
  52. data/ext/tb_client/tigerbeetle/src/clients/rust/docs.zig +106 -0
  53. data/ext/tb_client/tigerbeetle/src/clients/rust/rust_bindings.zig +305 -0
  54. data/ext/tb_client/tigerbeetle/src/config.zig +296 -0
  55. data/ext/tb_client/tigerbeetle/src/constants.zig +790 -0
  56. data/ext/tb_client/tigerbeetle/src/copyhound.zig +202 -0
  57. data/ext/tb_client/tigerbeetle/src/counting_allocator.zig +72 -0
  58. data/ext/tb_client/tigerbeetle/src/direction.zig +11 -0
  59. data/ext/tb_client/tigerbeetle/src/docs_website/build.zig +158 -0
  60. data/ext/tb_client/tigerbeetle/src/docs_website/src/content.zig +156 -0
  61. data/ext/tb_client/tigerbeetle/src/docs_website/src/docs.zig +252 -0
  62. data/ext/tb_client/tigerbeetle/src/docs_website/src/file_checker.zig +313 -0
  63. data/ext/tb_client/tigerbeetle/src/docs_website/src/html.zig +87 -0
  64. data/ext/tb_client/tigerbeetle/src/docs_website/src/page_writer.zig +63 -0
  65. data/ext/tb_client/tigerbeetle/src/docs_website/src/redirects.zig +47 -0
  66. data/ext/tb_client/tigerbeetle/src/docs_website/src/search_index_writer.zig +28 -0
  67. data/ext/tb_client/tigerbeetle/src/docs_website/src/service_worker_writer.zig +61 -0
  68. data/ext/tb_client/tigerbeetle/src/docs_website/src/single_page_writer.zig +169 -0
  69. data/ext/tb_client/tigerbeetle/src/docs_website/src/website.zig +46 -0
  70. data/ext/tb_client/tigerbeetle/src/ewah.zig +445 -0
  71. data/ext/tb_client/tigerbeetle/src/ewah_benchmark.zig +128 -0
  72. data/ext/tb_client/tigerbeetle/src/ewah_fuzz.zig +171 -0
  73. data/ext/tb_client/tigerbeetle/src/fuzz_tests.zig +179 -0
  74. data/ext/tb_client/tigerbeetle/src/integration_tests.zig +662 -0
  75. data/ext/tb_client/tigerbeetle/src/io/common.zig +155 -0
  76. data/ext/tb_client/tigerbeetle/src/io/darwin.zig +1093 -0
  77. data/ext/tb_client/tigerbeetle/src/io/linux.zig +1880 -0
  78. data/ext/tb_client/tigerbeetle/src/io/test.zig +1005 -0
  79. data/ext/tb_client/tigerbeetle/src/io/windows.zig +1598 -0
  80. data/ext/tb_client/tigerbeetle/src/io.zig +34 -0
  81. data/ext/tb_client/tigerbeetle/src/iops.zig +134 -0
  82. data/ext/tb_client/tigerbeetle/src/list.zig +236 -0
  83. data/ext/tb_client/tigerbeetle/src/lsm/binary_search.zig +848 -0
  84. data/ext/tb_client/tigerbeetle/src/lsm/binary_search_benchmark.zig +179 -0
  85. data/ext/tb_client/tigerbeetle/src/lsm/cache_map.zig +424 -0
  86. data/ext/tb_client/tigerbeetle/src/lsm/cache_map_fuzz.zig +420 -0
  87. data/ext/tb_client/tigerbeetle/src/lsm/compaction.zig +2117 -0
  88. data/ext/tb_client/tigerbeetle/src/lsm/composite_key.zig +182 -0
  89. data/ext/tb_client/tigerbeetle/src/lsm/forest.zig +1119 -0
  90. data/ext/tb_client/tigerbeetle/src/lsm/forest_fuzz.zig +1102 -0
  91. data/ext/tb_client/tigerbeetle/src/lsm/forest_table_iterator.zig +200 -0
  92. data/ext/tb_client/tigerbeetle/src/lsm/groove.zig +1495 -0
  93. data/ext/tb_client/tigerbeetle/src/lsm/k_way_merge.zig +739 -0
  94. data/ext/tb_client/tigerbeetle/src/lsm/k_way_merge_benchmark.zig +166 -0
  95. data/ext/tb_client/tigerbeetle/src/lsm/manifest.zig +754 -0
  96. data/ext/tb_client/tigerbeetle/src/lsm/manifest_level.zig +1294 -0
  97. data/ext/tb_client/tigerbeetle/src/lsm/manifest_level_fuzz.zig +510 -0
  98. data/ext/tb_client/tigerbeetle/src/lsm/manifest_log.zig +1263 -0
  99. data/ext/tb_client/tigerbeetle/src/lsm/manifest_log_fuzz.zig +628 -0
  100. data/ext/tb_client/tigerbeetle/src/lsm/node_pool.zig +247 -0
  101. data/ext/tb_client/tigerbeetle/src/lsm/scan_buffer.zig +116 -0
  102. data/ext/tb_client/tigerbeetle/src/lsm/scan_builder.zig +543 -0
  103. data/ext/tb_client/tigerbeetle/src/lsm/scan_fuzz.zig +938 -0
  104. data/ext/tb_client/tigerbeetle/src/lsm/scan_lookup.zig +293 -0
  105. data/ext/tb_client/tigerbeetle/src/lsm/scan_merge.zig +362 -0
  106. data/ext/tb_client/tigerbeetle/src/lsm/scan_range.zig +99 -0
  107. data/ext/tb_client/tigerbeetle/src/lsm/scan_state.zig +17 -0
  108. data/ext/tb_client/tigerbeetle/src/lsm/scan_tree.zig +1036 -0
  109. data/ext/tb_client/tigerbeetle/src/lsm/schema.zig +617 -0
  110. data/ext/tb_client/tigerbeetle/src/lsm/scratch_memory.zig +84 -0
  111. data/ext/tb_client/tigerbeetle/src/lsm/segmented_array.zig +1500 -0
  112. data/ext/tb_client/tigerbeetle/src/lsm/segmented_array_benchmark.zig +149 -0
  113. data/ext/tb_client/tigerbeetle/src/lsm/segmented_array_fuzz.zig +7 -0
  114. data/ext/tb_client/tigerbeetle/src/lsm/set_associative_cache.zig +865 -0
  115. data/ext/tb_client/tigerbeetle/src/lsm/table.zig +607 -0
  116. data/ext/tb_client/tigerbeetle/src/lsm/table_memory.zig +843 -0
  117. data/ext/tb_client/tigerbeetle/src/lsm/table_value_iterator.zig +105 -0
  118. data/ext/tb_client/tigerbeetle/src/lsm/timestamp_range.zig +40 -0
  119. data/ext/tb_client/tigerbeetle/src/lsm/tree.zig +630 -0
  120. data/ext/tb_client/tigerbeetle/src/lsm/tree_fuzz.zig +933 -0
  121. data/ext/tb_client/tigerbeetle/src/lsm/zig_zag_merge.zig +557 -0
  122. data/ext/tb_client/tigerbeetle/src/message_buffer.zig +469 -0
  123. data/ext/tb_client/tigerbeetle/src/message_bus.zig +1214 -0
  124. data/ext/tb_client/tigerbeetle/src/message_bus_fuzz.zig +936 -0
  125. data/ext/tb_client/tigerbeetle/src/message_pool.zig +343 -0
  126. data/ext/tb_client/tigerbeetle/src/multiversion.zig +2195 -0
  127. data/ext/tb_client/tigerbeetle/src/queue.zig +390 -0
  128. data/ext/tb_client/tigerbeetle/src/repl/completion.zig +201 -0
  129. data/ext/tb_client/tigerbeetle/src/repl/parser.zig +1356 -0
  130. data/ext/tb_client/tigerbeetle/src/repl/terminal.zig +496 -0
  131. data/ext/tb_client/tigerbeetle/src/repl.zig +1034 -0
  132. data/ext/tb_client/tigerbeetle/src/scripts/amqp.zig +973 -0
  133. data/ext/tb_client/tigerbeetle/src/scripts/cfo.zig +1866 -0
  134. data/ext/tb_client/tigerbeetle/src/scripts/changelog.zig +304 -0
  135. data/ext/tb_client/tigerbeetle/src/scripts/ci.zig +227 -0
  136. data/ext/tb_client/tigerbeetle/src/scripts/client_readmes.zig +658 -0
  137. data/ext/tb_client/tigerbeetle/src/scripts/devhub.zig +466 -0
  138. data/ext/tb_client/tigerbeetle/src/scripts/release.zig +1058 -0
  139. data/ext/tb_client/tigerbeetle/src/scripts.zig +105 -0
  140. data/ext/tb_client/tigerbeetle/src/shell.zig +1195 -0
  141. data/ext/tb_client/tigerbeetle/src/stack.zig +260 -0
  142. data/ext/tb_client/tigerbeetle/src/state_machine/auditor.zig +911 -0
  143. data/ext/tb_client/tigerbeetle/src/state_machine/workload.zig +2079 -0
  144. data/ext/tb_client/tigerbeetle/src/state_machine.zig +4872 -0
  145. data/ext/tb_client/tigerbeetle/src/state_machine_fuzz.zig +288 -0
  146. data/ext/tb_client/tigerbeetle/src/state_machine_tests.zig +3128 -0
  147. data/ext/tb_client/tigerbeetle/src/static_allocator.zig +82 -0
  148. data/ext/tb_client/tigerbeetle/src/stdx/bit_set.zig +157 -0
  149. data/ext/tb_client/tigerbeetle/src/stdx/bounded_array.zig +292 -0
  150. data/ext/tb_client/tigerbeetle/src/stdx/debug.zig +65 -0
  151. data/ext/tb_client/tigerbeetle/src/stdx/flags.zig +1414 -0
  152. data/ext/tb_client/tigerbeetle/src/stdx/mlock.zig +92 -0
  153. data/ext/tb_client/tigerbeetle/src/stdx/prng.zig +677 -0
  154. data/ext/tb_client/tigerbeetle/src/stdx/radix.zig +336 -0
  155. data/ext/tb_client/tigerbeetle/src/stdx/ring_buffer.zig +511 -0
  156. data/ext/tb_client/tigerbeetle/src/stdx/sort_test.zig +112 -0
  157. data/ext/tb_client/tigerbeetle/src/stdx/stdx.zig +1160 -0
  158. data/ext/tb_client/tigerbeetle/src/stdx/testing/low_level_hash_vectors.zig +142 -0
  159. data/ext/tb_client/tigerbeetle/src/stdx/testing/snaptest.zig +361 -0
  160. data/ext/tb_client/tigerbeetle/src/stdx/time_units.zig +275 -0
  161. data/ext/tb_client/tigerbeetle/src/stdx/unshare.zig +295 -0
  162. data/ext/tb_client/tigerbeetle/src/stdx/vendored/aegis.zig +436 -0
  163. data/ext/tb_client/tigerbeetle/src/stdx/windows.zig +48 -0
  164. data/ext/tb_client/tigerbeetle/src/stdx/zipfian.zig +402 -0
  165. data/ext/tb_client/tigerbeetle/src/storage.zig +489 -0
  166. data/ext/tb_client/tigerbeetle/src/storage_fuzz.zig +180 -0
  167. data/ext/tb_client/tigerbeetle/src/testing/bench.zig +146 -0
  168. data/ext/tb_client/tigerbeetle/src/testing/cluster/grid_checker.zig +53 -0
  169. data/ext/tb_client/tigerbeetle/src/testing/cluster/journal_checker.zig +61 -0
  170. data/ext/tb_client/tigerbeetle/src/testing/cluster/manifest_checker.zig +76 -0
  171. data/ext/tb_client/tigerbeetle/src/testing/cluster/message_bus.zig +110 -0
  172. data/ext/tb_client/tigerbeetle/src/testing/cluster/network.zig +412 -0
  173. data/ext/tb_client/tigerbeetle/src/testing/cluster/state_checker.zig +331 -0
  174. data/ext/tb_client/tigerbeetle/src/testing/cluster/storage_checker.zig +458 -0
  175. data/ext/tb_client/tigerbeetle/src/testing/cluster.zig +1198 -0
  176. data/ext/tb_client/tigerbeetle/src/testing/exhaustigen.zig +128 -0
  177. data/ext/tb_client/tigerbeetle/src/testing/fixtures.zig +181 -0
  178. data/ext/tb_client/tigerbeetle/src/testing/fuzz.zig +144 -0
  179. data/ext/tb_client/tigerbeetle/src/testing/id.zig +97 -0
  180. data/ext/tb_client/tigerbeetle/src/testing/io.zig +317 -0
  181. data/ext/tb_client/tigerbeetle/src/testing/marks.zig +126 -0
  182. data/ext/tb_client/tigerbeetle/src/testing/packet_simulator.zig +533 -0
  183. data/ext/tb_client/tigerbeetle/src/testing/reply_sequence.zig +154 -0
  184. data/ext/tb_client/tigerbeetle/src/testing/state_machine.zig +389 -0
  185. data/ext/tb_client/tigerbeetle/src/testing/storage.zig +1247 -0
  186. data/ext/tb_client/tigerbeetle/src/testing/table.zig +249 -0
  187. data/ext/tb_client/tigerbeetle/src/testing/time.zig +98 -0
  188. data/ext/tb_client/tigerbeetle/src/testing/tmp_tigerbeetle.zig +212 -0
  189. data/ext/tb_client/tigerbeetle/src/testing/vortex/constants.zig +26 -0
  190. data/ext/tb_client/tigerbeetle/src/testing/vortex/faulty_network.zig +580 -0
  191. data/ext/tb_client/tigerbeetle/src/testing/vortex/java_driver/ci.zig +39 -0
  192. data/ext/tb_client/tigerbeetle/src/testing/vortex/logged_process.zig +214 -0
  193. data/ext/tb_client/tigerbeetle/src/testing/vortex/rust_driver/ci.zig +34 -0
  194. data/ext/tb_client/tigerbeetle/src/testing/vortex/supervisor.zig +766 -0
  195. data/ext/tb_client/tigerbeetle/src/testing/vortex/workload.zig +543 -0
  196. data/ext/tb_client/tigerbeetle/src/testing/vortex/zig_driver.zig +181 -0
  197. data/ext/tb_client/tigerbeetle/src/tidy.zig +1448 -0
  198. data/ext/tb_client/tigerbeetle/src/tigerbeetle/benchmark_driver.zig +227 -0
  199. data/ext/tb_client/tigerbeetle/src/tigerbeetle/benchmark_load.zig +1069 -0
  200. data/ext/tb_client/tigerbeetle/src/tigerbeetle/cli.zig +1422 -0
  201. data/ext/tb_client/tigerbeetle/src/tigerbeetle/inspect.zig +1658 -0
  202. data/ext/tb_client/tigerbeetle/src/tigerbeetle/inspect_integrity.zig +518 -0
  203. data/ext/tb_client/tigerbeetle/src/tigerbeetle/libtb_client.zig +36 -0
  204. data/ext/tb_client/tigerbeetle/src/tigerbeetle/main.zig +646 -0
  205. data/ext/tb_client/tigerbeetle/src/tigerbeetle.zig +958 -0
  206. data/ext/tb_client/tigerbeetle/src/time.zig +236 -0
  207. data/ext/tb_client/tigerbeetle/src/trace/event.zig +745 -0
  208. data/ext/tb_client/tigerbeetle/src/trace/statsd.zig +462 -0
  209. data/ext/tb_client/tigerbeetle/src/trace.zig +556 -0
  210. data/ext/tb_client/tigerbeetle/src/unit_tests.zig +321 -0
  211. data/ext/tb_client/tigerbeetle/src/vopr.zig +1785 -0
  212. data/ext/tb_client/tigerbeetle/src/vortex.zig +101 -0
  213. data/ext/tb_client/tigerbeetle/src/vsr/checkpoint_trailer.zig +473 -0
  214. data/ext/tb_client/tigerbeetle/src/vsr/checksum.zig +208 -0
  215. data/ext/tb_client/tigerbeetle/src/vsr/checksum_benchmark.zig +43 -0
  216. data/ext/tb_client/tigerbeetle/src/vsr/client.zig +768 -0
  217. data/ext/tb_client/tigerbeetle/src/vsr/client_replies.zig +532 -0
  218. data/ext/tb_client/tigerbeetle/src/vsr/client_sessions.zig +338 -0
  219. data/ext/tb_client/tigerbeetle/src/vsr/clock.zig +1019 -0
  220. data/ext/tb_client/tigerbeetle/src/vsr/fault_detector.zig +279 -0
  221. data/ext/tb_client/tigerbeetle/src/vsr/free_set.zig +1381 -0
  222. data/ext/tb_client/tigerbeetle/src/vsr/free_set_fuzz.zig +315 -0
  223. data/ext/tb_client/tigerbeetle/src/vsr/grid.zig +1460 -0
  224. data/ext/tb_client/tigerbeetle/src/vsr/grid_blocks_missing.zig +757 -0
  225. data/ext/tb_client/tigerbeetle/src/vsr/grid_scrubber.zig +797 -0
  226. data/ext/tb_client/tigerbeetle/src/vsr/journal.zig +2586 -0
  227. data/ext/tb_client/tigerbeetle/src/vsr/marzullo.zig +308 -0
  228. data/ext/tb_client/tigerbeetle/src/vsr/message_header.zig +1777 -0
  229. data/ext/tb_client/tigerbeetle/src/vsr/multi_batch.zig +715 -0
  230. data/ext/tb_client/tigerbeetle/src/vsr/multi_batch_fuzz.zig +185 -0
  231. data/ext/tb_client/tigerbeetle/src/vsr/repair_budget.zig +333 -0
  232. data/ext/tb_client/tigerbeetle/src/vsr/replica.zig +12355 -0
  233. data/ext/tb_client/tigerbeetle/src/vsr/replica_format.zig +416 -0
  234. data/ext/tb_client/tigerbeetle/src/vsr/replica_reformat.zig +165 -0
  235. data/ext/tb_client/tigerbeetle/src/vsr/replica_test.zig +2910 -0
  236. data/ext/tb_client/tigerbeetle/src/vsr/routing.zig +1075 -0
  237. data/ext/tb_client/tigerbeetle/src/vsr/superblock.zig +1603 -0
  238. data/ext/tb_client/tigerbeetle/src/vsr/superblock_fuzz.zig +484 -0
  239. data/ext/tb_client/tigerbeetle/src/vsr/superblock_quorums.zig +405 -0
  240. data/ext/tb_client/tigerbeetle/src/vsr/superblock_quorums_fuzz.zig +355 -0
  241. data/ext/tb_client/tigerbeetle/src/vsr/sync.zig +29 -0
  242. data/ext/tb_client/tigerbeetle/src/vsr.zig +1727 -0
  243. data/lib/tb_client/shared_lib.rb +12 -5
  244. data/lib/tigerbeetle/client.rb +1 -1
  245. data/lib/tigerbeetle/platforms.rb +9 -0
  246. data/lib/tigerbeetle/version.rb +2 -2
  247. data/tigerbeetle.gemspec +22 -5
  248. metadata +242 -3
  249. data/ext/tb_client/pkg.tar.gz +0 -0
@@ -0,0 +1,768 @@
1
+ const std = @import("std");
2
+ const stdx = @import("stdx");
3
+ const mem = std.mem;
4
+ const assert = std.debug.assert;
5
+ const maybe = stdx.maybe;
6
+
7
+ const constants = @import("../constants.zig");
8
+ const vsr = @import("../vsr.zig");
9
+ const Header = vsr.Header;
10
+ const Time = vsr.time.Time;
11
+
12
+ const MessagePool = @import("../message_pool.zig").MessagePool;
13
+ const Message = @import("../message_pool.zig").MessagePool.Message;
14
+ const MessageBuffer = @import("../message_buffer.zig").MessageBuffer;
15
+
16
+ const log = stdx.log.scoped(.client);
17
+
18
+ pub fn ClientType(
19
+ comptime StateMachineOperation: type,
20
+ comptime MessageBus: type,
21
+ ) type {
22
+ return struct {
23
+ const Client = @This();
24
+
25
+ pub const Operation = StateMachineOperation;
26
/// Bookkeeping for the single request the client may have inflight at a time.
pub const Request = struct {
    /// The request message that is inflight.
    message: *Message.Request,
    /// Caller-supplied value stored alongside the callback (both callback signatures
    /// take a `user_data` argument).
    user_data: u128,
    /// Completion callback; which variant is active depends on the request's operation.
    callback: union(enum) {
        /// When message.header.operation ≠ .register
        request: Callback,
        /// When message.header.operation = .register
        register: RegisterCallback,
    },

    /// Signature of the completion callback stored for non-register requests.
    pub const Callback = *const fn (
        user_data: u128,
        operation: vsr.Operation,
        timestamp: u64,
        results: []u8,
    ) void;

    /// Signature of the completion callback stored for the `register` request.
    pub const RegisterCallback = *const fn (
        user_data: u128,
        result: *const vsr.RegisterResult,
    ) void;
};
48
+
49
+ message_bus: MessageBus,
50
+
51
+ time: Time,
52
+
53
+ /// A universally unique identifier for the client (must not be zero).
54
+ /// Used for routing replies back to the client via any network path (multi-path routing).
55
+ /// The client ID must be ephemeral and random per process, and never persisted, so that
56
+ /// lingering or zombie deployment processes cannot break correctness and/or liveness.
57
+ /// A cryptographic random number generator must be used to ensure these properties.
58
+ id: u128,
59
+
60
+ /// The identifier for the cluster that this client intends to communicate with.
61
+ cluster: u128,
62
+
63
+ /// The number of replicas in the cluster.
64
+ replica_count: u8,
65
+
66
+ aof_recovery: bool,
67
+
68
+ /// Only tests should ever override the release.
69
+ release: vsr.Release = constants.config.process.release,
70
+
71
+ /// The total number of ticks elapsed since the client was initialized.
72
+ ticks: u64 = 0,
73
+
74
+ /// We hash-chain request/reply checksums to verify linearizability within a client session:
75
+ /// * so that the parent of the next request is the checksum of the latest reply, and
76
+ /// * so that the parent of the next reply is the checksum of the latest request.
77
+ parent: u128 = 0,
78
+
79
+ /// The session number for the client, zero when registering a session, non-zero thereafter.
80
+ session: u64 = 0,
81
+
82
+ /// The request number of the next request.
83
+ request_number: u32 = 0,
84
+
85
+ /// Measures the time elapsed between sending a request (in `raw_request`) and receiving the
86
+ /// corresponding reply (in `on_reply`).
87
+ request_completion_timer: vsr.time.Timer,
88
+
89
+ /// The maximum body size for `command=request` messages.
90
+ /// Set by the `register`'s reply.
91
+ batch_size_limit: ?u32 = null,
92
+
93
+ /// The highest view number seen by the client in messages exchanged with the cluster. Used
94
+ /// to locate the current primary, and provide more information to a partitioned primary.
95
+ view: u32 = 0,
96
+
97
+ /// Tracks the currently processing request message (register or otherwise) submitted by `register()`
98
+ /// or `raw_request()`.
99
+ request_inflight: ?Request = null,
100
+
101
+ /// The number of ticks without a reply before the client resends the inflight request.
102
+ /// Dynamically adjusted as a function of recent request round-trip time.
103
+ request_timeout: vsr.Timeout,
104
+
105
+ /// The number of ticks before the client broadcasts a ping to the cluster.
106
+ /// Used for end-to-end keepalive, and to discover a new primary between requests.
107
+ ping_timeout: vsr.Timeout,
108
+
109
+ /// The round-trip time (estimated by the latest ping/pong pair) from each replica.
110
+ replica_round_trip_times_ns: [constants.replicas_max]?u64 = @splat(null),
111
+
112
+ /// Used to calculate exponential backoff with random jitter.
113
+ /// Seeded with the client's ID.
114
+ prng: stdx.PRNG,
115
+
116
+ on_reply_context: ?*anyopaque = null,
117
+ /// Used for testing. Called for replies to all operations (including `register`).
118
+ on_reply_callback: ?*const fn (
119
+ client: *Client,
120
+ request: *Message.Request,
121
+ reply: *Message.Reply,
122
+ ) void = null,
123
+
124
+ evicted: bool = false,
125
+ on_eviction_callback: ?*const fn (
126
+ client: *Client,
127
+ eviction: *const Message.Eviction,
128
+ ) void = null,
129
+
130
/// Constructs a client and its message bus, and starts the ping timeout.
///
/// Asserts that `options.id` and `options.replica_count` are both non-zero.
/// Returns any error produced by `MessageBus.init`.
pub fn init(
    allocator: mem.Allocator,
    time: Time,
    message_pool: *MessagePool,
    options: struct {
        id: u128,
        cluster: u128,
        replica_count: u8,
        aof_recovery: bool,
        message_bus_options: MessageBus.Options,
        /// When eviction_callback is null, the client will panic on eviction.
        ///
        /// When eviction_callback is non-null, it must `deinit()` the Client.
        /// After eviction, the client must not send or process any additional messages.
        eviction_callback: ?*const fn (
            client: *Client,
            eviction: *const Message.Eviction,
        ) void = null,
    },
) !Client {
    assert(options.id > 0);
    assert(options.replica_count > 0);

    var bus = try MessageBus.init(
        allocator,
        .{ .client = options.id },
        message_pool,
        Client.on_messages,
        options.message_bus_options,
    );
    errdefer bus.deinit(allocator);

    // The PRNG is seeded from the low 64 bits of the client ID.
    const prng_seed: u64 = @truncate(options.id);

    var client: Client = .{
        .message_bus = bus,
        .time = time,
        .id = options.id,
        .cluster = options.cluster,
        .replica_count = options.replica_count,
        .aof_recovery = options.aof_recovery,
        .request_completion_timer = vsr.time.Timer.init(time),
        .request_timeout = vsr.Timeout{
            .name = "request_timeout",
            .id = options.id,
            .after = constants.rtt_ticks * constants.rtt_multiple,
        },
        .ping_timeout = vsr.Timeout{
            .name = "ping_timeout",
            .id = options.id,
            // Presumably 30 seconds expressed in ticks (assumes `tick_ms` is milliseconds
            // per tick; confirm against `constants`).
            .after = 30000 / constants.tick_ms,
        },
        .prng = stdx.PRNG.from_seed(prng_seed),
        .on_eviction_callback = options.eviction_callback,
    };

    // Only the ping timeout runs from the start; the request timeout is not started here.
    client.ping_timeout.start();

    return client;
}
188
+
189
/// Releases the inflight request message (if there is one), then tears down the message bus.
pub fn deinit(self: *Client, allocator: std.mem.Allocator) void {
    if (self.request_inflight) |pending| {
        self.release_message(pending.message.base());
    }
    self.message_bus.deinit(allocator);
}
193
+
194
/// Message bus callback: drains every complete message from `buffer`.
///
/// A message for a different cluster invalidates the buffer and stops processing.
/// Messages that arrive once the client is evicted are consumed but not dispatched.
pub fn on_messages(message_bus: *MessageBus, buffer: *MessageBuffer) void {
    // Recover the owning client from its embedded `message_bus` field.
    const client: *Client = @fieldParentPtr("message_bus", message_bus);

    while (true) {
        const header = buffer.next_header() orelse break;

        const message = buffer.consume_message(client.message_bus.pool, &header);
        // Drop our reference on every exit path from this iteration.
        defer client.message_bus.unref(message);

        const wrong_cluster = message.header.cluster != client.cluster;
        if (wrong_cluster) {
            buffer.invalidate(.header_cluster);
            return;
        }

        if (client.evicted) continue;
        client.on_message(message);
    }
}
209
+
210
/// Validates a single message and dispatches it by command.
///
/// Messages with an invalid header or the wrong cluster are logged and dropped.
/// Only `pong_client`, `reply` and `eviction` are handled; any other command is
/// logged as misdirected. Must not be called once the client is evicted.
pub fn on_message(self: *Client, message: *Message) void {
    assert(!self.evicted);

    const base_header = message.header;

    // Switch on the header type so that we don't log opaque bytes for the per-command data.
    switch (base_header.into_any()) {
        inline else => |typed_header| {
            log.debug("{}: on_message: {}", .{ self.id, typed_header });
        },
    }

    if (base_header.invalid()) |reason| {
        log.debug("{}: on_message: invalid ({s})", .{ self.id, reason });
        return;
    }

    if (base_header.cluster != self.cluster) {
        log.warn("{}: on_message: wrong cluster (cluster should be {}, not {})", .{
            self.id,
            self.cluster,
            base_header.cluster,
        });
        return;
    }

    switch (message.into_any()) {
        .pong_client => |pong| self.on_pong_client(pong),
        .reply => |reply| self.on_reply(reply),
        .eviction => |eviction| self.on_eviction(eviction),
        else => log.warn("{}: on_message: ignoring misdirected {s} message", .{
            self.id,
            @tagName(base_header.command),
        }),
    }
}
245
+
246
/// Advances the client by one tick.
///
/// Increments `ticks`, ticks the message bus and the time source, ticks both timeouts,
/// and then runs the handler of each timeout that fired (ping first, then request).
/// Must not be called once the client is evicted.
pub fn tick(self: *Client) void {
    assert(!self.evicted);

    self.ticks += 1;

    self.message_bus.tick_client();
    self.time.tick();

    self.ping_timeout.tick();
    self.request_timeout.tick();

    if (self.ping_timeout.fired()) {
        self.on_ping_timeout();
    }
    if (self.request_timeout.fired()) {
        self.on_request_timeout();
    }
}
260
+
261
/// Sends the `register` request that opens a session with the cluster.
///
/// This must be the client's very first request: it asserts that the client is not
/// evicted, that nothing is inflight, and that `request_number` is still zero.
/// `callback` and `user_data` are stored with the inflight request.
pub fn register(self: *Client, callback: Request.RegisterCallback, user_data: u128) void {
    assert(!self.evicted);
    assert(self.request_inflight == null);
    assert(self.request_number == 0);

    const message = self.get_message().build(.request);
    errdefer self.release_message(message.base());

    // We will set parent, session, view and checksums only when sending for the first time:
    message.header.* = .{
        .size = @sizeOf(Header) + @sizeOf(vsr.RegisterRequest),
        .client = self.id,
        .request = self.request_number,
        .cluster = self.cluster,
        .command = .request,
        .operation = .register,
        .release = self.release,
        .previous_request_latency = 0,
        // During AOF recovery, if we were to pass timestamp=0, the primary would assign the
        // timestamp. Instead, we send a fixed bogus timestamp (1), to ensure that AOF
        // recovery is deterministic.
        .timestamp = @intFromBool(self.aof_recovery),
    };

    // Write the register body in place, viewing the used body bytes as a `RegisterRequest`.
    const body_bytes = message.body_used()[0..@sizeOf(vsr.RegisterRequest)];
    const register_request = std.mem.bytesAsValue(vsr.RegisterRequest, body_bytes);
    register_request.* = .{
        .batch_size_limit = 0,
    };

    assert(self.request_number == 0);
    self.request_number += 1;

    log.debug(
        "{}: register: registering a session with the cluster user_data={}",
        .{ self.id, user_data },
    );

    self.request_inflight = .{
        .message = message,
        .user_data = user_data,
        .callback = .{ .register = callback },
    };
    self.send_request_for_the_first_time(message);
}
308
+
309
/// Builds a request message for `operation` carrying `events` as its body, and submits it
/// through `raw_request()`.
///
/// There must be no other request message currently inflight, and the client must not be
/// evicted. `events.len` must not exceed `constants.message_body_size_max` or
/// `batch_size_limit`, and must be a multiple of the operation's event size; all of these
/// are asserted.
pub fn request(
    self: *Client,
    callback: Request.Callback,
    user_data: u128,
    operation: Operation,
    events: []const u8,
) void {
    assert(!self.evicted);
    assert(self.request_inflight == null);
    assert(self.request_number > 0);

    const event_size = operation.event_size();
    assert(events.len <= constants.message_body_size_max);
    assert(events.len <= self.batch_size_limit.?);
    assert(events.len % event_size == 0);

    const message = self.get_message().build(.request);
    errdefer self.release_message(message.base());

    const size_total = @sizeOf(Header) + events.len;
    message.header.* = .{
        .client = self.id,
        .request = 0, // Set inside `raw_request` down below.
        .cluster = self.cluster,
        .command = .request,
        .release = self.release,
        .operation = operation.to_vsr(),
        .size = @intCast(size_total),
        .previous_request_latency = 0,
    };

    // The header's size is already set, so the used body is exactly `events.len` bytes.
    const body = message.body_used();
    stdx.copy_disjoint(.exact, u8, body, events);

    self.raw_request(callback, user_data, message);
}
344
+
345
/// Submits a caller-prepared request message, filling in only the header's request number.
///
/// There must be no other request message currently inflight. The header must already
/// carry this client's id, release and cluster, with `view`, `parent`, `session` and
/// `request` all still zero; these preconditions are asserted below.
pub fn raw_request(
    self: *Client,
    callback: Request.Callback,
    user_data: u128,
    message: *Message.Request,
) void {
    const header = message.header;

    assert(self.request_inflight == null);
    assert(self.request_number > 0);
    assert(header.client == self.id);
    assert(header.release.value == self.release.value);
    assert(header.cluster == self.cluster);
    assert(header.command == .request);
    assert(header.size >= @sizeOf(Header));
    assert(header.size <= constants.message_size_max);
    assert(header.size <= @sizeOf(Header) + self.batch_size_limit.?);
    assert(header.operation.valid(Operation));
    assert(header.view == 0);
    assert(header.parent == 0);
    assert(header.session == 0);
    assert(header.request == 0);
    // A non-zero timestamp is required during AOF recovery and forbidden otherwise.
    assert((header.timestamp == 0) != self.aof_recovery);

    // Outside of AOF recovery, the only VSR-reserved operation allowed here is `.noop`.
    if (!self.aof_recovery) {
        const reserved = header.operation.vsr_reserved();
        assert(header.operation == .noop or !reserved);
    }

    header.request = self.request_number;
    self.request_number += 1;
    self.request_completion_timer.reset();

    log.debug("{}: request: user_data={} request={} size={} {s}", .{
        self.id,
        user_data,
        header.request,
        header.size,
        header.operation.tag_name(Operation),
    });

    self.request_inflight = .{
        .message = message,
        .user_data = user_data,
        .callback = .{ .request = callback },
    };
    self.send_request_for_the_first_time(message);
}
393
+
394
/// Obtains a message from the message bus.
/// The caller must ensure that a message is available.
///
/// The message must then either be handed to `client.raw_request()` or returned with
/// `client.release_message()`; the reference is not guaranteed to be valid after either
/// action.
/// Do NOT use the reference counter function `message.ref()` for storing the message.
pub fn get_message(self: *Client) *Message {
    const message = self.message_bus.get_message(null);
    return message;
}
403
+
404
/// Hands `message` back to the message bus by dropping the caller's reference to it.
pub fn release_message(self: *Client, message: *Message) void {
    const bus = &self.message_bus;
    bus.unref(message);
}
408
+
409
/// Handles an eviction message.
///
/// An eviction addressed to a different client id, or one whose view is older than this
/// client's view, is logged and ignored. Otherwise:
/// - if an eviction callback is registered, the eviction is logged as an error, the client is
///   flagged as evicted, the callback is cleared and then invoked with the eviction;
/// - if no callback is registered, the process panics with the eviction reason.
fn on_eviction(self: *Client, eviction: *const Message.Eviction) void {
    assert(!self.evicted);
    assert(eviction.header.command == .eviction);
    assert(eviction.header.cluster == self.cluster);

    const evicted_client = eviction.header.client;
    if (evicted_client != self.id) {
        log.warn("{}: on_eviction: ignoring (wrong client={})", .{
            self.id,
            evicted_client,
        });
        return;
    }

    const eviction_view = eviction.header.view;
    if (eviction_view < self.view) {
        log.debug("{}: on_eviction: ignoring (older view={})", .{
            self.id,
            eviction_view,
        });
        return;
    }

    // Both guards above have passed, so the eviction is for us and not stale.
    assert(eviction.header.client == self.id);
    assert(eviction.header.view >= self.view);

    const reason = eviction.header.reason;
    const reason_name = std.enums.tagName(vsr.Header.Eviction.Reason, reason);

    // Without a registered callback there is nobody to notify: crash loudly.
    const callback = self.on_eviction_callback orelse
        std.debug.panic("session evicted: {?s} (cluster_release={})", .{
            reason_name,
            eviction.header.release,
        });

    // Extra hint appended to the log line for the release-mismatch reasons only.
    const remedy = switch (reason) {
        .client_release_too_low => " - your client is too old; upgrade to a version " ++
            "compatible with your cluster",
        .client_release_too_high => " - your client is too new; downgrade to the " ++
            "same version as your cluster",
        else => "",
    };
    log.err(
        "{}: session evicted: reason={?s} (cluster_release={}, client_release={}){s}",
        .{
            self.id,
            reason_name,
            eviction.header.release,
            self.release,
            remedy,
        },
    );

    // Mark the client as evicted and clear the callback before invoking it.
    self.evicted = true;
    self.on_eviction_callback = null;
    callback(self, eviction);
}
462
+
463
/// Handles a pong from a replica.
///
/// Adopts the pong's view when it is newer than the client's view, then uses the ping timestamp
/// echoed in the pong to record a round trip time for the sending replica. The request timeout's
/// RTT is then set to the element at index `count / 2` of the sorted known round trip times.
/// If the echoed ping timestamp is ahead of the current monotonic time, nothing is recorded
/// and the regression is only logged.
fn on_pong_client(self: *Client, pong: *const Message.PongClient) void {
    assert(pong.header.command == .pong_client);
    assert(pong.header.cluster == self.cluster);

    const pong_view = pong.header.view;
    if (pong_view > self.view) {
        log.debug("{}: on_pong: newer view={}..{}", .{
            self.id,
            self.view,
            pong_view,
        });
        self.view = pong_view;
        // A request may or may not be in flight at this point. Either way it is deliberately
        // not retransmitted right after the view change: the regular on_request_timeout path
        // handles that, which keeps the thundering herd smaller.
        maybe(self.request_inflight != null);
    }

    const sent_ns = pong.header.ping_timestamp_monotonic;
    const received_ns = self.time.monotonic().ns;
    if (sent_ns > received_ns) {
        log.debug("{}: on_pong: monotonic timestamp regressed {}..{} replica={}", .{
            self.id,
            sent_ns,
            received_ns,
            pong.header.replica,
        });
        return;
    }

    self.replica_round_trip_times_ns[pong.header.replica] = received_ns - sent_ns;

    // Gather every replica round trip time that has been measured so far.
    var samples = stdx.BoundedArrayType(u64, constants.replicas_max){};
    for (self.replica_round_trip_times_ns) |slot| {
        const rtt_ns = slot orelse continue;
        samples.push(rtt_ns);
    }
    std.mem.sort(u64, samples.slice(), {}, std.sort.asc(u64));
    // At least the sample recorded just above must be present.
    assert(samples.count() > 0);

    const median_index = @divFloor(samples.count(), 2);
    self.request_timeout.set_rtt_ns(samples.get(median_index));
}
507
+
508
/// Handles a reply message.
///
/// Replies for another client, replies arriving while no request is in flight, and replies
/// to a request older than the in-flight one are logged and ignored. A matching reply:
/// 1. clears `request_inflight` (before any callback runs, so callbacks may queue a new one),
/// 2. invokes the optional `on_reply_callback`,
/// 3. records the reply's context as `parent` and adopts a newer view if the reply has one,
/// 4. stops the request timeout and releases the request message,
/// 5. invokes the in-flight callback: for `.register` the session and batch size limit are
///    stored first, otherwise the user callback receives the reply timestamp and body.
fn on_reply(self: *Client, reply: *Message.Reply) void {
    // Verify the checksums once more: this is the final opportunity to turn a correctness
    // bug into a liveness bug before data is handed back to the application.
    assert(reply.header.valid_checksum());
    assert(reply.header.valid_checksum_body(reply.body_used()));
    assert(reply.header.command == .reply);
    assert(reply.header.release.value == self.release.value);

    if (reply.header.client != self.id) {
        log.debug("{}: on_reply: ignoring (wrong client={})", .{
            self.id,
            reply.header.client,
        });
        return;
    }

    var inflight = self.request_inflight orelse {
        assert(reply.header.request < self.request_number);
        log.debug("{}: on_reply: ignoring (no inflight request)", .{self.id});
        return;
    };

    // Copy what we need from the request header now; the request message is released below.
    const request_operation = inflight.message.header.operation;
    const inflight_request_number = inflight.message.header.request;

    if (reply.header.request < inflight_request_number) {
        assert(inflight_request_number > 0);
        assert(request_operation != .register);

        log.debug("{}: on_reply: ignoring (request {} < {})", .{
            self.id,
            reply.header.request,
            inflight_request_number,
        });
        return;
    }

    assert(reply.header.request == inflight_request_number);
    assert(reply.header.request_checksum == inflight.message.header.checksum);

    // Request number zero is used by the register request, and only by it.
    const is_register = request_operation == .register;
    assert(if (is_register) inflight_request_number == 0 else inflight_request_number > 0);

    // Consume the in-flight slot before any callback below runs, in case a callback wants to
    // install a new `request_inflight`.
    assert(inflight.message == self.request_inflight.?.message);
    self.request_inflight = null;

    if (self.on_reply_callback) |observer| {
        observer(self, inflight.message, reply);
    }

    log.debug("{}: on_reply: user_data={} request={} size={} {s}", .{
        self.id,
        inflight.user_data,
        reply.header.request,
        reply.header.size,
        reply.header.operation.tag_name(Operation),
    });

    assert(reply.header.request_checksum == self.parent);
    assert(reply.header.client == self.id);
    assert(reply.header.request == inflight_request_number);
    assert(reply.header.cluster == self.cluster);
    assert(reply.header.op == reply.header.commit);
    assert(reply.header.operation == request_operation);

    // Our next request uses this reply's context as its parent.
    self.parent = reply.header.context;

    if (reply.header.view > self.view) {
        log.debug("{}: on_reply: newer view={}..{}", .{
            self.id,
            self.view,
            reply.header.view,
        });
        self.view = reply.header.view;
    }

    self.request_timeout.stop();

    // Give the request message back first, so that the in-flight callback is able to submit
    // a new request.
    self.release_message(inflight.message.base());
    inflight.message = undefined;

    if (!is_register) {
        // This reply answers a raw_request(): hand it to the user callback.
        // NOTE: the callback is permitted to mutate `reply.body_used()`.
        inflight.callback.request(
            inflight.user_data,
            request_operation,
            reply.header.timestamp,
            reply.body_used(),
        );
        return;
    }

    assert(inflight_request_number == 0);
    assert(self.batch_size_limit == null);
    assert(self.session == 0);
    assert(reply.header.commit > 0);
    assert(reply.header.size == @sizeOf(Header) + @sizeOf(vsr.RegisterResult));

    const register_result = std.mem.bytesAsValue(
        vsr.RegisterResult,
        reply.body_used()[0..@sizeOf(vsr.RegisterResult)],
    );
    assert(register_result.batch_size_limit > 0);
    assert(register_result.batch_size_limit <= constants.message_body_size_max);

    // The commit number of the register reply is used as the session number.
    self.session = reply.header.commit;
    self.batch_size_limit = register_result.batch_size_limit;
    inflight.callback.register(inflight.user_data, register_result);
}
622
+
623
/// Resets the ping timeout and sends a `ping_client` header, stamped with the current
/// monotonic time, to every replica.
fn on_ping_timeout(self: *Client) void {
    self.ping_timeout.reset();

    const now_ns = self.time.monotonic().ns;
    const ping: Header.PingClient = .{
        .command = .ping_client,
        .cluster = self.cluster,
        .release = self.release,
        .client = self.id,
        .ping_timestamp_monotonic = now_ns,
    };

    self.send_header_to_replicas(ping.frame_const());
}
636
+
637
// Resends the in-flight request after backing off the request timeout.
//
// A timeout can happen because:
// - the cluster is overloaded and is slow to respond,
// - the network dropped the request message,
// - a view change happened and we are no longer talking to the primary.
fn on_request_timeout(self: *Client) void {
    // Back off first, to reduce the load we put on the cluster.
    self.request_timeout.backoff(&self.prng);

    const inflight = self.request_inflight.?;
    const request = inflight.message;
    assert(request.header.command == .request);
    assert(request.header.request < self.request_number);
    assert(request.header.checksum == self.parent);
    assert(request.header.session == self.session);

    log.debug("{}: on_request_timeout: resending request={} checksum={x:0>32}", .{
        self.id,
        request.header.request,
        request.header.checksum,
    });

    self.send_request_with_hedging(request);
}
658
+
659
/// Builds a header-only message: copies `header` into a message taken from the message bus
/// and sets the body and header checksums.
/// The returned message has exactly 1 reference, which the caller owns.
fn create_message_from_header(self: *Client, header: *const Header) *Message {
    assert(header.cluster == self.cluster);
    assert(header.size == @sizeOf(Header));

    const message = self.message_bus.get_message(null);
    // Drops the reference taken here on exit; the `ref()` in the return statement below is
    // the one handed to the caller.
    defer self.message_bus.unref(message);

    const target = message.header;
    target.* = header.*;
    target.set_checksum_body(message.body_used());
    target.set_checksum();

    return message.ref();
}
673
+
674
/// Wraps `header` in a message, sends that message to every replica, and drops the message
/// reference on return.
fn send_header_to_replicas(self: *Client, header: *const Header) void {
    const outgoing = self.create_message_from_header(header);
    defer self.message_bus.unref(outgoing);

    self.send_message_to_replicas(outgoing);
}
680
+
681
/// Sends `message` to each replica index in `0..replica_count`, in ascending order.
fn send_message_to_replicas(self: *Client, message: *Message) void {
    var replica: u8 = 0;
    while (replica < self.replica_count) : (replica += 1) {
        self.send_message_to_replica(replica, message);
    }
}
686
+
687
/// Logs and sends `message` to the replica with index `replica` via the message bus.
/// Only `request` and `ping_client` messages carrying this client's id may be sent; any other
/// command is treated as unreachable.
fn send_message_to_replica(self: *Client, replica: u8, message: *Message) void {
    const command_name = @tagName(message.header.command);

    // Dispatch on the concrete header type so the log shows the per-command fields rather
    // than opaque bytes.
    switch (message.header.into_any()) {
        inline else => |typed_header| log.debug("{}: sending {s} to replica {}: {}", .{
            self.id,
            command_name,
            replica,
            typed_header,
        }),
    }

    assert(replica < self.replica_count);
    assert(message.header.valid_checksum());
    assert(message.header.cluster == self.cluster);

    switch (message.into_any()) {
        inline .request,
        .ping_client,
        => |typed_message| assert(typed_message.header.client == self.id),
        else => unreachable,
    }

    self.message_bus.send_message_to_replica(replica, message);
}
713
+
714
// Sends the request to the primary and, when the cluster has more than one replica, also to
// one randomly chosen backup. The extra copy covers the case where the client → primary link
// is down: as long as the client can reach a backup which in turn can reach the primary, the
// cluster still processes the request, so the cluster stays logically available.
fn send_request_with_hedging(self: *Client, message: *Message.Request) void {
    const primary: u8 = @intCast(self.view % self.replica_count);
    self.send_message_to_replica(primary, message.base());

    // With a single replica there is no backup to hedge with.
    if (self.replica_count <= 1) return;

    // An offset in 1..replica_count-1 from the primary never lands on the primary again.
    const offset = self.prng.range_inclusive(u8, 1, self.replica_count - 1);
    const backup = (primary + offset) % self.replica_count;
    assert(backup != primary);
    self.send_message_to_replica(backup, message.base());
}
729
+
730
/// Finalizes the in-flight request and sends it for the first time.
///
/// Fills in `parent`, `session` and `view` on the request header (all of which must still be
/// zero on entry), sets the checksums, records the request checksum as the client's `parent`,
/// starts the request timeout, and sends the request with hedging.
fn send_request_for_the_first_time(self: *Client, message: *Message.Request) void {
    assert(self.request_inflight.?.message == message);
    assert(self.request_number > 0);

    assert(message.header.command == .request);
    assert(message.header.parent == 0);
    assert(message.header.session == 0);
    assert(message.header.request < self.request_number);
    assert(message.header.view == 0);
    assert(message.header.size <= constants.message_size_max);

    // Checksums are set only now, on the first send: this is the point at which the checksum
    // of the latest reply is available to use as `parent`, and likewise the session number if
    // requests were queued while registering.
    message.header.parent = self.parent;
    message.header.session = self.session;
    // The highest view number we know of is included as well, which is why it is filled in
    // this late. It does not need to be refreshed afterwards, e.g. if the view changes
    // between now and a resend.
    message.header.view = self.view;
    message.header.set_checksum_body(message.body_used());
    message.header.set_checksum();

    // This request's checksum is the parent of our next reply.
    const request_checksum = message.header.checksum;
    self.parent = request_checksum;

    log.debug("{}: send_request_for_the_first_time: request={} checksum={x:0>32}", .{
        self.id,
        message.header.request,
        request_checksum,
    });

    assert(!self.request_timeout.ticking);
    self.request_timeout.start();

    self.send_request_with_hedging(message);
}
767
+ };
768
+ }