npm - tigerbeetle-node - Versions diffs - 0.5.2 → 0.8.1 - Mend

tigerbeetle-node 0.5.2 → 0.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61) hide show

package/README.md +97 -78
package/dist/benchmark.js +96 -94
package/dist/benchmark.js.map +1 -1
package/dist/index.d.ts +82 -82
package/dist/index.js +74 -93
package/dist/index.js.map +1 -1
package/dist/test.js +134 -111
package/dist/test.js.map +1 -1
package/package.json +3 -2
package/scripts/download_node_headers.sh +3 -1
package/src/benchmark.ts +114 -118
package/src/index.ts +102 -111
package/src/node.zig +55 -63
package/src/test.ts +146 -125
package/src/tigerbeetle/scripts/benchmark.bat +46 -0
package/src/tigerbeetle/scripts/benchmark.sh +5 -0
package/src/tigerbeetle/scripts/install_zig.bat +109 -109
package/src/tigerbeetle/scripts/install_zig.sh +8 -4
package/src/tigerbeetle/scripts/vopr.bat +47 -47
package/src/tigerbeetle/scripts/vopr.sh +2 -2
package/src/tigerbeetle/src/benchmark.zig +65 -102
package/src/tigerbeetle/src/cli.zig +39 -18
package/src/tigerbeetle/src/config.zig +44 -25
package/src/tigerbeetle/src/demo.zig +2 -15
package/src/tigerbeetle/src/demo_01_create_accounts.zig +10 -10
package/src/tigerbeetle/src/demo_03_create_transfers.zig +5 -3
package/src/tigerbeetle/src/{demo_04_create_transfers_two_phase_commit.zig → demo_04_create_pending_transfers.zig} +18 -12
package/src/tigerbeetle/src/demo_05_post_pending_transfers.zig +37 -0
package/src/tigerbeetle/src/demo_06_void_pending_transfers.zig +24 -0
package/src/tigerbeetle/src/demo_07_lookup_transfers.zig +1 -1
package/src/tigerbeetle/src/io/benchmark.zig +24 -49
package/src/tigerbeetle/src/io/darwin.zig +175 -44
package/src/tigerbeetle/src/io/linux.zig +177 -72
package/src/tigerbeetle/src/io/test.zig +61 -39
package/src/tigerbeetle/src/io/windows.zig +1161 -0
package/src/tigerbeetle/src/io.zig +2 -0
package/src/tigerbeetle/src/main.zig +31 -10
package/src/tigerbeetle/src/message_bus.zig +49 -61
package/src/tigerbeetle/src/message_pool.zig +66 -57
package/src/tigerbeetle/src/ring_buffer.zig +55 -3
package/src/tigerbeetle/src/simulator.zig +108 -12
package/src/tigerbeetle/src/state_machine.zig +1813 -816
package/src/tigerbeetle/src/storage.zig +0 -230
package/src/tigerbeetle/src/test/cluster.zig +168 -38
package/src/tigerbeetle/src/test/message_bus.zig +4 -3
package/src/tigerbeetle/src/test/network.zig +13 -16
package/src/tigerbeetle/src/test/packet_simulator.zig +14 -1
package/src/tigerbeetle/src/test/state_checker.zig +6 -3
package/src/tigerbeetle/src/test/state_machine.zig +8 -7
package/src/tigerbeetle/src/test/storage.zig +99 -40
package/src/tigerbeetle/src/tigerbeetle.zig +108 -101
package/src/tigerbeetle/src/time.zig +58 -11
package/src/tigerbeetle/src/vsr/client.zig +18 -32
package/src/tigerbeetle/src/vsr/clock.zig +1 -1
package/src/tigerbeetle/src/vsr/journal.zig +1388 -464
package/src/tigerbeetle/src/vsr/replica.zig +1340 -576
package/src/tigerbeetle/src/vsr.zig +452 -40
package/src/translate.zig +10 -0
package/src/tigerbeetle/src/demo_05_accept_transfers.zig +0 -23
package/src/tigerbeetle/src/demo_06_reject_transfers.zig +0 -17
package/src/tigerbeetle/src/format_test.zig +0 -69

package/src/tigerbeetle/src/simulator.zig CHANGED Viewed

@@ -20,6 +20,8 @@ const output = std.log.scoped(.state_checker);
 /// This will run much slower but will trace all logic across the cluster.
 const log_state_transitions_only = builtin.mode != .Debug;
+const log_health = std.log.scoped(.health);
 /// You can fine tune your log levels even further (debug/info/notice/warn/err/crit/alert/emerg):
 pub const log_level: std.log.Level = if (log_state_transitions_only) .info else .debug;
@@ -64,7 +66,6 @@ pub fn main() !void {
     const node_count = replica_count + client_count;
     const ticks_max = 100_000_000;
-    const transitions_max = config.journal_size_max / config.message_size_max;
     const request_probability = 1 + random.uintLessThan(u8, 99);
     const idle_on_probability = random.uintLessThan(u8, 20);
     const idle_off_probability = 10 + random.uintLessThan(u8, 10);
@@ -84,7 +85,7 @@ pub fn main() !void {
                 .one_way_delay_mean = 3 + random.uintLessThan(u16, 10),
                 .one_way_delay_min = random.uintLessThan(u16, 3),
                 .packet_loss_probability = random.uintLessThan(u8, 30),
-                .path_maximum_capacity = 20 + random.uintLessThan(u8, 20),
+                .path_maximum_capacity = 2 + random.uintLessThan(u8, 19),
                 .path_clog_duration_mean = random.uintLessThan(u16, 500),
                 .path_clog_probability = random.uintLessThan(u8, 2),
                 .packet_replay_probability = random.uintLessThan(u8, 50),
@@ -101,10 +102,16 @@ pub fn main() !void {
             .read_latency_min = random.uintLessThan(u16, 3),
             .read_latency_mean = 3 + random.uintLessThan(u16, 10),
             .write_latency_min = random.uintLessThan(u16, 3),
-            .write_latency_mean = 3 + random.uintLessThan(u16, 10),
+            .write_latency_mean = 3 + random.uintLessThan(u16, 100),
             .read_fault_probability = random.uintLessThan(u8, 10),
             .write_fault_probability = random.uintLessThan(u8, 10),
         },
+        .health_options = .{
+            .crash_probability = 0.0001,
+            .crash_stability = random.uintLessThan(u32, 1_000),
+            .restart_probability = 0.01,
+            .restart_stability = random.uintLessThan(u32, 1_000),
+        },
     });
     defer cluster.destroy();
@@ -143,6 +150,10 @@ pub fn main() !void {
         \\          write_latency_mean={}
         \\          read_fault_probability={}%
         \\          write_fault_probability={}%
+        \\          crash_probability={d}%
+        \\          crash_stability={} ticks
+        \\          restart_probability={d}%
+        \\          restart_stability={} ticks
         \\
     , .{
         seed,
@@ -169,26 +180,105 @@ pub fn main() !void {
         cluster.options.storage_options.write_latency_mean,
         cluster.options.storage_options.read_fault_probability,
         cluster.options.storage_options.write_fault_probability,
+        cluster.options.health_options.crash_probability * 100,
+        cluster.options.health_options.crash_stability,
+        cluster.options.health_options.restart_probability * 100,
+        cluster.options.health_options.restart_stability,
     });
     var requests_sent: u64 = 0;
     var idle = false;
+    // The minimum number of healthy replicas required for a crashed replica to be able to recover.
+    const replica_normal_min = replicas: {
+        if (replica_count == 1) {
+            // A cluster of 1 can crash safely (as long as there is no disk corruption) since it
+            // does not run the recovery protocol.
+            break :replicas 0;
+        } else {
+            break :replicas cluster.replicas[0].quorum_view_change;
+        }
+    };
+    // Disable most faults at startup, so that the replicas don't get stuck in recovery mode.
+    for (cluster.storages) |*storage, i| {
+        storage.faulty = replica_normal_min <= i;
+    }
+    // TODO When storage is supported, run more transitions than fit in the journal.
+    const transitions_max = config.journal_slot_count / 2;
     var tick: u64 = 0;
     while (tick < ticks_max) : (tick += 1) {
-        for (cluster.storages) |*storage| storage.tick();
+        const health_options = &cluster.options.health_options;
+        // The maximum number of replicas that can crash, with the cluster still able to recover.
+        var crashes = cluster.replica_normal_count() -| replica_normal_min;
+        for (cluster.storages) |*storage, replica| {
+            if (cluster.replicas[replica].journal.recovered) {
+                // TODO Remove this workaround when VSR recovery protocol is disabled.
+                // When only the minimum number of replicas are healthy (no more crashes allowed),
+                // disable storage faults on all healthy replicas.
+                //
+                // This is a workaround to avoid the deadlock that occurs when (for example) in a
+                // cluster of 3 replicas, one is down, another has a corrupt prepare, and the last does
+                // not have the prepare. The two healthy replicas can never complete a view change,
+                // because two replicas are not enough to nack, and the unhealthy replica cannot
+                // complete the VSR recovery protocol either.
+                if (cluster.health[replica] == .up and crashes == 0) {
+                    storage.faulty = false;
+                } else {
+                    // When a journal recovers for the first time, enable its storage faults.
+                    // Future crashes will recover in the presence of faults.
+                    storage.faulty = true;
+                }
+            }
+            storage.tick();
+        }
-        for (cluster.replicas) |*replica, i| {
-            replica.tick();
-            cluster.state_checker.check_state(@intCast(u8, i));
+        for (cluster.replicas) |*replica| {
+            switch (cluster.health[replica.replica]) {
+                .up => |*ticks| {
+                    ticks.* -|= 1;
+                    replica.tick();
+                    cluster.state_checker.check_state(replica.replica);
+                    if (ticks.* != 0) continue;
+                    if (crashes == 0) continue;
+                    if (cluster.storages[replica.replica].writes.count() == 0) {
+                        if (!chance_f64(random, health_options.crash_probability)) continue;
+                    } else {
+                        if (!chance_f64(random, health_options.crash_probability * 10.0)) continue;
+                    }
+                    if (!try cluster.crash_replica(replica.replica)) continue;
+                    log_health.debug("crash replica={}", .{replica.replica});
+                    crashes -= 1;
+                },
+                .down => |*ticks| {
+                    ticks.* -|= 1;
+                    // Keep ticking the time so that it won't have diverged too far to synchronize
+                    // when the replica restarts.
+                    replica.clock.time.tick();
+                    assert(replica.status == .recovering);
+                    if (ticks.* == 0 and chance_f64(random, health_options.restart_probability)) {
+                        cluster.health[replica.replica] = .{ .up = health_options.restart_stability };
+                        log_health.debug("restart replica={}", .{replica.replica});
+                    }
+                },
+            }
         }
-        cluster.network.packet_simulator.tick();
+        cluster.network.packet_simulator.tick(cluster.health);
         for (cluster.clients) |*client| client.tick();
         if (cluster.state_checker.transitions == transitions_max) {
-            if (cluster.state_checker.convergence()) break;
+            if (cluster.state_checker.convergence() and
+                cluster.replica_up_count() == replica_count)
+            {
+                break;
+            }
             continue;
         } else {
             assert(cluster.state_checker.transitions < transitions_max);
@@ -213,7 +303,7 @@ pub fn main() !void {
     assert(cluster.state_checker.convergence());
-    output.info("\n          PASSED", .{});
+    output.info("\n          PASSED ({} ticks)", .{tick});
 }
 /// Returns true, `p` percent of the time, else false.
@@ -222,6 +312,12 @@ fn chance(random: std.rand.Random, p: u8) bool {
     return random.uintLessThan(u8, 100) < p;
 }
+/// Returns true with probability `p`, else false.
+///
+/// Unlike `chance()`, `p` is a fraction in the range [0.0, 1.0] and NOT a percentage:
+/// it is compared directly against a sample drawn from `random.float(f64)`.
+/// For example, `p = 0.01` returns true roughly 1% of the time.
+fn chance_f64(random: std.rand.Random, p: f64) bool {
+    // Reject percentages passed by mistake (e.g. 50.0), which would otherwise always
+    // return true, as well as negative values, which would silently never fire.
+    assert(p >= 0.0);
+    assert(p <= 1.0);
+    return random.float(f64) < p;
+}
 /// Returns the next argument for the simulator or null (if none available)
 fn args_next(args: *std.process.ArgIterator, allocator: std.mem.Allocator) ?[:0]const u8 {
     const err_or_bytes = args.next(allocator) orelse return null;
@@ -244,7 +340,7 @@ fn send_request(random: std.rand.Random) bool {
     if (client.request_queue.full()) return false;
     if (checker_request_queue.full()) return false;
-    const message = client.get_message() orelse return false;
+    const message = client.get_message();
     defer client.unref(message);
     const body_size_max = config.message_size_max - @sizeOf(Header);
@@ -265,7 +361,7 @@ fn send_request(random: std.rand.Random) bool {
     // While hashing the client ID with the request body prevents input collisions across clients,
     // it's still possible for the same client to generate the same body, and therefore input hash.
     const client_input = StateMachine.hash(client.id, body);
-    checker_request_queue.push(client_input) catch unreachable;
+    checker_request_queue.push_assume_capacity(client_input);
     std.log.scoped(.test_client).debug("client {} sending input={x}", .{
         client_index,
         client_input,