1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
// SPDX-License-Identifier: BUSL-1.1
//! KV engine operations dispatched to the Data Plane.
use nodedb_types::Surrogate;
/// KV engine physical operations.
///
/// All operations target a hash-indexed collection with O(1) point lookups.
/// Keys and values are serialized as Binary Tuples.
#[derive(
Debug,
Clone,
PartialEq,
serde::Serialize,
serde::Deserialize,
zerompk::ToMessagePack,
zerompk::FromMessagePack,
)]
pub enum KvOp {
/// Point lookup by primary key. Returns Binary Tuple value or nil.
Get {
collection: String,
key: Vec<u8>,
/// RLS post-fetch filters. Evaluated after fetching the value.
/// Returns nil on denial (no info leak).
rls_filters: Vec<u8>,
/// Clone snapshot-isolation ceiling: when set, a fetched entry
/// whose surrogate exceeds this value is treated as not-found.
/// Populated by the clone resolver when rewriting a target-side
/// `Get` for delegation to the source database — bindings the
/// source allocated AFTER the clone's AS-OF must not leak
/// through. `None` for normal (non-clone-delegated) gets.
#[serde(default)]
surrogate_ceiling: Option<u32>,
},
/// Insert or update (RESP SET / SQL UPSERT semantics). Writes a Binary
/// Tuple value keyed by primary key, overwriting any existing row.
///
/// If the collection has secondary indexes, they are maintained synchronously.
/// If no secondary indexes, takes the zero-index fast path.
Put {
collection: String,
key: Vec<u8>,
/// Binary Tuple encoded value (all value columns).
value: Vec<u8>,
/// Per-key TTL override in milliseconds. 0 = use collection default.
ttl_ms: u64,
/// Stable cross-engine identity assigned by the CP-side
/// `SurrogateAssigner` from `(collection, key)`.
/// `Surrogate::ZERO` only appears in test fixtures.
surrogate: Surrogate,
},
/// SQL `INSERT` semantics: write only if the key does not already exist.
/// Returns `unique_violation` (SQLSTATE 23505, via `NodeDbError`) on
/// duplicate key. Reserved for the `INSERT` SQL path — RESP `SET` and
/// `UPSERT` continue to use `Put`.
Insert {
collection: String,
key: Vec<u8>,
value: Vec<u8>,
ttl_ms: u64,
/// Stable cross-engine identity. `Surrogate::ZERO` only in tests.
surrogate: Surrogate,
},
/// SQL `INSERT ... ON CONFLICT DO NOTHING` semantics: write if the key
/// does not exist, silently no-op on duplicate. No error on conflict.
InsertIfAbsent {
collection: String,
key: Vec<u8>,
value: Vec<u8>,
ttl_ms: u64,
/// Stable cross-engine identity. `Surrogate::ZERO` only in tests.
surrogate: Surrogate,
},
/// SQL `INSERT ... ON CONFLICT (key) DO UPDATE SET ...` semantics:
/// write if absent; on duplicate, read-modify-write — apply the
/// `updates` (which may reference `EXCLUDED.col` on the incoming row)
/// to the existing value and write the merged result. `value` is the
/// would-be-inserted row, used both as the write target when absent
/// and as `EXCLUDED` when the handler evaluates expressions.
InsertOnConflictUpdate {
collection: String,
key: Vec<u8>,
value: Vec<u8>,
ttl_ms: u64,
updates: Vec<(String, super::document::UpdateValue)>,
/// Stable cross-engine identity. `Surrogate::ZERO` only in tests.
surrogate: Surrogate,
},
/// Delete by primary key(s). Returns count of keys actually deleted.
Delete {
collection: String,
keys: Vec<Vec<u8>>,
},
/// Cursor-based scan with optional filter predicate.
Scan {
collection: String,
/// Opaque cursor from a previous scan. Empty = start from beginning.
cursor: Vec<u8>,
/// Maximum entries to return in this batch.
count: usize,
/// Optional filter predicates (same format as DocumentScan filters).
filters: Vec<u8>,
/// Optional glob pattern for key matching (e.g., "user:*").
match_pattern: Option<String>,
/// Sort keys: `(field, descending)` pairs applied to the scan result
/// before encoding. Empty = unsorted (engine native order).
#[serde(default)]
sort_keys: Vec<(String, bool)>,
/// Clone snapshot-isolation ceiling: when set, scan results
/// drop entries whose surrogate exceeds this value. Populated
/// by the clone resolver when rewriting a target-side scan for
/// delegation to the source database — bindings the source
/// allocated AFTER the clone's AS-OF must not leak through.
/// `None` for normal (non-clone-delegated) scans.
#[serde(default)]
surrogate_ceiling: Option<u32>,
},
/// Set or update TTL on an existing key.
Expire {
collection: String,
key: Vec<u8>,
/// TTL in milliseconds from now.
ttl_ms: u64,
},
/// Remove TTL from an existing key (make it persistent).
Persist { collection: String, key: Vec<u8> },
/// Get remaining TTL for a key without fetching the value.
///
/// Returns JSON `{"ttl_ms": N}` where N is:
/// - `-2` — key does not exist
/// - `-1` — key exists but has no TTL (persistent)
/// - `>= 0` — remaining milliseconds until expiry
GetTtl { collection: String, key: Vec<u8> },
/// Batch get: fetch multiple keys in a single bridge round-trip.
BatchGet {
collection: String,
keys: Vec<Vec<u8>>,
},
/// Batch put: insert/update multiple key-value pairs atomically.
BatchPut {
collection: String,
/// `(key, value)` pairs.
entries: Vec<(Vec<u8>, Vec<u8>)>,
/// Per-key TTL override in milliseconds. 0 = use collection default.
ttl_ms: u64,
},
/// Register a secondary index on a value field (DDL).
///
/// Dispatched when `CREATE INDEX idx ON kv_collection (field)` is executed.
/// If `backfill` is true, scans all existing entries to populate the index.
RegisterIndex {
collection: String,
/// Field name to index (must match a column in the KV schema).
field: String,
/// Position of the field in the schema column list.
field_position: usize,
/// Whether to backfill the index with existing entries.
backfill: bool,
},
/// Remove a secondary index from a value field (DDL).
DropIndex { collection: String, field: String },
/// Extract one or more fields from a key's value (HGET/HMGET).
///
/// Deserializes the stored value, extracts the named fields, and returns
/// them as a JSON object. O(1) key lookup + field extraction.
FieldGet {
collection: String,
key: Vec<u8>,
/// Field names to extract.
fields: Vec<String>,
},
/// Update specific fields in a key's value (HSET).
///
/// Read-modify-write: reads the current value, merges field updates,
/// writes back. Maintains secondary indexes if any.
FieldSet {
collection: String,
key: Vec<u8>,
/// Field name → new value (JSON-encoded bytes).
updates: Vec<(String, Vec<u8>)>,
},
/// Truncate: delete ALL entries in a KV collection.
Truncate { collection: String },
/// Atomic increment on a numeric value. Returns new value.
///
/// If key doesn't exist, initializes to 0 then adds delta.
/// If value is not i64, returns `TypeMismatch`.
/// On overflow (i64::MAX + 1), returns `OverflowError`.
/// TTL: if `ttl_ms > 0` and key is new, sets TTL; if key exists, resets TTL.
/// If `ttl_ms == 0`, preserves existing TTL (no change).
Incr {
collection: String,
key: Vec<u8>,
delta: i64,
/// TTL in milliseconds. 0 = preserve existing TTL.
ttl_ms: u64,
},
/// Atomic float increment on a numeric value. Returns new value.
///
/// Same semantics as `Incr` but for f64 values.
/// If value is not f64, returns `TypeMismatch`.
IncrFloat {
collection: String,
key: Vec<u8>,
delta: f64,
},
/// Compare-and-swap: set value to `new_value` only if current equals `expected`.
///
/// Returns JSON `{"success": bool, "current_value": "<base64>"}`.
/// If key doesn't exist and `expected` is empty, creates the key (create-if-not-exists).
Cas {
collection: String,
key: Vec<u8>,
expected: Vec<u8>,
new_value: Vec<u8>,
},
/// Atomic get-and-set: set new value, return old value.
///
/// Returns the previous value (or null if key didn't exist).
GetSet {
collection: String,
key: Vec<u8>,
new_value: Vec<u8>,
},
// ── Atomic Transfer Operations ───────────────────────────────────
/// Atomic fungible transfer: read-validate-write in one Data Plane pass.
///
/// Reads source and dest values, validates source.field >= amount,
/// then atomically writes both updated values. No TOCTOU race.
Transfer {
collection: String,
source_key: Vec<u8>,
dest_key: Vec<u8>,
field: String,
/// Amount to transfer (encoded as f64 bytes).
amount: f64,
},
/// Atomic non-fungible item transfer: verify + delete + insert in one pass.
///
/// Verifies source owns the item, then atomically deletes from source
/// and inserts at dest. Fails with NotFound if source doesn't own it.
TransferItem {
source_collection: String,
dest_collection: String,
item_key: Vec<u8>,
dest_key: Vec<u8>,
},
// ── Sorted Index (Leaderboard) Operations ──────────────────────────
/// Register a sorted index on a KV collection (DDL).
RegisterSortedIndex {
collection: String,
index_name: String,
/// Sort columns: (column_name, direction "ASC"/"DESC").
sort_columns: Vec<(String, String)>,
/// Primary key column name.
key_column: String,
/// Window type: "none", "daily", "weekly", "monthly", or "custom".
window_type: String,
/// Window timestamp column (empty if window_type == "none").
window_timestamp_column: String,
/// Custom window start (ms since epoch, 0 if N/A).
window_start_ms: u64,
/// Custom window end (ms since epoch, 0 if N/A).
window_end_ms: u64,
},
/// Drop a sorted index.
DropSortedIndex { index_name: String },
/// Get the 1-based rank of a key in a sorted index.
SortedIndexRank {
index_name: String,
primary_key: Vec<u8>,
},
/// Get the top K entries from a sorted index.
SortedIndexTopK { index_name: String, k: u32 },
/// Get entries in a score range from a sorted index.
SortedIndexRange {
index_name: String,
score_min: Option<Vec<u8>>,
score_max: Option<Vec<u8>>,
},
/// Get total count of entries in a sorted index.
SortedIndexCount { index_name: String },
/// Get the sort key (score) for a key in a sorted index (ZSCORE equivalent).
SortedIndexScore {
index_name: String,
primary_key: Vec<u8>,
},
/// Cursor-paginated raw scan for the clone materializer.
///
/// Unlike `Scan`, this returns raw `(key, value)` byte pairs **plus** the
/// next-cursor in a single payload, so the materializer can drive the
/// scan to completion in O(N / count) round-trips. The response payload
/// is msgpack-encoded as a 2-element array:
/// `[ next_cursor: bytes, entries: [[key: bytes, value: bytes], ...] ]`
/// `next_cursor` is empty when the scan is complete.
MaterializeScan {
collection: String,
cursor: Vec<u8>,
count: usize,
},
}