fortress-api-server 1.0.0

REST API server for Fortress secure database system
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
//! # Node Discovery Module
//!
//! This module handles automatic discovery and registration of cluster nodes,
//! enabling dynamic cluster formation and maintenance.

use crate::cluster::ClusterResult;
use serde::{Deserialize, Serialize};
use std::collections::HashMap;
use std::sync::Arc;
use std::time::Duration;
use tokio::sync::{RwLock, Mutex};
use tokio::time::interval;
use tracing::{debug, error, info, warn};
use uuid::Uuid;

/// Node discovery configuration
///
/// Tunables for [`NodeDiscovery`]: how often discovery requests are broadcast,
/// how long a silent node is kept in the known-node table, and which discovery
/// mechanisms run during the initial discovery pass.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct DiscoveryConfig {
    /// Discovery interval in seconds (period of the background discovery loop)
    pub discovery_interval_secs: u64,
    /// Node timeout in seconds; a node whose `last_seen` is older than this is
    /// removed by the stale-node cleanup pass
    pub node_timeout_secs: u64,
    /// Maximum number of discovery attempts
    // NOTE(review): not read anywhere in this module — confirm where (or whether) it is enforced.
    pub max_discovery_attempts: u32,
    /// Enable multicast discovery (announce the local node during initial discovery)
    pub enable_multicast: bool,
    /// Multicast address; combined with `multicast_port` as `"address:port"`
    /// to form the announcement target
    pub multicast_address: String,
    /// Multicast port
    pub multicast_port: u16,
    /// Enable DNS-based discovery
    pub enable_dns_discovery: bool,
    /// DNS domain for cluster nodes; DNS discovery does nothing when this is `None`
    pub dns_domain: Option<String>,
    /// Enable static seed nodes (contact `static_seed_nodes` during initial discovery)
    pub enable_static_seeds: bool,
    /// Static seed node addresses, passed verbatim to the network sender as targets
    pub static_seed_nodes: Vec<String>,
}

impl Default for DiscoveryConfig {
    /// Baseline configuration: discover every 30 s, expire nodes after 90 s,
    /// multicast on `239.255.0.1:8082`, static seeds enabled (with an empty
    /// seed list) and DNS discovery disabled.
    fn default() -> Self {
        let multicast_address = String::from("239.255.0.1");
        let static_seed_nodes: Vec<String> = vec![];

        Self {
            // Timing
            discovery_interval_secs: 30,
            node_timeout_secs: 90,
            max_discovery_attempts: 3,
            // Multicast
            enable_multicast: true,
            multicast_address,
            multicast_port: 8082,
            // DNS
            enable_dns_discovery: false,
            dns_domain: None,
            // Static seeds
            enable_static_seeds: true,
            static_seed_nodes,
        }
    }
}

/// Node information for discovery
///
/// One entry of the known-node table kept by [`NodeDiscovery`]; also the
/// payload carried by node announcements and discovery responses.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct NodeInfo {
    /// Unique node identifier (key of the known-node table)
    pub node_id: Uuid,
    /// Node address
    pub address: String,
    /// Node port
    pub port: u16,
    /// Node role in cluster
    // NOTE(review): free-form string; the set of valid roles is not defined in this module.
    pub role: String,
    /// Node capabilities
    pub capabilities: Vec<String>,
    /// Last seen timestamp; compared against the configured node timeout to
    /// expire stale nodes, and against incoming announcements to decide
    /// whether they carry newer information
    pub last_seen: chrono::DateTime<chrono::Utc>,
    /// Node metadata
    pub metadata: HashMap<String, String>,
}

/// Discovery message types
///
/// Messages exchanged between nodes through a [`DiscoveryNetworkSender`] and
/// dispatched by [`NodeDiscovery::handle_message`].
#[derive(Debug, Clone, Serialize, Deserialize)]
pub enum DiscoveryMessage {
    /// Node announcement: the sender advertises its own [`NodeInfo`]
    NodeAnnouncement {
        /// Information about the announcing node
        node_info: NodeInfo,
    },
    
    /// Node discovery request: asks the receiver for the nodes it knows about
    DiscoveryRequest {
        /// ID of the requesting node
        requester_id: Uuid,
        /// When the request was sent
        timestamp: chrono::DateTime<chrono::Utc>,
    },
    
    /// Node discovery response: answer to a `DiscoveryRequest`
    DiscoveryResponse {
        /// ID of the requesting node (receivers ignore responses addressed to other nodes)
        requester_id: Uuid,
        /// List of known nodes
        known_nodes: Vec<NodeInfo>,
        /// When the response was sent
        // NOTE(review): the responder in this module echoes the request's timestamp here — confirm intent.
        timestamp: chrono::DateTime<chrono::Utc>,
    },
    
    /// Node leave notification: the node is removed from the receiver's known-node table
    NodeLeave {
        /// ID of the leaving node
        node_id: Uuid,
        /// When the leave notification was sent
        timestamp: chrono::DateTime<chrono::Utc>,
        /// Reason for leaving (forwarded to `on_node_left` callbacks)
        reason: String,
    },
    
    /// Heartbeat message: refreshes `last_seen` of an already-known node
    Heartbeat {
        /// ID of the node sending heartbeat
        node_id: Uuid,
        /// When the heartbeat was sent
        timestamp: chrono::DateTime<chrono::Utc>,
        /// Current election term (ignored by the discovery handler)
        term: u64,
    },
}

/// Discovery-specific errors
///
/// The `#[error]` attributes define the `Display` text of each variant.
// NOTE(review): none of these variants is constructed in this module; presumably
// they are converted into the cluster-wide error type elsewhere — confirm.
#[derive(Debug, thiserror::Error)]
pub enum DiscoveryError {
    /// Network discovery failed (payload: description of the failure)
    #[error("Network discovery failed: {0}")]
    NetworkDiscoveryFailed(String),
    
    /// DNS discovery failed (payload: description of the failure)
    #[error("DNS discovery failed: {0}")]
    DnsDiscoveryFailed(String),
    
    /// Invalid node address (payload: the offending address)
    #[error("Invalid node address: {0}")]
    InvalidNodeAddress(String),
    
    /// Node already exists (payload: the node's ID)
    #[error("Node already exists: {0}")]
    NodeAlreadyExists(Uuid),
    
    /// Node not found in cluster (payload: the node's ID)
    #[error("Node not found: {0}")]
    NodeNotFound(Uuid),
    
    /// Discovery operation timed out
    #[error("Discovery timeout")]
    DiscoveryTimeout,
    
    /// Multicast communication error (payload: description of the failure)
    #[error("Multicast error: {0}")]
    MulticastError(String),
}

/// Node discovery manager
///
/// Tracks the nodes this node has learned about, notifies registered
/// callbacks when nodes join, change or leave, and talks to peers through an
/// injected [`DiscoveryNetworkSender`]. The table, the callback list and the
/// sender are all behind `Arc`, so clones of a `NodeDiscovery` share them.
pub struct NodeDiscovery {
    /// This node's information (never stored in `known_nodes`)
    local_node_info: NodeInfo,
    /// Configuration
    config: DiscoveryConfig,
    /// Known nodes, keyed by node ID
    known_nodes: Arc<RwLock<HashMap<Uuid, NodeInfo>>>,
    /// Discovery callbacks, invoked in registration order
    callbacks: Arc<Mutex<Vec<Box<dyn NodeDiscoveryCallback + Send + Sync>>>>,
    /// Network sender used for every outgoing discovery message
    network_sender: Arc<Mutex<dyn DiscoveryNetworkSender + Send + Sync>>,
}

/// Callback trait for node discovery events
///
/// Implementations are registered with [`NodeDiscovery::add_callback`].
/// Callbacks are awaited one after another while the callback list is locked,
/// so an implementation must not call `add_callback` on the same manager from
/// inside a callback.
#[async_trait::async_trait]
pub trait NodeDiscoveryCallback {
    /// Called when a new node joins the cluster (first time its ID is seen)
    async fn on_node_joined(&self, node_info: &NodeInfo);
    
    /// Called when a node leaves the cluster, either through a leave
    /// notification or because it timed out (`reason` is `"timeout"` then)
    async fn on_node_left(&self, node_id: Uuid, reason: &str);
    
    /// Called when a node's information is updated by a newer announcement
    async fn on_node_updated(&self, node_info: &NodeInfo);
}

/// Trait for network discovery operations
///
/// Transport abstraction used by [`NodeDiscovery`] for all outgoing
/// discovery traffic.
#[async_trait::async_trait]
pub trait DiscoveryNetworkSender {
    /// Send a discovery message to a specific target
    ///
    /// `target` is an address string; this module passes seed addresses, the
    /// `"address:port"` multicast endpoint, and the `source` of a received request.
    async fn send_discovery_message(&self, target: &str, message: DiscoveryMessage) -> ClusterResult<()>;
    
    /// Broadcast a discovery message to all nodes
    async fn broadcast_discovery_message(&self, message: DiscoveryMessage) -> ClusterResult<()>;
    
    /// Receive discovery messages from the network
    ///
    /// Returns `(source, message)` pairs.
    // NOTE(review): not called anywhere in this module; presumably the caller
    // feeds the pairs into `NodeDiscovery::handle_message` — confirm.
    async fn receive_discovery_messages(&self) -> Vec<(String, DiscoveryMessage)>;
}

impl NodeDiscovery {
    /// Build a discovery manager for `local_node_info`.
    ///
    /// The manager starts with an empty known-node table and no callbacks;
    /// nothing is sent on the network until [`NodeDiscovery::start`] is called.
    pub fn new(
        local_node_info: NodeInfo,
        config: DiscoveryConfig,
        network_sender: Arc<Mutex<dyn DiscoveryNetworkSender + Send + Sync>>,
    ) -> Self {
        let known_nodes = Arc::new(RwLock::new(HashMap::new()));
        let callbacks = Arc::new(Mutex::new(Vec::new()));

        Self {
            local_node_info,
            config,
            known_nodes,
            callbacks,
            network_sender,
        }
    }

    /// Launch the discovery service.
    ///
    /// Spawns two detached background tasks (the periodic discovery loop and
    /// the stale-node cleanup loop), each working on a clone of this manager,
    /// and then runs the initial discovery pass on the calling task.
    ///
    /// # Errors
    ///
    /// Returns whatever error the initial discovery pass reports. The
    /// background tasks are already running at that point and are not stopped.
    pub async fn start(&self) -> ClusterResult<()> {
        info!("Starting node discovery for {}", self.local_node_info.node_id);

        // Periodic discovery requests.
        let discovery_worker = self.clone();
        tokio::spawn(async move { discovery_worker.discovery_loop().await });

        // Periodic removal of nodes that stopped reporting.
        let cleanup_worker = self.clone();
        tokio::spawn(async move { cleanup_worker.cleanup_loop().await });

        self.perform_initial_discovery().await
    }

    /// Main discovery loop
    ///
    /// Broadcasts a discovery request every `discovery_interval_secs` seconds.
    /// Failures are logged and do not stop the loop; this function never returns.
    async fn discovery_loop(&self) {
        // `tokio::time::interval` panics when given a zero period, which would
        // kill this background task on a `discovery_interval_secs: 0` config.
        // Clamp to one second instead.
        let period_secs = self.config.discovery_interval_secs.max(1);
        let mut ticker = interval(Duration::from_secs(period_secs));

        loop {
            ticker.tick().await;

            if let Err(e) = self.perform_discovery().await {
                error!("Discovery failed: {}", e);
            }
        }
    }

    /// Node cleanup loop
    async fn cleanup_loop(&self) {
        let mut interval = interval(Duration::from_secs(30));
        
        loop {
            interval.tick().await;
            
            if let Err(e) = self.cleanup_stale_nodes().await {
                error!("Node cleanup failed: {}", e);
            }
        }
    }

    /// Run every enabled discovery mechanism once.
    ///
    /// Order: static seeds, then DNS, then multicast. Each mechanism runs only
    /// if its `enable_*` flag is set.
    ///
    /// # Errors
    ///
    /// Stops at, and returns, the first error reported by a mechanism.
    async fn perform_initial_discovery(&self) -> ClusterResult<()> {
        info!("Performing initial node discovery");

        let cfg = &self.config;

        if cfg.enable_static_seeds {
            self.discover_static_seeds().await?;
        }
        if cfg.enable_dns_discovery {
            self.discover_dns_nodes().await?;
        }
        if cfg.enable_multicast {
            self.discover_multicast_nodes().await?;
        }

        Ok(())
    }

    /// Broadcast one discovery request on behalf of the local node.
    ///
    /// # Errors
    ///
    /// Returns the network sender's error if the broadcast fails.
    async fn perform_discovery(&self) -> ClusterResult<()> {
        let requester_id = self.local_node_info.node_id;
        let request = DiscoveryMessage::DiscoveryRequest {
            requester_id,
            timestamp: chrono::Utc::now(),
        };

        // The sender lock is held for the duration of the broadcast.
        self.network_sender
            .lock()
            .await
            .broadcast_discovery_message(request)
            .await?;

        Ok(())
    }

    /// Send a discovery request to every configured static seed.
    ///
    /// Contacting seeds is best-effort: a seed that cannot be reached is
    /// logged as a warning and the remaining seeds are still tried, so this
    /// function always returns `Ok(())`.
    async fn discover_static_seeds(&self) -> ClusterResult<()> {
        info!("Discovering static seed nodes");

        let requester_id = self.local_node_info.node_id;

        for seed_address in self.config.static_seed_nodes.iter() {
            // A fresh request (and timestamp) per seed.
            let request = DiscoveryMessage::DiscoveryRequest {
                requester_id,
                timestamp: chrono::Utc::now(),
            };

            // The sender lock is taken per seed, not for the whole loop.
            let outcome = self
                .network_sender
                .lock()
                .await
                .send_discovery_message(seed_address, request)
                .await;

            if let Err(e) = outcome {
                warn!("Failed to contact seed node {}: {}", seed_address, e);
            }
        }

        Ok(())
    }

    /// Discover nodes via DNS
    async fn discover_dns_nodes(&self) -> ClusterResult<()> {
        if let Some(domain) = &self.config.dns_domain {
            info!("Discovering nodes via DNS domain: {}", domain);
            
            // DNS SRV record lookup would go here
            // For now, this is a placeholder
            debug!("DNS discovery not yet implemented");
        }

        Ok(())
    }

    /// Announce the local node on the configured multicast endpoint.
    ///
    /// The target is `"{multicast_address}:{multicast_port}"`. Sending is
    /// best-effort: a failure is logged as a warning and `Ok(())` is returned
    /// regardless.
    async fn discover_multicast_nodes(&self) -> ClusterResult<()> {
        info!("Discovering nodes via multicast");

        let announcement = DiscoveryMessage::NodeAnnouncement {
            node_info: self.local_node_info.clone(),
        };
        let cfg = &self.config;
        let target = format!("{}:{}", cfg.multicast_address, cfg.multicast_port);

        let outcome = self
            .network_sender
            .lock()
            .await
            .send_discovery_message(&target, announcement)
            .await;

        match outcome {
            Ok(()) => {}
            Err(e) => warn!("Failed to send multicast announcement: {}", e),
        }

        Ok(())
    }

    /// Clean up stale nodes
    async fn cleanup_stale_nodes(&self) -> ClusterResult<()> {
        let now = chrono::Utc::now();
        let timeout_duration = chrono::Duration::seconds(self.config.node_timeout_secs as i64);
        
        let mut nodes_to_remove = Vec::new();
        {
            let known_nodes = self.known_nodes.read().await;
            for (node_id, node_info) in known_nodes.iter() {
                if now.signed_duration_since(node_info.last_seen) > timeout_duration {
                    nodes_to_remove.push(*node_id);
                }
            }
        }

        for node_id in nodes_to_remove {
            self.remove_node(node_id, "timeout").await?;
        }

        Ok(())
    }

    /// Dispatch one received discovery message to its handler.
    ///
    /// `source` is the sender's address; it is only used to reply to
    /// discovery requests. The leave timestamp and the heartbeat term are
    /// ignored.
    ///
    /// # Errors
    ///
    /// Returns whatever error the selected handler reports.
    pub async fn handle_message(&self, source: &str, message: DiscoveryMessage) -> ClusterResult<()> {
        match message {
            DiscoveryMessage::NodeAnnouncement { node_info } => {
                self.handle_node_announcement(node_info).await
            }
            DiscoveryMessage::DiscoveryRequest { requester_id, timestamp } => {
                self.handle_discovery_request(source, requester_id, timestamp).await
            }
            DiscoveryMessage::DiscoveryResponse { requester_id, known_nodes, timestamp } => {
                self.handle_discovery_response(requester_id, known_nodes, timestamp).await
            }
            DiscoveryMessage::NodeLeave { node_id, reason, .. } => {
                self.handle_node_leave(node_id, &reason).await
            }
            DiscoveryMessage::Heartbeat { node_id, timestamp, .. } => {
                self.handle_heartbeat(node_id, timestamp).await
            }
        }
    }

    /// Record an announced node and notify callbacks.
    ///
    /// * Announcements about the local node are ignored.
    /// * An unknown node is inserted and reported via `on_node_joined`.
    /// * A known node is replaced only when the announcement carries a
    ///   strictly newer `last_seen`; callbacks then get `on_node_updated`.
    ///   Otherwise nothing happens.
    ///
    /// The node table lock is released before callbacks run.
    async fn handle_node_announcement(&self, node_info: NodeInfo) -> ClusterResult<()> {
        let node_id = node_info.node_id;

        // Our own announcement echoed back to us.
        if node_id == self.local_node_info.node_id {
            return Ok(());
        }

        // Update the table inside its own scope so the write lock is gone
        // by the time callbacks are invoked.
        let is_new_node = {
            let mut registry = self.known_nodes.write().await;
            match registry.get_mut(&node_id) {
                Some(current) => {
                    if current.last_seen >= node_info.last_seen {
                        // Not newer than what we already have.
                        return Ok(());
                    }
                    *current = node_info.clone();
                    false
                }
                None => {
                    registry.insert(node_id, node_info.clone());
                    true
                }
            }
        };

        if is_new_node {
            info!("Discovered new node: {}", node_id);
        }

        let listeners = self.callbacks.lock().await;
        for listener in listeners.iter() {
            if is_new_node {
                listener.on_node_joined(&node_info).await;
            } else {
                listener.on_node_updated(&node_info).await;
            }
        }

        Ok(())
    }

    /// Handle discovery request
    ///
    /// Replies to `source` with every node this node knows about plus the
    /// local node itself. Requests that originate from the local node are
    /// ignored. The response echoes the request's `timestamp`.
    ///
    /// The local node is never stored in `known_nodes`, so without adding it
    /// here a requester could not learn about the responder from the response
    /// (for example a node that only contacts a static seed would never
    /// discover that seed).
    ///
    /// # Errors
    ///
    /// Returns the network sender's error if the response cannot be sent.
    async fn handle_discovery_request(&self, source: &str, requester_id: Uuid, timestamp: chrono::DateTime<chrono::Utc>) -> ClusterResult<()> {
        if requester_id == self.local_node_info.node_id {
            return Ok(());
        }

        // Snapshot the table and release the read lock before any network I/O.
        let mut nodes: Vec<NodeInfo> = {
            let known_nodes = self.known_nodes.read().await;
            known_nodes.values().cloned().collect()
        };

        // Advertise ourselves with a fresh `last_seen`, so receivers neither
        // discard the entry as older than what they have nor expire it at once.
        let mut local_node = self.local_node_info.clone();
        local_node.last_seen = chrono::Utc::now();
        nodes.push(local_node);

        let response = DiscoveryMessage::DiscoveryResponse {
            requester_id,
            known_nodes: nodes,
            timestamp,
        };

        let sender = self.network_sender.lock().await;
        sender.send_discovery_message(source, response).await?;

        Ok(())
    }

    /// Merge the nodes listed in a discovery response.
    ///
    /// Responses addressed to another requester are ignored. Every listed
    /// node is processed exactly like a node announcement. The response
    /// timestamp is not used.
    ///
    /// # Errors
    ///
    /// Stops at, and returns, the first error from processing a listed node.
    async fn handle_discovery_response(&self, requester_id: Uuid, known_nodes: Vec<NodeInfo>, _timestamp: chrono::DateTime<chrono::Utc>) -> ClusterResult<()> {
        let addressed_to_us = requester_id == self.local_node_info.node_id;

        if addressed_to_us {
            for peer in known_nodes {
                self.handle_node_announcement(peer).await?;
            }
        }

        Ok(())
    }

    /// Process a leave notification by dropping the node from the known-node
    /// table; `reason` is forwarded to the `on_node_left` callbacks.
    async fn handle_node_leave(&self, node_id: Uuid, reason: &str) -> ClusterResult<()> {
        self.remove_node(node_id, reason).await?;
        Ok(())
    }

    /// Handle heartbeat
    async fn handle_heartbeat(&self, node_id: Uuid, timestamp: chrono::DateTime<chrono::Utc>) -> ClusterResult<()> {
        let mut known_nodes = self.known_nodes.write().await;
        
        if let Some(node_info) = known_nodes.get_mut(&node_id) {
            node_info.last_seen = timestamp;
        }

        Ok(())
    }

    /// Drop `node_id` from the known-node table and tell callbacks it left.
    ///
    /// Does nothing (no log, no callbacks) when the node is not in the table.
    /// The table lock is released before callbacks run. Always returns
    /// `Ok(())`.
    async fn remove_node(&self, node_id: Uuid, reason: &str) -> ClusterResult<()> {
        let mut registry = self.known_nodes.write().await;

        if registry.remove(&node_id).is_none() {
            return Ok(());
        }

        info!("Node {} left: {}", node_id, reason);
        drop(registry);

        // The callback list stays locked while the callbacks are awaited.
        for listener in self.callbacks.lock().await.iter() {
            listener.on_node_left(node_id, reason).await;
        }

        Ok(())
    }

    /// Register a callback for node join/update/leave events.
    ///
    /// Callbacks are appended, so they are invoked in registration order.
    pub async fn add_callback(&self, callback: Box<dyn NodeDiscoveryCallback + Send + Sync>) {
        self.callbacks.lock().await.push(callback);
    }

    /// Snapshot of every node currently in the known-node table.
    ///
    /// The result is a copy, in no particular order, and never contains the
    /// local node.
    pub async fn get_known_nodes(&self) -> Vec<NodeInfo> {
        let registry = self.known_nodes.read().await;
        registry.values().cloned().collect()
    }

    /// Look up a single node by ID.
    ///
    /// Returns a copy of the stored entry, or `None` if the node is unknown.
    pub async fn get_node_info(&self, node_id: Uuid) -> Option<NodeInfo> {
        let registry = self.known_nodes.read().await;
        registry.get(&node_id).cloned()
    }

    /// Broadcast that the local node is leaving the cluster.
    ///
    /// `reason` is carried in the message and surfaces in the receivers'
    /// `on_node_left` callbacks.
    ///
    /// # Errors
    ///
    /// Returns the network sender's error if the broadcast fails.
    pub async fn send_leave_notification(&self, reason: &str) -> ClusterResult<()> {
        let node_id = self.local_node_info.node_id;
        let message = DiscoveryMessage::NodeLeave {
            node_id,
            timestamp: chrono::Utc::now(),
            reason: reason.to_string(),
        };

        self.network_sender
            .lock()
            .await
            .broadcast_discovery_message(message)
            .await?;

        Ok(())
    }
}

impl Clone for NodeDiscovery {
    /// Produce a handle that shares state with `self`.
    ///
    /// The local node info and configuration are copied; the known-node
    /// table, the callback list and the network sender are shared through
    /// their `Arc`s.
    fn clone(&self) -> Self {
        // Destructuring makes the compiler flag any field added later.
        let Self {
            local_node_info,
            config,
            known_nodes,
            callbacks,
            network_sender,
        } = self;

        Self {
            local_node_info: local_node_info.clone(),
            config: config.clone(),
            known_nodes: Arc::clone(known_nodes),
            callbacks: Arc::clone(callbacks),
            network_sender: Arc::clone(network_sender),
        }
    }
}