aboutsummaryrefslogtreecommitdiff
path: root/seaweedfs-rdma-sidecar/rdma-engine/src/main.rs
blob: 996d3a9d56f5e09c7fad73b14648e661d1fd7205 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
//! RDMA Engine Server
//!
//! High-performance RDMA engine server that communicates with the Go sidecar
//! via IPC and handles RDMA operations with zero-copy semantics.
//!
//! Usage:
//! ```bash
//! rdma-engine-server --device mlx5_0 --port 18515 --ipc-socket /tmp/rdma-engine.sock
//! ```

use clap::Parser;
use rdma_engine::{RdmaEngine, RdmaEngineConfig};
use std::path::PathBuf;
use tracing::{info, error};
use tracing_subscriber::{EnvFilter, fmt::layer, prelude::*};

// Command-line interface of the `rdma-engine-server` binary, parsed with clap's
// derive API.
//
// NOTE: the explanatory notes in this block are deliberately plain `//` comments.
// clap turns `///` doc comments on fields into `--help` text, so the existing
// `///` lines are user-facing strings and must only be edited when the help
// output is meant to change.
#[derive(Parser)]
#[command(
    name = "rdma-engine-server",
    about = "High-performance RDMA engine for SeaweedFS",
    version = env!("CARGO_PKG_VERSION")
)]
struct Args {
    // Copied into `RdmaEngineConfig::device_name` by `main`.
    // `short` with no value: clap derives the short flag from the field name (`-d`).
    /// UCX device name preference (e.g., mlx5_0, or 'auto' for UCX auto-selection)
    #[arg(short, long, default_value = "auto")]
    device: String,
    
    // Copied into `RdmaEngineConfig::port` by `main`. Short flag: `-p`.
    /// RDMA port number
    #[arg(short, long, default_value_t = 18515)]
    port: u16,
    
    // Copied into `RdmaEngineConfig::max_sessions` by `main`. Long flag only.
    /// Maximum number of concurrent sessions
    #[arg(long, default_value_t = 1000)]
    max_sessions: usize,
    
    // Copied into `RdmaEngineConfig::session_timeout_secs` by `main`.
    /// Session timeout in seconds
    #[arg(long, default_value_t = 300)]
    session_timeout: u64,
    
    // Default is 1024 * 1024 * 1024 bytes = 1 GiB.
    // Copied into `RdmaEngineConfig::buffer_size` by `main`.
    /// Memory buffer size in bytes
    #[arg(long, default_value_t = 1024 * 1024 * 1024)]
    buffer_size: usize,
    
    // `main` converts this with `to_string_lossy()` before storing it in
    // `RdmaEngineConfig::ipc_socket_path`, so non-UTF-8 path bytes are replaced.
    /// IPC socket path
    #[arg(long, default_value = "/tmp/rdma-engine.sock")]
    ipc_socket: PathBuf,
    
    // In `main` this only selects the fallback log filter ("debug" instead of
    // "info"); a filter taken from the environment is tried first. The flag is
    // also forwarded as `RdmaEngineConfig::debug`.
    /// Enable debug logging
    #[arg(long)]
    debug: bool,
    
    // Currently not loaded: `main` only logs the path (file loading is still a
    // TODO there). Short flag: `-c`.
    /// Configuration file path
    #[arg(short, long)]
    config: Option<PathBuf>,
}

#[tokio::main]
async fn main() -> anyhow::Result<()> {
    let args = Args::parse();
    
    // Initialize tracing
    let filter = if args.debug {
        EnvFilter::try_from_default_env()
            .or_else(|_| EnvFilter::try_new("debug"))
            .unwrap()
    } else {
        EnvFilter::try_from_default_env()
            .or_else(|_| EnvFilter::try_new("info"))
            .unwrap()
    };
    
    tracing_subscriber::registry()
        .with(layer().with_target(false))
        .with(filter)
        .init();
    
    info!("🚀 Starting SeaweedFS UCX RDMA Engine Server");
    info!("   Version: {}", env!("CARGO_PKG_VERSION"));
    info!("   UCX Device Preference: {}", args.device);
    info!("   Port: {}", args.port);
    info!("   Max Sessions: {}", args.max_sessions);
    info!("   Buffer Size: {} bytes", args.buffer_size);
    info!("   IPC Socket: {}", args.ipc_socket.display());
    info!("   Debug Mode: {}", args.debug);
    
    // Load configuration
    let config = RdmaEngineConfig {
        device_name: args.device,
        port: args.port,
        max_sessions: args.max_sessions,
        session_timeout_secs: args.session_timeout,
        buffer_size: args.buffer_size,
        ipc_socket_path: args.ipc_socket.to_string_lossy().to_string(),
        debug: args.debug,
    };
    
    // Override with config file if provided
    if let Some(config_path) = args.config {
        info!("Loading configuration from: {}", config_path.display());
        // TODO: Implement configuration file loading
    }
    
    // Create and run RDMA engine
    let mut engine = match RdmaEngine::new(config).await {
        Ok(engine) => {
            info!("✅ RDMA engine initialized successfully");
            engine
        }
        Err(e) => {
            error!("❌ Failed to initialize RDMA engine: {}", e);
            return Err(e);
        }
    };
    
    // Set up signal handlers for graceful shutdown
    let mut sigterm = tokio::signal::unix::signal(tokio::signal::unix::SignalKind::terminate())?;
    let mut sigint = tokio::signal::unix::signal(tokio::signal::unix::SignalKind::interrupt())?;
    
    // Run engine in background
    let engine_handle = tokio::spawn(async move {
        if let Err(e) = engine.run().await {
            error!("RDMA engine error: {}", e);
            return Err(e);
        }
        Ok(())
    });
    
    info!("🎯 RDMA engine is running and ready to accept connections");
    info!("   Send SIGTERM or SIGINT to shutdown gracefully");
    
    // Wait for shutdown signal
    tokio::select! {
        _ = sigterm.recv() => {
            info!("📡 Received SIGTERM, shutting down gracefully");
        }
        _ = sigint.recv() => {
            info!("📡 Received SIGINT (Ctrl+C), shutting down gracefully");
        }
        result = engine_handle => {
            match result {
                Ok(Ok(())) => info!("🏁 RDMA engine completed successfully"),
                Ok(Err(e)) => {
                    error!("❌ RDMA engine failed: {}", e);
                    return Err(e);
                }
                Err(e) => {
                    error!("❌ RDMA engine task panicked: {}", e);
                    return Err(anyhow::anyhow!("Engine task panicked: {}", e));
                }
            }
        }
    }
    
    info!("🛑 RDMA engine server shut down complete");
    Ok(())
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Explicit `--device`, `--port` and `--debug` flags must land in the
    /// corresponding `Args` fields.
    #[test]
    fn test_args_parsing() {
        let argv = [
            "rdma-engine-server",
            "--device",
            "mlx5_0",
            "--port",
            "18515",
            "--debug",
        ];

        let Args {
            device,
            port,
            debug,
            ..
        } = Args::try_parse_from(argv).unwrap();

        assert_eq!(device, "mlx5_0");
        assert_eq!(port, 18515);
        assert!(debug);
    }
}