nucleus/security/
seccomp_trace.rs1use crate::error::{NucleusError, Result};
13use serde::{Deserialize, Serialize};
14use std::collections::BTreeMap;
15use std::io::{BufRead, BufReader, Write};
16use std::path::{Path, PathBuf};
17use std::sync::atomic::{AtomicBool, Ordering};
18use std::sync::Arc;
19use std::thread::JoinHandle;
20use tracing::{debug, info, warn};
21
/// One aggregated entry of the seccomp trace output.
///
/// `write_trace_file` serializes one of these per distinct syscall number,
/// one JSON object per line.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct TraceRecord {
    /// Syscall number taken from the `syscall=` field of the audit record.
    pub syscall: i64,
    /// Name returned by `seccomp_generate::syscall_number_to_name` for
    /// `syscall`; `None` when that lookup yields nothing.
    pub name: Option<String>,
    /// How many matching audit records were seen for this syscall number.
    pub count: u64,
}
32
/// Handle to a background thread that collects seccomp audit records for a
/// single process and writes the aggregated result to a file.
pub struct SeccompTraceReader {
    /// PID whose audit records are counted.
    pid: u32,
    /// Destination of the trace file written by the worker thread.
    output_path: PathBuf,
    /// Set to `true` to ask the worker thread to leave its read loop.
    stop: Arc<AtomicBool>,
    /// Join handle of the worker thread; `None` until `start_recording` runs
    /// and again after the thread has been joined.
    handle: Option<JoinHandle<()>>,
}
40
41impl SeccompTraceReader {
42 pub fn new(pid: u32, output_path: &Path) -> Self {
44 Self {
45 pid,
46 output_path: output_path.to_path_buf(),
47 stop: Arc::new(AtomicBool::new(false)),
48 handle: None,
49 }
50 }
51
52 pub fn start_recording(&mut self) -> Result<()> {
57 let pid = self.pid;
58 let output_path = self.output_path.clone();
59 let stop = self.stop.clone();
60
61 let handle = std::thread::spawn(move || {
62 if let Err(e) = record_loop(pid, &output_path, &stop) {
63 warn!("Seccomp trace reader error: {}", e);
64 }
65 });
66
67 self.handle = Some(handle);
68 info!("Seccomp trace reader started for PID {}", self.pid);
69 Ok(())
70 }
71
72 pub fn stop_and_flush(mut self) {
74 self.stop.store(true, Ordering::Release);
75 if let Some(handle) = self.handle.take() {
76 let _ = handle.join();
77 }
78 info!(
79 "Seccomp trace reader stopped, output at {:?}",
80 self.output_path
81 );
82 }
83}
84
85impl Drop for SeccompTraceReader {
86 fn drop(&mut self) {
87 self.stop.store(true, Ordering::Release);
88 if let Some(handle) = self.handle.take() {
89 let _ = handle.join();
90 }
91 }
92}
93
94fn record_loop(pid: u32, output_path: &Path, stop: &AtomicBool) -> Result<()> {
96 let mut syscalls: BTreeMap<i64, u64> = BTreeMap::new();
97
98 let kmsg_path = std::path::Path::new("/dev/kmsg");
100 if let Ok(meta) = std::fs::symlink_metadata(kmsg_path) {
101 if meta.file_type().is_symlink() {
102 warn!("/dev/kmsg is a symlink — refusing to open for seccomp tracing");
103 write_trace_file(output_path, &syscalls)?;
104 return Ok(());
105 }
106 }
107
108 let file = match std::fs::File::open(kmsg_path) {
110 Ok(f) => f,
111 Err(e) => {
112 warn!(
113 "Cannot open /dev/kmsg for seccomp tracing: {} \
114 (requires root or CAP_SYSLOG). Falling back to no-trace mode.",
115 e
116 );
117 write_trace_file(output_path, &syscalls)?;
119 return Ok(());
120 }
121 };
122
123 use std::os::unix::io::AsRawFd;
128 let fd = file.as_raw_fd();
129 unsafe {
133 let flags = libc::fcntl(fd, libc::F_GETFL);
134 if flags >= 0 {
135 libc::fcntl(fd, libc::F_SETFL, flags | libc::O_NONBLOCK);
136 }
137 }
138
139 let reader = BufReader::new(file);
140 let pid_pattern = format!("pid={}", pid);
141
142 for line in reader.lines() {
143 if stop.load(Ordering::Acquire) {
144 break;
145 }
146
147 let line = match line {
148 Ok(l) => l,
149 Err(e) => {
150 if e.kind() == std::io::ErrorKind::WouldBlock {
151 let mut pfd = libc::pollfd {
153 fd,
154 events: libc::POLLIN,
155 revents: 0,
156 };
157 unsafe { libc::poll(&mut pfd, 1, 2000) };
160 continue;
161 }
162 debug!("kmsg read error: {}", e);
163 continue;
164 }
165 };
166
167 if line.contains("type=1326") && line.contains(&pid_pattern) {
170 if let Some(nr) = extract_syscall_nr(&line) {
171 *syscalls.entry(nr).or_insert(0) += 1;
172 }
173 }
174 }
175
176 write_trace_file(output_path, &syscalls)?;
177 info!("Seccomp trace: recorded {} unique syscalls", syscalls.len());
178 Ok(())
179}
180
/// Pulls the numeric value of the first `syscall=<n>` field out of an audit
/// line.
///
/// Fields are whitespace-separated. Returns `None` when no field starts with
/// `syscall=` or when the first such field does not parse as an `i64`.
fn extract_syscall_nr(line: &str) -> Option<i64> {
    let raw_value = line
        .split_whitespace()
        .find_map(|field| field.strip_prefix("syscall="))?;
    raw_value.parse().ok()
}
189
190fn write_trace_file(path: &Path, syscalls: &BTreeMap<i64, u64>) -> Result<()> {
192 let mut file = std::fs::File::create(path).map_err(|e| {
193 NucleusError::ConfigError(format!("Failed to create trace file {:?}: {}", path, e))
194 })?;
195
196 for (&nr, &count) in syscalls {
197 let record = TraceRecord {
198 syscall: nr,
199 name: super::seccomp_generate::syscall_number_to_name(nr).map(String::from),
200 count,
201 };
202 let line =
203 serde_json::to_string(&record).unwrap_or_else(|e| format!("{{\"error\":\"{}\"}}", e));
204 writeln!(file, "{}", line).map_err(|e| {
205 NucleusError::ConfigError(format!("Failed to write trace record: {}", e))
206 })?;
207 }
208
209 Ok(())
210}
211
#[cfg(test)]
mod tests {
    use super::*;

    /// A realistic kmsg seccomp audit line yields its `syscall=` number.
    #[test]
    fn test_extract_syscall_nr() {
        let line = "6,1234,5678,-;audit: type=1326 audit(123:456): auid=0 uid=0 gid=0 ses=1 pid=42 comm=\"test\" exe=\"/bin/test\" sig=0 arch=c000003e syscall=257 compat=0 ip=0x7f action=0x7fff0000";
        let parsed = extract_syscall_nr(line);
        assert_eq!(parsed, Some(257));
    }

    /// A line without a `syscall=` field yields `None`.
    #[test]
    fn test_extract_syscall_nr_missing() {
        let parsed = extract_syscall_nr("no syscall here");
        assert_eq!(parsed, None);
    }

    /// Returns the slice of `source` that starts at `fn_signature` and ends
    /// just after the brace that closes the first `{` following it.
    ///
    /// Braces are counted textually, so braces inside strings or comments
    /// take part in the matching as well.
    fn extract_fn_body<'a>(source: &'a str, fn_signature: &str) -> &'a str {
        let start = match source.find(fn_signature) {
            Some(idx) => idx,
            None => panic!("function '{}' not found in source", fn_signature),
        };
        let tail = &source[start..];
        let first_brace = match tail.find('{') {
            Some(idx) => idx,
            None => panic!("no opening brace found for '{}'", fn_signature),
        };

        let mut nesting = 0u32;
        let mut stop_at = first_brace;
        for (offset, c) in tail[first_brace..].char_indices() {
            if c == '{' {
                nesting += 1;
            } else if c == '}' {
                nesting -= 1;
                if nesting == 0 {
                    stop_at = first_brace + offset + 1;
                    break;
                }
            }
        }
        &tail[..stop_at]
    }

    /// Source-level guard: the kmsg loop must rely on O_NONBLOCK plus poll()
    /// and must not try socket options on the kmsg descriptor.
    #[test]
    fn test_reader_uses_nonblocking_io() {
        let source = include_str!("seccomp_trace.rs");
        let fn_body = extract_fn_body(source, "fn record_loop");

        let has_nonblock = fn_body.contains("O_NONBLOCK");
        assert!(
            has_nonblock,
            "record_loop must use O_NONBLOCK for non-blocking reads on /dev/kmsg"
        );

        let has_poll = fn_body.contains("libc::poll");
        assert!(
            has_poll,
            "record_loop must use poll() for timed waits on /dev/kmsg"
        );

        // Only non-comment lines count as real calls.
        let calls_setsockopt = fn_body
            .lines()
            .any(|l| !l.trim().starts_with("//") && l.contains("setsockopt"));
        assert!(
            !calls_setsockopt,
            "record_loop must not call setsockopt on /dev/kmsg"
        );
    }

    /// The serialized record exposes all three fields under their own names.
    #[test]
    fn test_trace_record_serialization() {
        let json = serde_json::to_string(&TraceRecord {
            syscall: 0,
            name: Some("read".to_string()),
            count: 42,
        })
        .unwrap();

        for fragment in ["\"syscall\":0", "\"name\":\"read\"", "\"count\":42"] {
            assert!(json.contains(fragment));
        }
    }
}