use anyhow::{Result, anyhow}; use std::path::Path; use std::fs; use std::time::{Duration, Instant}; use std::process::Command; use tracing::{debug, warn}; use std::sync::Mutex; use crate::sal::traits::{SensorBus, ActuatorBus, EnvironmentGuard, HardwareWatchdog, PreflightAuditor, AuditStep, AuditError, SafetyStatus}; use crate::sal::heuristic::discovery::SystemFactSheet; use crate::sal::heuristic::schema::HardwareDb; pub struct GenericLinuxSal { fact_sheet: SystemFactSheet, db: HardwareDb, suppressed_services: Mutex>, last_valid_temp: Mutex<(f32, Instant)>, current_pl1: Mutex, last_energy: Mutex<(u64, Instant)>, } impl GenericLinuxSal { pub fn new(facts: SystemFactSheet, db: HardwareDb) -> Self { Self { db, suppressed_services: Mutex::new(Vec::new()), last_valid_temp: Mutex::new((0.0, Instant::now())), current_pl1: Mutex::new(15.0), last_energy: Mutex::new((0, Instant::now())), fact_sheet: facts, } } fn is_dell(&self) -> bool { self.fact_sheet.vendor.to_lowercase().contains("dell") } /// Read sysfs safely. We removed the thread-per-read timeout logic /// as it was inefficient. sysfs reads are generally fast enough. fn read_sysfs(&self, path: &Path) -> Result { fs::read_to_string(path).map(|s| s.trim().to_string()).map_err(|e| anyhow!(e)) } } impl PreflightAuditor for GenericLinuxSal { fn audit(&self) -> Box + '_> { let mut steps = Vec::new(); for check in &self.db.preflight_checks { let status = Command::new("sh").arg("-c").arg(&check.check_cmd).status(); steps.push(AuditStep { description: check.name.clone(), outcome: match status { Ok(s) if s.success() => Ok(()), _ => Err(AuditError::KernelIncompatible(check.fail_help.clone())), } }); } for conflict_id in &self.fact_sheet.active_conflicts { if let Some(conflict) = self.db.conflicts.iter().find(|c| &c.id == conflict_id) { if conflict.severity == "Critical" { steps.push(AuditStep { description: format!("Conflict: {}", conflict.id), outcome: Err(AuditError::ToolMissing(conflict.help_text.clone())), }); } } } Box::new(steps.into_iter()) } } impl SensorBus for GenericLinuxSal { fn get_temp(&self) -> Result { let path = self.fact_sheet.temp_path.as_ref() .ok_or_else(|| anyhow!("No temperature sensor path found"))?; let content = self.read_sysfs(path)?; let temp = content.parse::()? / 1000.0; let mut last = self.last_valid_temp.lock().unwrap(); if (temp - last.0).abs() > 0.01 { *last = (temp, Instant::now()); } Ok(temp) } fn get_power_w(&self) -> Result { let rapl_path = self.fact_sheet.rapl_paths.first() .ok_or_else(|| anyhow!("No RAPL path found"))?; let energy_path = rapl_path.join("energy_uj"); let mut last = self.last_energy.lock().unwrap(); let e2: u64 = self.read_sysfs(&energy_path)?.parse()?; let t2 = Instant::now(); let (e1, t1) = *last; let delta_e = e2.wrapping_sub(e1); let delta_t = t2.duration_since(t1).as_secs_f32(); *last = (e2, t2); if delta_t < 0.01 { return Ok(0.0); } Ok((delta_e as f32 / 1_000_000.0) / delta_t) } fn get_fan_rpms(&self) -> Result> { let mut rpms = Vec::new(); for path in &self.fact_sheet.fan_paths { if let Ok(content) = self.read_sysfs(path) { if let Ok(rpm) = content.parse() { rpms.push(rpm); } } } Ok(rpms) } fn get_freq_mhz(&self) -> Result { let path = Path::new("/sys/devices/system/cpu/cpu0/cpufreq/scaling_cur_freq"); if path.exists() { Ok(self.read_sysfs(path)?.parse::()? / 1000.0) } else { let cpuinfo = fs::read_to_string("/proc/cpuinfo")?; for line in cpuinfo.lines() { if line.starts_with("cpu MHz") { if let Some((_, mhz)) = line.split_once(':') { return Ok(mhz.trim().parse()?); } } } Err(anyhow!("Could not determine CPU frequency")) } } } impl ActuatorBus for GenericLinuxSal { fn set_fan_mode(&self, mode: &str) -> Result<()> { if self.is_dell() { let cmd = match mode { "manual" | "max" => self.db.ecosystems.get("dell").and_then(|e| e.fan_manual_mode_cmd.as_ref()), "auto" => self.db.ecosystems.get("dell").and_then(|e| e.fan_auto_mode_cmd.as_ref()), _ => return Err(anyhow!("Unsupported fan mode: {}", mode)), }; if let Some(cmd_str) = cmd { let parts: Vec<&str> = cmd_str.split_whitespace().collect(); Command::new(parts[0]).args(&parts[1..]).status()?; Ok(()) } else { Err(anyhow!("Dell fan command missing")) } } else { Ok(()) } } fn set_sustained_power_limit(&self, watts: f32) -> Result<()> { let rapl_path = self.fact_sheet.rapl_paths.first().ok_or_else(|| anyhow!("No PL1 path"))?; fs::write(rapl_path.join("constraint_0_power_limit_uw"), ((watts * 1_000_000.0) as u64).to_string())?; *self.current_pl1.lock().unwrap() = watts; Ok(()) } fn set_burst_power_limit(&self, watts: f32) -> Result<()> { let rapl_path = self.fact_sheet.rapl_paths.first().ok_or_else(|| anyhow!("No PL2 path"))?; fs::write(rapl_path.join("constraint_1_power_limit_uw"), ((watts * 1_000_000.0) as u64).to_string())?; Ok(()) } } impl EnvironmentGuard for GenericLinuxSal { fn suppress(&self) -> Result<()> { let mut suppressed = self.suppressed_services.lock().unwrap(); for conflict_id in &self.fact_sheet.active_conflicts { if let Some(conflict) = self.db.conflicts.iter().find(|c| &c.id == conflict_id) { for service in &conflict.services { if Command::new("systemctl").arg("stop").arg(service).status()?.success() { suppressed.push(service.clone()); } } } } Ok(()) } fn restore(&self) -> Result<()> { let mut suppressed = self.suppressed_services.lock().unwrap(); for service in suppressed.drain(..) { let _ = Command::new("systemctl").arg("start").arg(service).status(); } if self.is_dell() { let _ = self.set_fan_mode("auto"); } Ok(()) } } impl HardwareWatchdog for GenericLinuxSal { fn get_safety_status(&self) -> Result { let temp = self.get_temp()?; if temp > 100.0 { return Ok(SafetyStatus::EmergencyAbort(format!("Thermal runaway: {:.1}°C", temp))); } let last = self.last_valid_temp.lock().unwrap(); if last.1.elapsed() > Duration::from_secs(5) { return Ok(SafetyStatus::EmergencyAbort("Temperature sensor stalled".to_string())); } Ok(SafetyStatus::Nominal) } } impl Drop for GenericLinuxSal { fn drop(&mut self) { let _ = self.restore(); } }