Add responsive column visibility to service panel

Service panel now dynamically shows/hides columns based on terminal width: - ≥80 chars: All columns (Name, Status, RAM, Uptime, Restarts) - ≥60 chars: Hide Restarts only - ≥45 chars: Hide Uptime and Restarts - <45 chars: Minimal (Name and Status only) Improves dashboard usability on smaller terminal sizes.
Remove debug logging from disk collector
2025-11-30 10:50:08 +01:00 · 2025-11-30 00:44:38 +01:00 · 2025-11-30 00:35:19 +01:00 · 2025-11-30 00:14:25 +01:00 · 2025-11-29 23:51:43 +01:00 · 2025-11-29 23:25:17 +01:00
16 changed files with 549 additions and 281 deletions
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -327,9 +327,16 @@ Storage:
  ├─ ● Data_2: GGA04461 T: 28°C
  └─ ● Parity: WDZS8RY0 T: 29°C
 Backup:
 ● Repo: 4
  ├─ getea
  ├─ vaultwarden
  ├─ mysql
  └─ immich
 ● W800639Y W: 2%
  ├─ ● Backup: 2025-11-29T04:00:01.324623
  └─ ● Usage: 8% 70GB/916GB
 ● WD-WCC7K1234567 T: 32°C W: 12%
-  ├─ Last: 2h ago (12.3GB)
+  ├─ ● Backup: 2025-11-29T04:00:01.324623
  ├─ Next: in 22h
  └─ ● Usage: 45% 678GB/1.5TB
 ```
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -279,7 +279,7 @@ checksum = "a1d728cc89cf3aee9ff92b05e62b19ee65a02b5702cff7d5a377e32c6ae29d8d"
 [[package]]
 name = "cm-dashboard"
-version = "0.1.205"
+version = "0.1.226"
 dependencies = [
 "anyhow",
 "chrono",
@@ -301,7 +301,7 @@ dependencies = [
 [[package]]
 name = "cm-dashboard-agent"
-version = "0.1.205"
+version = "0.1.226"
 dependencies = [
 "anyhow",
 "async-trait",
@@ -309,6 +309,7 @@ dependencies = [
 "chrono-tz",
 "clap",
 "cm-dashboard-shared",
 "futures",
 "gethostname",
 "lettre",
 "reqwest",
@@ -324,7 +325,7 @@ dependencies = [
 [[package]]
 name = "cm-dashboard-shared"
-version = "0.1.205"
+version = "0.1.226"
 dependencies = [
 "chrono",
 "serde",
@@ -552,6 +553,21 @@ dependencies = [
 "percent-encoding",
 ]
 [[package]]
 name = "futures"
 version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "65bc07b1a8bc7c85c5f2e110c476c7389b4554ba72af57d8445ea63a576b0876"
 dependencies = [
 "futures-channel",
 "futures-core",
 "futures-executor",
 "futures-io",
 "futures-sink",
 "futures-task",
 "futures-util",
 ]
 [[package]]
 name = "futures-channel"
 version = "0.3.31"
@@ -559,6 +575,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "2dff15bf788c671c1934e366d07e30c1814a8ef514e1af724a602e8a2fbe1b10"
 dependencies = [
 "futures-core",
 "futures-sink",
 ]
 [[package]]
@@ -567,12 +584,34 @@ version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "05f29059c0c2090612e8d742178b0580d2dc940c837851ad723096f87af6663e"
 [[package]]
 name = "futures-executor"
 version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1e28d1d997f585e54aebc3f97d39e72338912123a67330d723fdbb564d646c9f"
 dependencies = [
 "futures-core",
 "futures-task",
 "futures-util",
 ]
 [[package]]
 name = "futures-io"
 version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "9e5c1b78ca4aae1ac06c48a526a655760685149f0d465d21f37abfe57ce075c6"
 [[package]]
 name = "futures-macro"
 version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "162ee34ebcb7c64a8abebc059ce0fee27c2262618d7b60ed8faf72fef13c3650"
 dependencies = [
 "proc-macro2",
 "quote",
 "syn",
 ]
 [[package]]
 name = "futures-sink"
 version = "0.3.31"
@@ -591,8 +630,11 @@ version = "0.3.31"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "9fa08315bb612088cc391249efdc3bc77536f16c91f6cf495e6fbe85b20a4a81"
 dependencies = [
 "futures-channel",
 "futures-core",
 "futures-io",
 "futures-macro",
 "futures-sink",
 "futures-task",
 "memchr",
 "pin-project-lite",
--- a/agent/Cargo.toml
+++ b/agent/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "cm-dashboard-agent"
-version = "0.1.206"
+version = "0.1.227"
 edition = "2021"
 [dependencies]
@@ -20,4 +20,5 @@ gethostname = { workspace = true }
 chrono-tz = "0.8"
 toml = { workspace = true }
 async-trait = "0.1"
-reqwest = { version = "0.11", features = ["json", "blocking"] }
+reqwest = { version = "0.11", features = ["json", "blocking"] }
 futures = "0.3"
--- a/agent/src/agent.rs
+++ b/agent/src/agent.rs
@@ -114,7 +114,7 @@ impl Agent {
        // Set up intervals
        let mut transmission_interval = interval(Duration::from_secs(
-            self.config.collection_interval_seconds,
+            self.config.zmq.transmission_interval_seconds,
        ));
        let mut notification_interval = interval(Duration::from_secs(30)); // Check notifications every 30s
--- a/agent/src/collectors/backup.rs
+++ b/agent/src/collectors/backup.rs
@@ -1,36 +1,66 @@
 use async_trait::async_trait;
-use cm_dashboard_shared::{AgentData, BackupData, BackupDiskData};
+use cm_dashboard_shared::{AgentData, BackupData, BackupDiskData, Status};
 use serde::{Deserialize, Serialize};
-use std::collections::HashMap;
+use std::collections::{HashMap, HashSet};
 use std::fs;
-use std::path::Path;
+use std::path::{Path, PathBuf};
-use tracing::debug;
+use tracing::{debug, warn};
 use super::{Collector, CollectorError};
 /// Backup collector that reads backup status from TOML files with structured data output
 pub struct BackupCollector {
-    /// Path to backup status file
+    /// Directory containing backup status files
-    status_file_path: String,
+    status_dir: String,
 }
 impl BackupCollector {
    pub fn new() -> Self {
        Self {
-            status_file_path: "/var/lib/backup/backup-status.toml".to_string(),
+            status_dir: "/var/lib/backup/status".to_string(),
        }
    }
-    /// Read backup status from TOML file
+    /// Scan directory for all backup status files
-    async fn read_backup_status(&self) -> Result<Option<BackupStatusToml>, CollectorError> {
+    async fn scan_status_files(&self) -> Result<Vec<PathBuf>, CollectorError> {
-        if !Path::new(&self.status_file_path).exists() {
+        let status_path = Path::new(&self.status_dir);
-            debug!("Backup status file not found: {}", self.status_file_path);
+
-            return Ok(None);
+        if !status_path.exists() {
            debug!("Backup status directory not found: {}", self.status_dir);
            return Ok(Vec::new());
        }
-        let content = fs::read_to_string(&self.status_file_path)
+        let mut status_files = Vec::new();
        match fs::read_dir(status_path) {
            Ok(entries) => {
                for entry in entries {
                    if let Ok(entry) = entry {
                        let path = entry.path();
                        if path.is_file() {
                            if let Some(filename) = path.file_name().and_then(|n| n.to_str()) {
                                if filename.starts_with("backup-status-") && filename.ends_with(".toml") {
                                    status_files.push(path);
                                }
                            }
                        }
                    }
                }
            }
            Err(e) => {
                warn!("Failed to read backup status directory: {}", e);
                return Ok(Vec::new());
            }
        }
        Ok(status_files)
    }
    /// Read a single backup status file
    async fn read_status_file(&self, path: &Path) -> Result<BackupStatusToml, CollectorError> {
        let content = fs::read_to_string(path)
            .map_err(|e| CollectorError::SystemRead {
-                path: self.status_file_path.clone(),
+                path: path.to_string_lossy().to_string(),
                error: e.to_string(),
            })?;
@@ -40,66 +70,122 @@ impl BackupCollector {
                error: format!("Failed to parse backup status TOML: {}", e),
            })?;
-        Ok(Some(status))
+        Ok(status)
    }
    /// Calculate backup status from TOML status field
    fn calculate_backup_status(status_str: &str) -> Status {
        match status_str.to_lowercase().as_str() {
            "success" => Status::Ok,
            "warning" => Status::Warning,
            "failed" | "error" => Status::Critical,
            _ => Status::Unknown,
        }
    }
    /// Calculate usage status from disk usage percentage
    fn calculate_usage_status(usage_percent: f32) -> Status {
        if usage_percent < 80.0 {
            Status::Ok
        } else if usage_percent < 90.0 {
            Status::Warning
        } else {
            Status::Critical
        }
    }
    /// Convert BackupStatusToml to BackupData and populate AgentData
    async fn populate_backup_data(&self, agent_data: &mut AgentData) -> Result<(), CollectorError> {
-        if let Some(backup_status) = self.read_backup_status().await? {
+        let status_files = self.scan_status_files().await?;
            // Use raw start_time string from TOML
-            // Extract disk information
+        if status_files.is_empty() {
-            let repository_disk = if let Some(disk_space) = &backup_status.disk_space {
+            debug!("No backup status files found");
                Some(BackupDiskData {
                    serial: backup_status.disk_serial_number.clone().unwrap_or_else(|| "Unknown".to_string()),
                    usage_percent: disk_space.usage_percent as f32,
                    used_gb: disk_space.used_gb as f32,
                    total_gb: disk_space.total_gb as f32,
                    wear_percent: backup_status.disk_wear_percent,
                    temperature_celsius: None, // Not available in current TOML
                })
            } else if let Some(serial) = &backup_status.disk_serial_number {
                // Fallback: create minimal disk info if we have serial but no disk_space
                Some(BackupDiskData {
                    serial: serial.clone(),
                    usage_percent: 0.0,
                    used_gb: 0.0,
                    total_gb: 0.0,
                    wear_percent: backup_status.disk_wear_percent,
                    temperature_celsius: None,
                })
            } else {
                None
            };
            // Calculate total repository size from services
            let total_size_gb = backup_status.services
                .values()
                .map(|service| service.repo_size_bytes as f32 / (1024.0 * 1024.0 * 1024.0))
                .sum::<f32>();
            let backup_data = BackupData {
                status: backup_status.status,
                total_size_gb: Some(total_size_gb),
                repository_health: Some("ok".to_string()), // Derive from status if needed
                repository_disk,
                last_backup_size_gb: None, // Not available in current TOML format
                start_time_raw: Some(backup_status.start_time),
            };
            agent_data.backup = backup_data;
        } else {
            // No backup status available - set default values
            agent_data.backup = BackupData {
-                status: "unavailable".to_string(),
+                repositories: Vec::new(),
-                total_size_gb: None,
+                repository_status: Status::Unknown,
-                repository_health: None,
+                disks: Vec::new(),
                repository_disk: None,
                last_backup_size_gb: None,
                start_time_raw: None,
            };
            return Ok(());
        }
        let mut all_repositories = HashSet::new();
        let mut disks = Vec::new();
        let mut worst_status = Status::Ok;
        for status_file in status_files {
            match self.read_status_file(&status_file).await {
                Ok(backup_status) => {
                    // Collect all service names
                    for service_name in backup_status.services.keys() {
                        all_repositories.insert(service_name.clone());
                    }
                    // Calculate backup status
                    let backup_status_enum = Self::calculate_backup_status(&backup_status.status);
                    // Calculate usage status from disk space
                    let (usage_percent, used_gb, total_gb, usage_status) = if let Some(disk_space) = &backup_status.disk_space {
                        let usage_pct = disk_space.usage_percent as f32;
                        (
                            usage_pct,
                            disk_space.used_gb as f32,
                            disk_space.total_gb as f32,
                            Self::calculate_usage_status(usage_pct),
                        )
                    } else {
                        (0.0, 0.0, 0.0, Status::Unknown)
                    };
                    // Update worst status
                    worst_status = worst_status.max(backup_status_enum).max(usage_status);
                    // Build service list for this disk
                    let services: Vec<String> = backup_status.services.keys().cloned().collect();
                    // Get min and max archive counts to detect inconsistencies
                    let archives_min: i64 = backup_status.services.values()
                        .map(|service| service.archive_count)
                        .min()
                        .unwrap_or(0);
                    let archives_max: i64 = backup_status.services.values()
                        .map(|service| service.archive_count)
                        .max()
                        .unwrap_or(0);
                    // Create disk data
                    let disk_data = BackupDiskData {
                        serial: backup_status.disk_serial_number.unwrap_or_else(|| "Unknown".to_string()),
                        product_name: backup_status.disk_product_name,
                        wear_percent: backup_status.disk_wear_percent,
                        temperature_celsius: None, // Not available in current TOML
                        last_backup_time: Some(backup_status.start_time),
                        backup_status: backup_status_enum,
                        disk_usage_percent: usage_percent,
                        disk_used_gb: used_gb,
                        disk_total_gb: total_gb,
                        usage_status,
                        services,
                        archives_min,
                        archives_max,
                    };
                    disks.push(disk_data);
                }
                Err(e) => {
                    warn!("Failed to read backup status file {:?}: {}", status_file, e);
                }
            }
        }
        let repositories: Vec<String> = all_repositories.into_iter().collect();
        agent_data.backup = BackupData {
            repositories,
            repository_status: worst_status,
            disks,
        };
        Ok(())
    }
 }
--- a/agent/src/collectors/cpu.rs
+++ b/agent/src/collectors/cpu.rs
@@ -119,36 +119,69 @@ impl CpuCollector {
        utils::parse_u64(content.trim())
    }
-    /// Collect CPU frequency and populate AgentData
+    /// Collect CPU C-state (idle depth) and populate AgentData with top 3 C-states by usage
-    async fn collect_frequency(&self, agent_data: &mut AgentData) -> Result<(), CollectorError> {
+    async fn collect_cstate(&self, agent_data: &mut AgentData) -> Result<(), CollectorError> {
-        // Try scaling frequency first (more accurate for current frequency)
+        // Read C-state usage from first CPU (representative of overall system)
-        if let Ok(freq) =
+        // C-states indicate CPU idle depth: C1=light sleep, C6=deep sleep, C10=deepest
            utils::read_proc_file("/sys/devices/system/cpu/cpu0/cpufreq/scaling_cur_freq")
        {
            if let Ok(freq_khz) = utils::parse_u64(freq.trim()) {
                let freq_mhz = freq_khz as f32 / 1000.0;
                agent_data.system.cpu.frequency_mhz = freq_mhz;
                return Ok(());
            }
        }
-        // Fallback: parse /proc/cpuinfo for base frequency
+        let mut cstate_times: Vec<(String, u64)> = Vec::new();
-        if let Ok(content) = utils::read_proc_file("/proc/cpuinfo") {
+        let mut total_time: u64 = 0;
-            for line in content.lines() {
+
-                if line.starts_with("cpu MHz") {
+        // Collect all C-state times from CPU0
-                    if let Some(freq_str) = line.split(':').nth(1) {
+        for state_num in 0..=10 {
-                        if let Ok(freq_mhz) = utils::parse_f32(freq_str) {
+            let time_path = format!("/sys/devices/system/cpu/cpu0/cpuidle/state{}/time", state_num);
-                            agent_data.system.cpu.frequency_mhz = freq_mhz;
+            let name_path = format!("/sys/devices/system/cpu/cpu0/cpuidle/state{}/name", state_num);
-                            return Ok(());
+
            if let Ok(time_str) = utils::read_proc_file(&time_path) {
                if let Ok(time) = utils::parse_u64(time_str.trim()) {
                    if let Ok(name) = utils::read_proc_file(&name_path) {
                        let state_name = name.trim();
                        // Skip POLL state (not real idle)
                        if state_name != "POLL" && time > 0 {
                            // Extract "C" + digits pattern (C3, C10, etc.) to reduce JSON size
                            // Handles formats like "C3_ACPI", "C10_MWAIT", etc.
                            let clean_name = if let Some(c_pos) = state_name.find('C') {
                                let rest = &state_name[c_pos + 1..];
                                let digit_count = rest.chars().take_while(|c| c.is_ascii_digit()).count();
                                if digit_count > 0 {
                                    state_name[c_pos..c_pos + 1 + digit_count].to_string()
                                } else {
                                    state_name.to_string()
                                }
                            } else {
                                state_name.to_string()
                            };
                            cstate_times.push((clean_name, time));
                            total_time += time;
                        }
                    }
                    break; // Only need first CPU entry
                }
            } else {
                // No more states available
                break;
            }
        }
-        debug!("CPU frequency not available");
+        // Sort by time descending to get top 3
-        // Leave frequency as 0.0 if not available
+        cstate_times.sort_by(|a, b| b.1.cmp(&a.1));
        // Calculate percentages for top 3 and populate AgentData
        agent_data.system.cpu.cstates = cstate_times
            .iter()
            .take(3)
            .map(|(name, time)| {
                let percent = if total_time > 0 {
                    (*time as f32 / total_time as f32) * 100.0
                } else {
                    0.0
                };
                cm_dashboard_shared::CStateInfo {
                    name: name.clone(),
                    percent,
                }
            })
            .collect();
        Ok(())
    }
 }
@@ -165,8 +198,8 @@ impl Collector for CpuCollector {
        // Collect temperature (optional)
        self.collect_temperature(agent_data).await?;
-        // Collect frequency (optional)
+        // Collect C-state (CPU idle depth)
-        self.collect_frequency(agent_data).await?;
+        self.collect_cstate(agent_data).await?;
        let duration = start.elapsed();
        debug!("CPU collection completed in {:?}", duration);
--- a/agent/src/collectors/disk.rs
+++ b/agent/src/collectors/disk.rs
@@ -3,10 +3,9 @@ use async_trait::async_trait;
 use cm_dashboard_shared::{AgentData, DriveData, FilesystemData, PoolData, HysteresisThresholds, Status};
 use crate::config::DiskConfig;
-use std::process::Command;
+use tokio::process::Command as TokioCommand;
-use std::time::Instant;
+use std::process::Command as StdCommand;
 use std::collections::HashMap;
 use tracing::debug;
 use super::{Collector, CollectorError};
@@ -67,9 +66,6 @@ impl DiskCollector {
    /// Collect all storage data and populate AgentData
    async fn collect_storage_data(&self, agent_data: &mut AgentData) -> Result<(), CollectorError> {
        let start_time = Instant::now();
        debug!("Starting clean storage collection");
        // Step 1: Get mount points and their backing devices
        let mount_devices = self.get_mount_devices().await?;
@@ -104,9 +100,6 @@ impl DiskCollector {
        self.populate_drives_data(&physical_drives, &smart_data, agent_data)?;
        self.populate_pools_data(&mergerfs_pools, &smart_data, agent_data)?;
        let elapsed = start_time.elapsed();
        debug!("Storage collection completed in {:?}", elapsed);
        Ok(())
    }
@@ -114,7 +107,7 @@ impl DiskCollector {
    async fn get_mount_devices(&self) -> Result<HashMap<String, String>, CollectorError> {
        use super::run_command_with_timeout;
-        let mut cmd = Command::new("lsblk");
+        let mut cmd = TokioCommand::new("lsblk");
        cmd.args(&["-rn", "-o", "NAME,MOUNTPOINT"]);
        let output = run_command_with_timeout(cmd, 2).await
@@ -141,7 +134,6 @@ impl DiskCollector {
            }
        }
        debug!("Found {} mounted block devices", mount_devices.len());
        Ok(mount_devices)
    }
@@ -154,8 +146,8 @@ impl DiskCollector {
                Ok((total, used)) => {
                    filesystem_usage.insert(mount_point.clone(), (total, used));
                }
-                Err(e) => {
+                Err(_e) => {
-                    debug!("Failed to get filesystem info for {}: {}", mount_point, e);
+                    // Silently skip filesystems we can't read
                }
            }
        }
@@ -176,8 +168,6 @@ impl DiskCollector {
                // Only add if we don't already have usage data for this mount point
                if !filesystem_usage.contains_key(&mount_point) {
                    if let Ok((total, used)) = self.get_filesystem_info(&mount_point) {
                        debug!("Added MergerFS filesystem usage for {}: {}GB total, {}GB used", 
                            mount_point, total as f32 / (1024.0 * 1024.0 * 1024.0), used as f32 / (1024.0 * 1024.0 * 1024.0));
                        filesystem_usage.insert(mount_point, (total, used));
                    }
                }
@@ -189,7 +179,7 @@ impl DiskCollector {
    /// Get filesystem info for a single mount point
    fn get_filesystem_info(&self, mount_point: &str) -> Result<(u64, u64), CollectorError> {
-        let output = std::process::Command::new("timeout")
+        let output = StdCommand::new("timeout")
            .args(&["2", "df", "--block-size=1", mount_point])
            .output()
            .map_err(|e| CollectorError::SystemRead {
@@ -252,9 +242,8 @@ impl DiskCollector {
                } else {
                    mount_point.trim_start_matches('/').replace('/', "_")
                };
-                
+
                if pool_name.is_empty() {
                    debug!("Skipping mergerfs pool with empty name: {}", mount_point);
                    continue;
                }
@@ -282,8 +271,7 @@ impl DiskCollector {
                // Categorize as data vs parity drives
                let (data_drives, parity_drives) = match self.categorize_pool_drives(&all_member_paths) {
                    Ok(drives) => drives,
-                    Err(e) => {
+                    Err(_e) => {
                        debug!("Failed to categorize drives for pool {}: {}. Skipping.", mount_point, e);
                        continue;
                    }
                };
@@ -298,8 +286,7 @@ impl DiskCollector {
                });
            }
        }
-        
+
        debug!("Found {} mergerfs pools", pools.len());
        Ok(pools)
    }
@@ -386,9 +373,9 @@ impl DiskCollector {
        device.to_string()
    }
-    /// Get SMART data for drives
+    /// Get SMART data for drives in parallel
    async fn get_smart_data_for_drives(&self, physical_drives: &[PhysicalDrive], mergerfs_pools: &[MergerfsPool]) -> HashMap<String, SmartData> {
-        let mut smart_data = HashMap::new();
+        use futures::future::join_all;
        // Collect all drive names
        let mut all_drives = std::collections::HashSet::new();
@@ -404,9 +391,24 @@ impl DiskCollector {
            }
        }
-        // Get SMART data for each drive
+        // Collect SMART data for all drives in parallel
-        for drive_name in all_drives {
+        let futures: Vec<_> = all_drives
-            if let Ok(data) = self.get_smart_data(&drive_name).await {
+            .iter()
            .map(|drive_name| {
                let drive = drive_name.clone();
                async move {
                    let result = self.get_smart_data(&drive).await;
                    (drive, result)
                }
            })
            .collect();
        let results = join_all(futures).await;
        // Build HashMap from results
        let mut smart_data = HashMap::new();
        for (drive_name, result) in results {
            if let Ok(data) = result {
                smart_data.insert(drive_name, data);
            }
        }
@@ -420,7 +422,7 @@ impl DiskCollector {
        // Use direct smartctl (no sudo) - service has CAP_SYS_RAWIO and CAP_SYS_ADMIN capabilities
        // For NVMe drives, specify device type explicitly
-        let mut cmd = Command::new("smartctl");
+        let mut cmd = TokioCommand::new("smartctl");
        if drive_name.starts_with("nvme") {
            cmd.args(&["-d", "nvme", "-a", &format!("/dev/{}", drive_name)]);
        } else {
@@ -435,8 +437,10 @@ impl DiskCollector {
        let output_str = String::from_utf8_lossy(&output.stdout);
-        if !output.status.success() {
+        // Note: smartctl returns non-zero exit codes for warnings (like exit code 32
-            // Return unknown data rather than failing completely
+        // for "temperature was high in the past"), but the output data is still valid.
        // Only check if we got any output at all, don't reject based on exit code.
        if output_str.is_empty() {
            return Ok(SmartData {
                health: "UNKNOWN".to_string(),
                serial_number: None,
@@ -444,7 +448,7 @@ impl DiskCollector {
                wear_percent: None,
            });
        }
-        
+
        let mut health = "UNKNOWN".to_string();
        let mut serial_number = None;
        let mut temperature = None;
@@ -763,7 +767,7 @@ impl DiskCollector {
    /// Get drive information for a mount path
    fn get_drive_info_for_path(&self, path: &str) -> anyhow::Result<PoolDrive> {
        // Use lsblk to find the backing device with timeout
-        let output = Command::new("timeout")
+        let output = StdCommand::new("timeout")
            .args(&["2", "lsblk", "-rn", "-o", "NAME,MOUNTPOINT"])
            .output()
            .map_err(|e| anyhow::anyhow!("Failed to run lsblk: {}", e))?;
@@ -785,20 +789,13 @@ impl DiskCollector {
        // Extract base device name (e.g., "sda1" -> "sda")
        let base_device = self.extract_base_device(&format!("/dev/{}", device));
-        
+
-        // Get temperature from SMART data if available
+        // Temperature will be filled in later from parallel SMART collection
-        let temperature = if let Ok(smart_data) = tokio::task::block_in_place(|| {
+        // Don't collect it here to avoid sequential blocking with problematic async nesting
            tokio::runtime::Handle::current().block_on(self.get_smart_data(&base_device))
        }) {
            smart_data.temperature_celsius
        } else {
            None
        };
        Ok(PoolDrive {
            name: base_device,
            mount_point: path.to_string(),
-            temperature_celsius: temperature,
+            temperature_celsius: None,
        })
    }
--- a/agent/src/collectors/mod.rs
+++ b/agent/src/collectors/mod.rs
@@ -1,8 +1,7 @@
 use async_trait::async_trait;
 use cm_dashboard_shared::{AgentData};
-use std::process::{Command, Output};
+use std::process::Output;
 use std::time::Duration;
 use tokio::time::timeout;
 pub mod backup;
 pub mod cpu;
@@ -16,16 +15,34 @@ pub mod systemd;
 pub use error::CollectorError;
 /// Run a command with a timeout to prevent blocking
-pub async fn run_command_with_timeout(mut cmd: Command, timeout_secs: u64) -> std::io::Result<Output> {
+/// Properly kills the process if timeout is exceeded
 pub async fn run_command_with_timeout(mut cmd: tokio::process::Command, timeout_secs: u64) -> std::io::Result<Output> {
    use tokio::time::timeout;
    use std::process::Stdio;
    let timeout_duration = Duration::from_secs(timeout_secs);
-    match timeout(timeout_duration, tokio::task::spawn_blocking(move || cmd.output())).await {
+    // Configure stdio to capture output
-        Ok(Ok(result)) => result,
+    cmd.stdout(Stdio::piped());
-        Ok(Err(e)) => Err(std::io::Error::new(std::io::ErrorKind::Other, e)),
+    cmd.stderr(Stdio::piped());
-        Err(_) => Err(std::io::Error::new(
+
-            std::io::ErrorKind::TimedOut,
+    let child = cmd.spawn()?;
-            format!("Command timed out after {} seconds", timeout_secs)
+    let pid = child.id();
-        )),
+
    match timeout(timeout_duration, child.wait_with_output()).await {
        Ok(result) => result,
        Err(_) => {
            // Timeout - force kill the process using system kill command
            if let Some(process_id) = pid {
                let _ = tokio::process::Command::new("kill")
                    .args(&["-9", &process_id.to_string()])
                    .output()
                    .await;
            }
            Err(std::io::Error::new(
                std::io::ErrorKind::TimedOut,
                format!("Command timed out after {} seconds", timeout_secs)
            ))
        }
    }
 }
--- a/agent/src/collectors/systemd.rs
+++ b/agent/src/collectors/systemd.rs
@@ -353,16 +353,12 @@ impl SystemdCollector {
        Ok((services, status_cache))
    }
-    /// Get service status from cache (if available) or fallback to systemctl
+    /// Get service status with detailed metrics from systemctl
    fn get_service_status(&self, service: &str) -> Result<ServiceStatusInfo> {
-        // Try to get status from cache first
+        // Always fetch fresh data to get detailed metrics (memory, restarts, uptime)
-        if let Ok(state) = self.state.read() {
+        // Note: Cache in service_status_cache only has basic active_state from discovery,
-            if let Some(cached_info) = state.service_status_cache.get(service) {
+        // with all detailed metrics set to None. We need fresh systemctl show data.
                return Ok(cached_info.clone());
            }
        }
        // Fallback to systemctl if not in cache (with 2 second timeout)
        let output = Command::new("timeout")
            .args(&[
                "2",
--- a/agent/src/config/mod.rs
+++ b/agent/src/config/mod.rs
@@ -13,7 +13,6 @@ pub struct AgentConfig {
    pub collectors: CollectorConfig,
    pub cache: CacheConfig,
    pub notifications: NotificationConfig,
    pub collection_interval_seconds: u64,
 }
 /// ZMQ communication configuration
--- a/agent/src/config/validation.rs
+++ b/agent/src/config/validation.rs
@@ -11,9 +11,9 @@ pub fn validate_config(config: &AgentConfig) -> Result<()> {
        bail!("ZMQ bind address cannot be empty");
    }
-    // Validate collection interval
+    // Validate ZMQ transmission interval
-    if config.collection_interval_seconds == 0 {
+    if config.zmq.transmission_interval_seconds == 0 {
-        bail!("Collection interval cannot be 0");
+        bail!("ZMQ transmission interval cannot be 0");
    }
    // Validate CPU thresholds
--- a/dashboard/Cargo.toml
+++ b/dashboard/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "cm-dashboard"
-version = "0.1.206"
+version = "0.1.227"
 edition = "2021"
 [dependencies]
--- a/dashboard/src/ui/widgets/services.rs
+++ b/dashboard/src/ui/widgets/services.rs
@@ -11,6 +11,59 @@ use tracing::debug;
 use crate::ui::theme::{Components, StatusIcons, Theme, Typography};
 use ratatui::style::Style;
 /// Column visibility configuration based on terminal width
 #[derive(Debug, Clone, Copy)]
 struct ColumnVisibility {
    show_name: bool,
    show_status: bool,
    show_ram: bool,
    show_uptime: bool,
    show_restarts: bool,
 }
 impl ColumnVisibility {
    /// Determine which columns to show based on available width
    fn from_width(width: u16) -> Self {
        if width >= 80 {
            // Full layout: Name (25) + Status (10) + RAM (8) + Uptime (8) + Restarts (5) = 56 chars
            Self {
                show_name: true,
                show_status: true,
                show_ram: true,
                show_uptime: true,
                show_restarts: true,
            }
        } else if width >= 60 {
            // Hide restarts: Name (25) + Status (10) + RAM (8) + Uptime (8) = 51 chars
            Self {
                show_name: true,
                show_status: true,
                show_ram: true,
                show_uptime: true,
                show_restarts: false,
            }
        } else if width >= 45 {
            // Hide uptime and restarts: Name (25) + Status (10) + RAM (8) = 43 chars
            Self {
                show_name: true,
                show_status: true,
                show_ram: true,
                show_uptime: false,
                show_restarts: false,
            }
        } else {
            // Minimal: Name (25) + Status (10) = 35 chars
            Self {
                show_name: true,
                show_status: true,
                show_ram: false,
                show_uptime: false,
                show_restarts: false,
            }
        }
    }
 }
 /// Services widget displaying hierarchical systemd service statuses
 #[derive(Clone)]
 pub struct ServicesWidget {
@@ -76,7 +129,7 @@ impl ServicesWidget {
    }
    /// Format parent service line - returns text without icon for span formatting
-    fn format_parent_service_line(&self, name: &str, info: &ServiceInfo) -> String {
+    fn format_parent_service_line(&self, name: &str, info: &ServiceInfo, columns: ColumnVisibility) -> String {
        // Truncate long service names to fit layout (account for icon space)
        let short_name = if name.len() > 22 {
            format!("{}...", &name[..19])
@@ -129,10 +182,25 @@ impl ServicesWidget {
            }
        });
-        format!(
+        // Build format string based on column visibility
-            "{:<23} {:<10} {:<8} {:<8} {:<5}",
+        let mut parts = Vec::new();
-            short_name, status_str, memory_str, uptime_str, restart_str
+        if columns.show_name {
-        )
+            parts.push(format!("{:<23}", short_name));
        }
        if columns.show_status {
            parts.push(format!("{:<10}", status_str));
        }
        if columns.show_ram {
            parts.push(format!("{:<8}", memory_str));
        }
        if columns.show_uptime {
            parts.push(format!("{:<8}", uptime_str));
        }
        if columns.show_restarts {
            parts.push(format!("{:<5}", restart_str));
        }
        parts.join(" ")
    }
@@ -476,11 +544,28 @@ impl ServicesWidget {
            .constraints([Constraint::Length(1), Constraint::Min(0)])
            .split(inner_area);
-        // Header
+        // Determine which columns to show based on available width
-        let header = format!(
+        let columns = ColumnVisibility::from_width(inner_area.width);
-            "{:<25} {:<10} {:<8} {:<8} {:<5}",
+
-            "Service:", "Status:", "RAM:", "Uptime:", "↻:"
+        // Build header based on visible columns
-        );
+        let mut header_parts = Vec::new();
        if columns.show_name {
            header_parts.push(format!("{:<25}", "Service:"));
        }
        if columns.show_status {
            header_parts.push(format!("{:<10}", "Status:"));
        }
        if columns.show_ram {
            header_parts.push(format!("{:<8}", "RAM:"));
        }
        if columns.show_uptime {
            header_parts.push(format!("{:<8}", "Uptime:"));
        }
        if columns.show_restarts {
            header_parts.push(format!("{:<5}", "↻:"));
        }
        let header = header_parts.join(" ");
        let header_para = Paragraph::new(header).style(Typography::muted());
        frame.render_widget(header_para, content_chunks[0]);
@@ -492,11 +577,11 @@ impl ServicesWidget {
        }
        // Render the services list
-        self.render_services(frame, content_chunks[1], is_focused);
+        self.render_services(frame, content_chunks[1], is_focused, columns);
    }
    /// Render services list
-    fn render_services(&mut self, frame: &mut Frame, area: Rect, is_focused: bool) {
+    fn render_services(&mut self, frame: &mut Frame, area: Rect, is_focused: bool, columns: ColumnVisibility) {
        // Build hierarchical service list for display
        let mut display_lines: Vec<(String, Status, bool, Option<(ServiceInfo, bool)>)> = Vec::new();
@@ -506,7 +591,7 @@ impl ServicesWidget {
        for (parent_name, parent_info) in parent_services {
            // Add parent service line
-            let parent_line = self.format_parent_service_line(parent_name, parent_info);
+            let parent_line = self.format_parent_service_line(parent_name, parent_info, columns);
            display_lines.push((parent_line, parent_info.widget_status, false, None));
            // Add sub-services for this parent (if any)
--- a/dashboard/src/ui/widgets/system.rs
+++ b/dashboard/src/ui/widgets/system.rs
@@ -26,7 +26,7 @@ pub struct SystemWidget {
    cpu_load_1min: Option<f32>,
    cpu_load_5min: Option<f32>,
    cpu_load_15min: Option<f32>,
-    cpu_frequency: Option<f32>,
+    cpu_cstates: Vec<cm_dashboard_shared::CStateInfo>,
    cpu_status: Status,
    // Memory metrics
@@ -45,15 +45,9 @@ pub struct SystemWidget {
    storage_pools: Vec<StoragePool>,
    // Backup metrics
-    backup_status: String,
+    backup_repositories: Vec<String>,
-    backup_start_time_raw: Option<String>,
+    backup_repository_status: Status,
-    backup_disk_serial: Option<String>,
+    backup_disks: Vec<cm_dashboard_shared::BackupDiskData>,
    backup_disk_usage_percent: Option<f32>,
    backup_disk_used_gb: Option<f32>,
    backup_disk_total_gb: Option<f32>,
    backup_disk_wear_percent: Option<f32>,
    backup_disk_temperature: Option<f32>,
    backup_last_size_gb: Option<f32>,
    // Overall status
    has_data: bool,
@@ -102,7 +96,7 @@ impl SystemWidget {
            cpu_load_1min: None,
            cpu_load_5min: None,
            cpu_load_15min: None,
-            cpu_frequency: None,
+            cpu_cstates: Vec::new(),
            cpu_status: Status::Unknown,
            memory_usage_percent: None,
            memory_used_gb: None,
@@ -114,15 +108,9 @@ impl SystemWidget {
            tmp_status: Status::Unknown,
            tmpfs_mounts: Vec::new(),
            storage_pools: Vec::new(),
-            backup_status: "unknown".to_string(),
+            backup_repositories: Vec::new(),
-            backup_start_time_raw: None,
+            backup_repository_status: Status::Unknown,
-            backup_disk_serial: None,
+            backup_disks: Vec::new(),
            backup_disk_usage_percent: None,
            backup_disk_used_gb: None,
            backup_disk_total_gb: None,
            backup_disk_wear_percent: None,
            backup_disk_temperature: None,
            backup_last_size_gb: None,
            has_data: false,
        }
    }
@@ -137,12 +125,19 @@ impl SystemWidget {
        }
    }
-    /// Format CPU frequency
+    /// Format CPU C-states (idle depth) with percentages
-    fn format_cpu_frequency(&self) -> String {
+    fn format_cpu_cstate(&self) -> String {
-        match self.cpu_frequency {
+        if self.cpu_cstates.is_empty() {
-            Some(freq) => format!("{:.0} MHz", freq),
+            return "—".to_string();
            None => "— MHz".to_string(),
        }
        // Format top 3 C-states with percentages: "C10:79% C8:10% C6:8%"
        // Agent already sends clean names (C3, C10, etc.)
        self.cpu_cstates
            .iter()
            .map(|cs| format!("{}:{:.0}%", cs.name, cs.percent))
            .collect::<Vec<_>>()
            .join(" ")
    }
    /// Format memory usage
@@ -188,7 +183,7 @@ impl Widget for SystemWidget {
        self.cpu_load_1min = Some(cpu.load_1min);
        self.cpu_load_5min = Some(cpu.load_5min);
        self.cpu_load_15min = Some(cpu.load_15min);
-        self.cpu_frequency = Some(cpu.frequency_mhz);
+        self.cpu_cstates = cpu.cstates.clone();
        self.cpu_status = Status::Ok;
        // Extract memory data directly
@@ -214,25 +209,9 @@ impl Widget for SystemWidget {
        // Extract backup data
        let backup = &agent_data.backup;
-        self.backup_status = backup.status.clone();
+        self.backup_repositories = backup.repositories.clone();
-        self.backup_start_time_raw = backup.start_time_raw.clone();
+        self.backup_repository_status = backup.repository_status;
-        self.backup_last_size_gb = backup.last_backup_size_gb;
+        self.backup_disks = backup.disks.clone();
        if let Some(disk) = &backup.repository_disk {
            self.backup_disk_serial = Some(disk.serial.clone());
            self.backup_disk_usage_percent = Some(disk.usage_percent);
            self.backup_disk_used_gb = Some(disk.used_gb);
            self.backup_disk_total_gb = Some(disk.total_gb);
            self.backup_disk_wear_percent = disk.wear_percent;
            self.backup_disk_temperature = disk.temperature_celsius;
        } else {
            self.backup_disk_serial = None;
            self.backup_disk_usage_percent = None;
            self.backup_disk_used_gb = None;
            self.backup_disk_total_gb = None;
            self.backup_disk_wear_percent = None;
            self.backup_disk_temperature = None;
        }
    }
 }
@@ -532,14 +511,36 @@ impl SystemWidget {
    fn render_backup(&self) -> Vec<Line<'_>> {
        let mut lines = Vec::new();
-        // First line: serial number with temperature and wear
+        // First section: Repository status and list
-        if let Some(serial) = &self.backup_disk_serial {
+        if !self.backup_repositories.is_empty() {
-            let truncated_serial = truncate_serial(serial);
+            let repo_text = format!("Repo: {}", self.backup_repositories.len());
            let repo_spans = StatusIcons::create_status_spans(self.backup_repository_status, &repo_text);
            lines.push(Line::from(repo_spans));
            // List all repositories (sorted for consistent display)
            let mut sorted_repos = self.backup_repositories.clone();
            sorted_repos.sort();
            let repo_count = sorted_repos.len();
            for (idx, repo) in sorted_repos.iter().enumerate() {
                let tree_char = if idx == repo_count - 1 { "└─" } else { "├─" };
                lines.push(Line::from(vec![
                    Span::styled(format!("  {} ", tree_char), Typography::tree()),
                    Span::styled(repo.clone(), Typography::secondary()),
                ]));
            }
        }
        // Second section: Per-disk backup information (sorted by serial for consistent display)
        let mut sorted_disks = self.backup_disks.clone();
        sorted_disks.sort_by(|a, b| a.serial.cmp(&b.serial));
        for disk in &sorted_disks {
            let truncated_serial = truncate_serial(&disk.serial);
            let mut details = Vec::new();
-            if let Some(temp) = self.backup_disk_temperature {
+
            if let Some(temp) = disk.temperature_celsius {
                details.push(format!("T: {}°C", temp as i32));
            }
-            if let Some(wear) = self.backup_disk_wear_percent {
+            if let Some(wear) = disk.wear_percent {
                details.push(format!("W: {}%", wear as i32));
            }
@@ -549,44 +550,40 @@ impl SystemWidget {
                truncated_serial
            };
-            let backup_status = match self.backup_status.as_str() {
+            // Overall disk status (worst of backup and usage)
-                "completed" | "success" => Status::Ok,
+            let disk_status = disk.backup_status.max(disk.usage_status);
-                "running" => Status::Pending,
+            let disk_spans = StatusIcons::create_status_spans(disk_status, &disk_text);
                "failed" => Status::Critical,
                _ => Status::Unknown,
            };
            let disk_spans = StatusIcons::create_status_spans(backup_status, &disk_text);
            lines.push(Line::from(disk_spans));
-            // Show backup time from TOML if available
+            // Show backup time with status
-            if let Some(start_time) = &self.backup_start_time_raw {
+            if let Some(backup_time) = &disk.last_backup_time {
-                let time_text = if let Some(size) = self.backup_last_size_gb {
+                let time_text = format!("Backup: {}", backup_time);
-                    format!("Time: {} ({:.1}GB)", start_time, size)
+                let mut time_spans = vec![
                } else {
                    format!("Time: {}", start_time)
                };
                lines.push(Line::from(vec![
                    Span::styled("  ├─ ", Typography::tree()),
-                    Span::styled(time_text, Typography::secondary())
+                ];
-                ]));
+                time_spans.extend(StatusIcons::create_status_spans(disk.backup_status, &time_text));
                lines.push(Line::from(time_spans));
            }
-            // Usage information
+            // Show usage with status and archive count
-            if let (Some(used), Some(total), Some(usage_percent)) = (
+            let archive_display = if disk.archives_min == disk.archives_max {
-                self.backup_disk_used_gb, 
+                format!("{}", disk.archives_min)
-                self.backup_disk_total_gb,
+            } else {
-                self.backup_disk_usage_percent
+                format!("{}-{}", disk.archives_min, disk.archives_max)
-            ) {
+            };
-                let usage_text = format!("Usage: {:.0}% {:.0}GB/{:.0}GB", usage_percent, used, total);
+
-                let usage_spans = StatusIcons::create_status_spans(Status::Ok, &usage_text);
+            let usage_text = format!(
-                let mut full_spans = vec![
+                "Usage: ({}) {:.0}% {:.0}GB/{:.0}GB",
-                    Span::styled("  └─ ", Typography::tree()),
+                archive_display,
-                ];
+                disk.disk_usage_percent,
-                full_spans.extend(usage_spans);
+                disk.disk_used_gb,
-                lines.push(Line::from(full_spans));
+                disk.disk_total_gb
-            }
+            );
            let mut usage_spans = vec![
                Span::styled("  └─ ", Typography::tree()),
            ];
            usage_spans.extend(StatusIcons::create_status_spans(disk.usage_status, &usage_text));
            lines.push(Line::from(usage_spans));
        }
        lines
@@ -832,10 +829,10 @@ impl SystemWidget {
        );
        lines.push(Line::from(cpu_spans));
-        let freq_text = self.format_cpu_frequency();
+        let cstate_text = self.format_cpu_cstate();
        lines.push(Line::from(vec![
            Span::styled("  └─ ", Typography::tree()),
-            Span::styled(format!("Freq: {}", freq_text), Typography::secondary())
+            Span::styled(format!("C-state: {}", cstate_text), Typography::secondary())
        ]));
        // RAM section
@@ -894,7 +891,7 @@ impl SystemWidget {
        lines.extend(storage_lines);
        // Backup section (if available)
-        if self.backup_status != "unavailable" && self.backup_status != "unknown" {
+        if !self.backup_repositories.is_empty() || !self.backup_disks.is_empty() {
            lines.push(Line::from(vec![
                Span::styled("Backup:", Typography::widget_title())
            ]));
--- a/shared/Cargo.toml
+++ b/shared/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "cm-dashboard-shared"
-version = "0.1.206"
+version = "0.1.227"
 edition = "2021"
 [dependencies]
--- a/shared/src/agent_data.rs
+++ b/shared/src/agent_data.rs
@@ -40,13 +40,20 @@ pub struct NetworkInterfaceData {
    pub vlan_id: Option<u16>,
 }
 /// CPU C-state usage information
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct CStateInfo {
    pub name: String,
    pub percent: f32,
 }
 /// CPU monitoring data
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct CpuData {
    pub load_1min: f32,
    pub load_5min: f32,
    pub load_15min: f32,
-    pub frequency_mhz: f32,
+    pub cstates: Vec<CStateInfo>, // C-state usage percentages (C1, C6, C10, etc.) - indicates CPU idle depth distribution
    pub temperature_celsius: Option<f32>,
    pub load_status: Status,
    pub temperature_status: Status,
@@ -169,23 +176,27 @@ pub struct SubServiceMetric {
 /// Backup system data
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct BackupData {
-    pub status: String,
+    pub repositories: Vec<String>,
-    pub total_size_gb: Option<f32>,
+    pub repository_status: Status,
-    pub repository_health: Option<String>,
+    pub disks: Vec<BackupDiskData>,
    pub repository_disk: Option<BackupDiskData>,
    pub last_backup_size_gb: Option<f32>,
    pub start_time_raw: Option<String>,
 }
 /// Backup repository disk information
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct BackupDiskData {
    pub serial: String,
-    pub usage_percent: f32,
+    pub product_name: Option<String>,
    pub used_gb: f32,
    pub total_gb: f32,
    pub wear_percent: Option<f32>,
    pub temperature_celsius: Option<f32>,
    pub last_backup_time: Option<String>,
    pub backup_status: Status,
    pub disk_usage_percent: f32,
    pub disk_used_gb: f32,
    pub disk_total_gb: f32,
    pub usage_status: Status,
    pub services: Vec<String>,
    pub archives_min: i64,
    pub archives_max: i64,
 }
 impl AgentData {
@@ -204,7 +215,7 @@ impl AgentData {
                    load_1min: 0.0,
                    load_5min: 0.0,
                    load_15min: 0.0,
-                    frequency_mhz: 0.0,
+                    cstates: Vec::new(),
                    temperature_celsius: None,
                    load_status: Status::Unknown,
                    temperature_status: Status::Unknown,
@@ -226,12 +237,9 @@ impl AgentData {
            },
            services: Vec::new(),
            backup: BackupData {
-                status: "unknown".to_string(),
+                repositories: Vec::new(),
-                total_size_gb: None,
+                repository_status: Status::Unknown,
-                repository_health: None,
+                disks: Vec::new(),
                repository_disk: None,
                last_backup_size_gb: None,
                start_time_raw: None,
            },
        }
    }
Author	SHA1	Message	Date
Christoffer Martinsson	67034c84b9	Add responsive column visibility to service panel All checks were successful Build and Release / build-and-release (push) Successful in 1m47s Details Service panel now dynamically shows/hides columns based on terminal width: - ≥80 chars: All columns (Name, Status, RAM, Uptime, Restarts) - ≥60 chars: Hide Restarts only - ≥45 chars: Hide Uptime and Restarts - <45 chars: Minimal (Name and Status only) Improves dashboard usability on smaller terminal sizes.	2025-11-30 10:50:08 +01:00
Christoffer Martinsson	c62c7fa698	Remove debug logging from disk collector All checks were successful Build and Release / build-and-release (push) Successful in 1m11s Details Removed all debug! statements from disk collector to reduce log noise. Bump version to v0.1.226	2025-11-30 00:44:38 +01:00
Christoffer Martinsson	0b1d8c0a73	Fix Data_3 showing as unknown by handling smartctl warning exit codes All checks were successful Build and Release / build-and-release (push) Successful in 1m11s Details Root cause: sda's temperature exceeded threshold in the past, causing smartctl to return exit code 32 (warning: "Attributes have been <= threshold in the past"). The agent checked output.status.success() and rejected the entire output as failed, even though the data (serial, temperature, health) was perfectly valid. Smartctl exit codes are bit flags for informational warnings: - Exit 0: No warnings - Exit 32 (bit 5): Attributes were at/below threshold in past - Exit 64 (bit 6): Error log has entries - etc. The output data is valid regardless of these warning flags. Solution: Parse output as long as it's not empty, ignore exit code. Only return UNKNOWN if output is actually empty (command truly failed). Result: Data_3 will now show "ZDZ4VE0B T: 31°C" instead of "? Data_3: sda" Bump version to v0.1.225	2025-11-30 00:35:19 +01:00
Christoffer Martinsson	c77aa6eaaa	Fix Data_3 timeout by removing sequential SMART during pool detection All checks were successful Build and Release / build-and-release (push) Successful in 1m34s Details Root cause: SMART data was collected TWICE: 1. Sequential collection during pool detection in get_drive_info_for_path() using problematic tokio::task::block_in_place() nesting 2. Parallel collection in get_smart_data_for_drives() (v0.1.223) The sequential collection happened FIRST during pool detection, causing sda (Data_3) to timeout due to: - Bad async nesting: block_in_place() wrapping block_on() - Sequential execution causing runtime issues - sda being third in sequence, runtime degraded by then Solution: Remove SMART collection from get_drive_info_for_path(). Pool drive temperatures are populated later from the parallel SMART collection which properly uses futures::join_all. Benefits: - Eliminates problematic async nesting - All SMART queries happen once in parallel only - sda/Data_3 should now show serial (ZDZ4VE0B) and temperature Bump version to v0.1.224	2025-11-30 00:14:25 +01:00
Christoffer Martinsson	8a0e68f0e3	Fix Data_3 timeout by parallelizing SMART collection All checks were successful Build and Release / build-and-release (push) Successful in 1m10s Details Root cause: SMART data was collected sequentially, one drive at a time. With 5 drives taking ~500ms each, total collection time was 2.5+ seconds. When disk collector runs every 1 second, this caused overlapping collections creating resource contention. The last drive (sda/Data_3) would timeout due to the drive being accessed by the previous collection. Solution: Query all drives in parallel using futures::join_all. Now all drives get their SMART data collected simultaneously with independent 3-second timeouts, eliminating contention and reducing total collection time from 2.5+ seconds to ~500ms (the slowest single drive). Benefits: - All drives complete in ~500ms instead of 2.5+ seconds - No overlapping collections causing resource contention - Each drive gets full 3-second timeout window - sda/Data_3 should now show temperature and serial number Bump version to v0.1.223	2025-11-29 23:51:43 +01:00
Christoffer Martinsson	2d653fe9ae	Fix empty Storage section by configuring stdio pipes All checks were successful Build and Release / build-and-release (push) Successful in 1m15s Details Root cause: run_command_with_timeout() was calling cmd.spawn() without configuring stdout/stderr pipes. This caused command output to go to journald instead of being captured by wait_with_output(). The disk collector received empty output and failed silently. Solution: Configure stdout(Stdio::piped()) and stderr(Stdio::piped()) before spawning commands. This ensures wait_with_output() can properly capture command output. Fixes: Empty Storage section, lsblk output appearing in journald Bump version to v0.1.222	2025-11-29 23:25:17 +01:00
Christoffer Martinsson	caba78004e	Fix empty Storage section by properly aliasing command types All checks were successful Build and Release / build-and-release (push) Successful in 2m6s Details v0.1.220 broke disk collector by changing the import from std::process::Command to tokio::process::Command, but lines 193 and 767 explicitly used std::process::Command::new() which silently failed. Solution: Import both as aliases (TokioCommand/StdCommand) and use appropriate type for each operation - async commands use TokioCommand with run_command_with_timeout, sync commands use StdCommand with system timeout wrapper. Fixes: Empty Storage section after v0.1.220 deployment Bump version to v0.1.221	2025-11-29 21:29:33 +01:00
Christoffer Martinsson	77bf08a978	Fix blocking smartctl commands with proper async/timeout handling All checks were successful Build and Release / build-and-release (push) Successful in 2m2s Details - Changed disk collector to use tokio::process::Command instead of std::process::Command - Updated run_command_with_timeout to properly kill processes on timeout - Fixes issue where smartctl hangs on problematic drives (/dev/sda) freezing entire agent - Timeout now force-kills hung processes using kill -9, preventing orphaned smartctl processes This resolves the issue where Data_3 showed unknown status because smartctl was hanging indefinitely trying to read from a problematic drive, blocking the entire collector. Bump version to v0.1.220 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-29 21:09:04 +01:00
Christoffer Martinsson	929870f8b6	Bump version to v0.1.219 All checks were successful Build and Release / build-and-release (push) Successful in 1m11s Details	2025-11-29 18:35:14 +01:00
Christoffer Martinsson	7aae852b7b	Bump version to v0.1.218 All checks were successful Build and Release / build-and-release (push) Successful in 1m19s Details	2025-11-29 17:59:33 +01:00
Christoffer Martinsson	40f3ff66d8	Show archive count range to detect inconsistencies - Display single number if all services have same count - Display min-max range if counts differ (indicates problem)	2025-11-29 17:59:24 +01:00
Christoffer Martinsson	1c1beddb55	Bump version to v0.1.217 All checks were successful Build and Release / build-and-release (push) Successful in 1m20s Details	2025-11-29 17:51:13 +01:00
Christoffer Martinsson	620d1f10b6	Show archive count per service instead of total sum	2025-11-29 17:51:01 +01:00
Christoffer Martinsson	a0d571a40e	Bump version to v0.1.216 All checks were successful Build and Release / build-and-release (push) Successful in 1m19s Details	2025-11-29 17:44:12 +01:00
Christoffer Martinsson	977200fff3	Move archive count to Usage line in backup display	2025-11-29 17:44:05 +01:00
Christoffer Martinsson	d692de5f83	Bump version to v0.1.215 All checks were successful Build and Release / build-and-release (push) Successful in 1m11s Details	2025-11-29 17:41:49 +01:00
Christoffer Martinsson	f5913dbd43	Add archive count to backup disk display	2025-11-29 17:41:11 +01:00
Christoffer Martinsson	faa30a7839	Sort backup repositories and disks for stable display All checks were successful Build and Release / build-and-release (push) Successful in 1m21s Details - Sort repositories alphabetically before rendering - Sort backup disks by serial number - Prevents display jumping between different orderings on updates - Consistent display order across refreshes Bump version to v0.1.214 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-29 17:15:17 +01:00
Christoffer Martinsson	6e4a42799f	Bump version to v0.1.213 All checks were successful Build and Release / build-and-release (push) Successful in 1m22s Details	2025-11-29 16:46:16 +01:00
Christoffer Martinsson	afb8d68e03	Implement multi-disk backup support - Update BackupData structure to support multiple backup disks - Scan /var/lib/backup/status/ directory for all status files - Calculate status icons for backup and disk usage - Aggregate repository status from all disks - Update dashboard to display all backup disks with per-disk status - Display repository list with count and aggregated status	2025-11-29 16:44:50 +01:00
Christoffer Martinsson	5e08b34280	Move C-state name cleaning to agent for smaller JSON All checks were successful Build and Release / build-and-release (push) Successful in 1m32s Details - Agent now extracts "C" + digits pattern (C3, C10) using char parsing - Removes suffixes like "_ACPI", "_MWAIT" at source - Reduces JSON payload size over ZMQ - No regex dependency - uses fast char iteration (~1μs overhead) - Robust fallback to original name if pattern not found - Dashboard simplified to use clean names directly Bump version to v0.1.212 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-29 14:05:55 +01:00
Christoffer Martinsson	0d8284b69c	Clean C-state display to show only CX format All checks were successful Build and Release / build-and-release (push) Successful in 1m18s Details - Strip suffixes like "_ACPI" from C-state names - Display changes from "C3_ACPI:51%" to "C3:51%" - Cleaner, more concise presentation Bump version to v0.1.211 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-29 13:34:01 +01:00
Christoffer Martinsson	d84690cb3b	Move transmission interval to ZMQ config section All checks were successful Build and Release / build-and-release (push) Successful in 1m43s Details - Changed code to use zmq.transmission_interval_seconds instead of top-level collection_interval_seconds - Removed collection_interval_seconds from AgentConfig - Updated validation to check zmq.transmission_interval_seconds - Improves config organization by grouping all ZMQ settings together Bump version to v0.1.210 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-29 13:31:39 +01:00
Christoffer Martinsson	7c030b33d6	Show top 3 C-states with usage percentages All checks were successful Build and Release / build-and-release (push) Successful in 1m21s Details - Changed CpuData.cstate from String to Vec<CStateInfo> - Added CStateInfo struct with name and percent fields - Collector calculates percentage for each C-state based on accumulated time - Sorts and returns top 3 C-states by usage - Dashboard displays: "C10:79% C8:10% C6:8%" Provides better visibility into CPU idle state distribution. Bump version to v0.1.209 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-28 23:45:46 +01:00
Christoffer Martinsson	c6817537a8	Replace CPU frequency with C-state monitoring All checks were successful Build and Release / build-and-release (push) Successful in 1m20s Details - Changed CpuData.frequency_mhz to CpuData.cstate (String) - Implemented collect_cstate() to read CPU idle depth from sysfs - Finds deepest C-state with most accumulated time (C0-C10) - Updated dashboard to display C-state instead of frequency - More accurate indicator of CPU activity vs power management Bump version to v0.1.208 Co-Authored-By: Claude <noreply@anthropic.com>	2025-11-28 23:30:14 +01:00
Christoffer Martinsson	2189d34b16	Bump version to v0.1.207 All checks were successful Build and Release / build-and-release (push) Successful in 1m9s Details	2025-11-28 23:16:33 +01:00
Christoffer Martinsson	28cfd5758f	Fix service metrics not showing - remove cache check The service_status_cache from discovery only has active_state with all detailed metrics set to None. During collection, get_service_status() was returning cached data instead of fetching fresh systemctl show data. Now always fetch fresh data to populate memory_bytes, restart_count, and uptime_seconds properly.	2025-11-28 23:15:51 +01:00