#!/bin/bash # Complete Unraid Monitoring Dashboard (Multi-Server) # Gets system status, disk health, and resource usage for all configured servers set -euo pipefail SCRIPT_DIR="$(cd -P "$(dirname "${BASH_SOURCE[0]}")" && pwd)" REPO_ROOT="$(cd "$SCRIPT_DIR/../../.." && pwd)" source "$REPO_ROOT/lib/load-env.sh" QUERY_SCRIPT="$SCRIPT_DIR/unraid-query.sh" OUTPUT_FILE="$HOME/memory/bank/unraid-inventory.md" # Load credentials from .env for all servers load_env_file || exit 1 # Discover configured servers dynamically from UNRAID__URL env vars SERVERS=() while IFS='=' read -r var_name _; do if [[ "$var_name" =~ ^UNRAID_(.+)_URL$ ]]; then SERVERS+=("${BASH_REMATCH[1]}") fi done < <(env) if [ ${#SERVERS[@]} -eq 0 ]; then echo "Error: No servers found. Set UNRAID__URL and UNRAID__API_KEY env vars." exit 1 fi for server in "${SERVERS[@]}"; do url_var="UNRAID_${server}_URL" key_var="UNRAID_${server}_API_KEY" validate_env_vars "$url_var" "$key_var" || exit 1 done # Ensure output directory exists mkdir -p "$(dirname "$OUTPUT_FILE")" # Start the report echo "# Unraid Fleet Dashboard" > "$OUTPUT_FILE" echo "Generated at: $(date)" >> "$OUTPUT_FILE" echo "" >> "$OUTPUT_FILE" # Function to process a single server process_server() { local NAME="$1" local URL="$2" local API_KEY="$3" echo "Querying server: $NAME..." UNRAID_URL="$URL" UNRAID_API_KEY="$API_KEY" IGNORE_ERRORS="true" export UNRAID_URL UNRAID_API_KEY IGNORE_ERRORS QUERY='query Dashboard { info { time cpu { model cores threads } os { platform distro release arch } system { manufacturer model version uuid } } metrics { cpu { percentTotal } memory { total used free percentTotal } } array { state capacity { kilobytes { total free used } } disks { name device temp status fsSize fsFree fsUsed isSpinning numErrors } caches { name device temp status fsSize fsFree fsUsed fsType type } parityCheckStatus { status progress errors } } disks { id name device size status temp numErrors } shares { name comment free } docker { containers { names image state status } } vms { domains { id name state } } vars { timeZone regTy regTo } notifications { id title subject description importance timestamp } recentLog: logFile(path: \"syslog\", lines: 50) { content } online isSSOEnabled }' RESPONSE=$("$QUERY_SCRIPT" -q "$QUERY" -f json) # Debug output (only when DEBUG is set) if [ "${DEBUG:-}" = "true" ]; then echo "$RESPONSE" > "/tmp/${NAME}_debug.json" fi # Check if response is valid JSON if ! echo "$RESPONSE" | jq -e . >/dev/null 2>&1; then echo "Error querying $NAME: Invalid response" echo "$RESPONSE" > "/tmp/${NAME}_debug.json" echo "Response saved to /tmp/${NAME}_debug.json" echo "## Server: $NAME (⚠️ Error)" >> "$OUTPUT_FILE" echo "Failed to retrieve data." >> "$OUTPUT_FILE" return fi # Append to report echo "## Server: $NAME" >> "$OUTPUT_FILE" # System Info CPU_MODEL=$(echo "$RESPONSE" | jq -r '.data.info.cpu.model') CPU_CORES=$(echo "$RESPONSE" | jq -r '.data.info.cpu.cores') CPU_THREADS=$(echo "$RESPONSE" | jq -r '.data.info.cpu.threads') OS_REL=$(echo "$RESPONSE" | jq -r '.data.info.os.release') OS_ARCH=$(echo "$RESPONSE" | jq -r '.data.info.os.arch // "x64"') SYS_MFG=$(echo "$RESPONSE" | jq -r '.data.info.system.manufacturer // "Unknown"') SYS_MODEL=$(echo "$RESPONSE" | jq -r '.data.info.system.model // "Unknown"') TIMEZONE=$(echo "$RESPONSE" | jq -r '.data.vars.timeZone // "N/A"') LICENSE=$(echo "$RESPONSE" | jq -r '.data.vars.regTy // "Unknown"') REG_TO=$(echo "$RESPONSE" | jq -r '.data.vars.regTo // "N/A"') CPU_LOAD=$(echo "$RESPONSE" | jq -r '.data.metrics.cpu.percentTotal // 0') TOTAL_MEM=$(echo "$RESPONSE" | jq -r '.data.metrics.memory.total // 0') MEM_USED_PCT=$(echo "$RESPONSE" | jq -r '.data.metrics.memory.percentTotal // 0') TOTAL_MEM_GB=$((TOTAL_MEM / 1024 / 1024 / 1024)) echo "### System" >> "$OUTPUT_FILE" echo "- **Hardware:** $SYS_MFG $SYS_MODEL" >> "$OUTPUT_FILE" echo "- **OS:** Unraid $OS_REL ($OS_ARCH)" >> "$OUTPUT_FILE" echo "- **License:** $LICENSE (Registered to: $REG_TO)" >> "$OUTPUT_FILE" echo "- **Timezone:** $TIMEZONE" >> "$OUTPUT_FILE" echo "- **CPU:** Model $CPU_MODEL ($CPU_CORES cores / $CPU_THREADS threads) - **${CPU_LOAD}% load**" >> "$OUTPUT_FILE" echo "- **Memory:** ${TOTAL_MEM_GB}GB - **${MEM_USED_PCT}% used**" >> "$OUTPUT_FILE" echo "" >> "$OUTPUT_FILE" # Array capacity ARRAY_TOTAL=$(echo "$RESPONSE" | jq -r '.data.array.capacity.kilobytes.total') ARRAY_USED=$(echo "$RESPONSE" | jq -r '.data.array.capacity.kilobytes.used') if [ "$ARRAY_TOTAL" != "null" ] && [ "$ARRAY_TOTAL" -gt 0 ]; then ARRAY_TOTAL_GB=$((ARRAY_TOTAL / 1024 / 1024)) ARRAY_USED_GB=$((ARRAY_USED / 1024 / 1024)) ARRAY_USED_PCT=$((ARRAY_USED * 100 / ARRAY_TOTAL)) echo "### Storage" >> "$OUTPUT_FILE" echo "- **Array:** ${ARRAY_USED_GB}GB / ${ARRAY_TOTAL_GB}GB used (${ARRAY_USED_PCT}%)" >> "$OUTPUT_FILE" # Cache pools echo "- **Cache Pools:**" >> "$OUTPUT_FILE" echo "$RESPONSE" | jq -r '(.data.array.caches // [])[] | " - \(.name) (\(.device)): \(.temp)°C - \(.status) - \(if .fsSize then "\((.fsUsed / 1024 / 1024 | floor))GB / \((.fsSize / 1024 / 1024 | floor))GB used" else "N/A" end)"' >> "$OUTPUT_FILE" fi # Docker TOTAL_CONTAINERS=$(echo "$RESPONSE" | jq '[(.data.docker.containers // [])[]] | length') RUNNING_CONTAINERS=$(echo "$RESPONSE" | jq '[(.data.docker.containers // [])[] | select(.state == "RUNNING")] | length') echo "" >> "$OUTPUT_FILE" echo "### Workloads" >> "$OUTPUT_FILE" echo "- **Docker:** ${TOTAL_CONTAINERS} containers (${RUNNING_CONTAINERS} running)" >> "$OUTPUT_FILE" # Unhealthy containers UNHEALTHY=$(echo "$RESPONSE" | jq -r '(.data.docker.containers // [])[] | select(.status | test("unhealthy|restarting"; "i")) | " - ⚠️ \(.names[0]): \(.status)"') if [ -n "$UNHEALTHY" ]; then echo "$UNHEALTHY" >> "$OUTPUT_FILE" fi # VMs if [ "$(echo "$RESPONSE" | jq -r '.data.vms.domains')" != "null" ]; then TOTAL_VMS=$(echo "$RESPONSE" | jq '[.data.vms.domains[]] | length') RUNNING_VMS=$(echo "$RESPONSE" | jq '[.data.vms.domains[] | select(.state == "RUNNING")] | length') echo "- **VMs:** ${TOTAL_VMS} VMs (${RUNNING_VMS} running)" >> "$OUTPUT_FILE" else echo "- **VMs:** Service disabled or no data" >> "$OUTPUT_FILE" fi # Disk Health echo "" >> "$OUTPUT_FILE" echo "### Health" >> "$OUTPUT_FILE" HOT_DISKS=$(echo "$RESPONSE" | jq -r '.data.array.disks[] | select(.temp > 45) | "- ⚠️ \(.name): \(.temp)°C (HIGH)"') DISK_ERRORS=$(echo "$RESPONSE" | jq -r '.data.array.disks[] | select(.numErrors > 0) | "- ❌ \(.name): \(.numErrors) errors"') if [ -z "$HOT_DISKS" ] && [ -z "$DISK_ERRORS" ]; then echo "- ✅ All disks healthy" >> "$OUTPUT_FILE" else [ -n "$HOT_DISKS" ] && echo "$HOT_DISKS" >> "$OUTPUT_FILE" [ -n "$DISK_ERRORS" ] && echo "$DISK_ERRORS" >> "$OUTPUT_FILE" fi # Notifications (Alerts) echo "" >> "$OUTPUT_FILE" echo "### Notifications" >> "$OUTPUT_FILE" NOTIF_COUNT=$(echo "$RESPONSE" | jq '[.data.notifications[]] | length' 2>/dev/null || echo "0") if [ "$NOTIF_COUNT" != "null" ] && [ -n "$NOTIF_COUNT" ] && [ "$NOTIF_COUNT" -gt 0 ]; then # Show recent notifications (last 10) ALERT_NOTIFS=$(echo "$RESPONSE" | jq -r '.data.notifications | sort_by(.timestamp) | reverse | .[0:10][] | "- [\(.importance // "info")] \(.title // .subject): \(.description // "No description") (\(.timestamp | split("T")[0]))"' 2>/dev/null) if [ -n "$ALERT_NOTIFS" ]; then echo "$ALERT_NOTIFS" >> "$OUTPUT_FILE" else echo "- ✅ No recent notifications" >> "$OUTPUT_FILE" fi # Count by importance ALERT_COUNT=$(echo "$RESPONSE" | jq '[.data.notifications[] | select(.importance == "alert" or .importance == "warning")] | length' 2>/dev/null || echo "0") if [ "$ALERT_COUNT" -gt 0 ]; then echo "" >> "$OUTPUT_FILE" echo "**⚠️ $ALERT_COUNT alert/warning notifications**" >> "$OUTPUT_FILE" fi else echo "- ✅ No notifications" >> "$OUTPUT_FILE" fi echo "" >> "$OUTPUT_FILE" echo "---" >> "$OUTPUT_FILE" echo "" >> "$OUTPUT_FILE" } # Main loop - process each server from environment variables for server in "${SERVERS[@]}"; do name_var="UNRAID_${server}_NAME" url_var="UNRAID_${server}_URL" key_var="UNRAID_${server}_API_KEY" NAME="${!name_var}" URL="${!url_var}" KEY="${!key_var}" process_server "$NAME" "$URL" "$KEY" done echo "Dashboard saved to: $OUTPUT_FILE" cat "$OUTPUT_FILE"