Added get_storage_controllers() function that detects SAS, SATA, RAID, and NVMe controllers via lspci. Updated all layout functions (10bay, large1, micro) to display detected storage controllers with their PCI address and model info. Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
421 lines
20 KiB
Bash
421 lines
20 KiB
Bash
#!/bin/bash
|
|
|
|
#==============================================================================
|
|
# Drive Atlas - Server Drive Mapping Tool
|
|
# Maps physical drive bays to logical device names using PCI paths
|
|
#==============================================================================
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Chassis Type Definitions
|
|
# These define the physical layout and display formatting for each chassis type
|
|
#------------------------------------------------------------------------------
|
|
|
|
generate_10bay_layout() {
|
|
local hostname=$1
|
|
build_drive_map
|
|
|
|
# Fixed width for consistent box drawing (fits device names like "nvme0n1")
|
|
local drive_width=10
|
|
|
|
# Main chassis section
|
|
printf "┌────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┐\n"
|
|
printf "│ %-126s │\n" "$hostname - Sliger CX4712 (10x 3.5\" Hot-swap)"
|
|
printf "│ │\n"
|
|
|
|
# Show storage controllers
|
|
printf "│ Storage Controllers: │\n"
|
|
while IFS= read -r ctrl; do
|
|
[[ -n "$ctrl" ]] && printf "│ %-126s│\n" "$ctrl"
|
|
done < <(get_storage_controllers)
|
|
printf "│ │\n"
|
|
|
|
# M.2 NVMe slot if present
|
|
if [[ -n "${DRIVE_MAP[m2-1]}" ]]; then
|
|
printf "│ M.2 NVMe: %-10s │\n" "${DRIVE_MAP[m2-1]}"
|
|
printf "│ │\n"
|
|
fi
|
|
|
|
printf "│ Front Hot-swap Bays: │\n"
|
|
printf "│ │\n"
|
|
|
|
# Bay top borders
|
|
printf "│ "
|
|
for bay in {1..10}; do
|
|
printf "┌──────────┐ "
|
|
done
|
|
printf " │\n"
|
|
|
|
# Bay contents
|
|
printf "│ "
|
|
for bay in {1..10}; do
|
|
printf "│%-2d:%-7s│ " "$bay" "${DRIVE_MAP[$bay]:-EMPTY}"
|
|
done
|
|
printf " │\n"
|
|
|
|
# Bay bottom borders
|
|
printf "│ "
|
|
for bay in {1..10}; do
|
|
printf "└──────────┘ "
|
|
done
|
|
printf " │\n"
|
|
|
|
printf "└────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┘\n"
|
|
}
|
|
|
|
generate_micro_layout() {
|
|
local hostname=$1
|
|
build_drive_map
|
|
|
|
# Check for eMMC storage
|
|
local emmc_device=""
|
|
if [[ -b /dev/mmcblk0 ]]; then
|
|
emmc_device="mmcblk0"
|
|
fi
|
|
|
|
printf "┌─────────────────────────────────────────────────────────────┐\n"
|
|
printf "│ %-57s │\n" "$hostname - Micro SBC"
|
|
printf "│ │\n"
|
|
printf "│ Storage Controllers: │\n"
|
|
while IFS= read -r ctrl; do
|
|
[[ -n "$ctrl" ]] && printf "│ %-57s│\n" "$ctrl"
|
|
done < <(get_storage_controllers)
|
|
printf "│ │\n"
|
|
|
|
# Show eMMC if present
|
|
if [[ -n "$emmc_device" ]]; then
|
|
local emmc_size=$(lsblk -d -n -o SIZE "/dev/$emmc_device" 2>/dev/null | xargs)
|
|
printf "│ ┌─────────────────────────────────────────────────────┐ │\n"
|
|
printf "│ │ Onboard eMMC: %-10s (%s) │ │\n" "$emmc_device" "$emmc_size"
|
|
printf "│ └─────────────────────────────────────────────────────┘ │\n"
|
|
printf "│ │\n"
|
|
fi
|
|
|
|
printf "│ SATA Ports (rear): │\n"
|
|
printf "│ ┌──────────────┐ ┌──────────────┐ │\n"
|
|
printf "│ │ 1: %-9s │ │ 2: %-9s │ │\n" "${DRIVE_MAP[1]:-EMPTY}" "${DRIVE_MAP[2]:-EMPTY}"
|
|
printf "│ └──────────────┘ └──────────────┘ │\n"
|
|
printf "└─────────────────────────────────────────────────────────────┘\n"
|
|
}
|
|
|
|
generate_large1_layout() {
|
|
local hostname=$1
|
|
build_drive_map
|
|
|
|
# large1 has 3 stacks of 5 bays at front (15 total) + 2 M.2 slots
|
|
# Physical bay mapping TBD - current mapping is by controller order
|
|
printf "┌─────────────────────────────────────────────────────────────────────────┐\n"
|
|
printf "│ %-69s │\n" "$hostname - Rosewill RSV-L4500U (15x 3.5\" Bays)"
|
|
printf "│ │\n"
|
|
printf "│ Storage Controllers: │\n"
|
|
while IFS= read -r ctrl; do
|
|
[[ -n "$ctrl" ]] && printf "│ %-69s│\n" "$ctrl"
|
|
done < <(get_storage_controllers)
|
|
printf "│ │\n"
|
|
printf "│ M.2 NVMe: M1: %-10s M2: %-10s │\n" "${DRIVE_MAP[m2-1]:-EMPTY}" "${DRIVE_MAP[m2-2]:-EMPTY}"
|
|
printf "│ │\n"
|
|
printf "│ Front Bays (3 stacks x 5 rows): [Bay mapping TBD] │\n"
|
|
printf "│ Stack A Stack B Stack C │\n"
|
|
printf "│ ┌──────────┐ ┌──────────┐ ┌──────────┐ │\n"
|
|
printf "│ │1:%-8s│ │2:%-8s│ │3:%-8s│ │\n" "${DRIVE_MAP[1]:-EMPTY}" "${DRIVE_MAP[2]:-EMPTY}" "${DRIVE_MAP[3]:-EMPTY}"
|
|
printf "│ ├──────────┤ ├──────────┤ ├──────────┤ │\n"
|
|
printf "│ │4:%-8s│ │5:%-8s│ │6:%-8s│ │\n" "${DRIVE_MAP[4]:-EMPTY}" "${DRIVE_MAP[5]:-EMPTY}" "${DRIVE_MAP[6]:-EMPTY}"
|
|
printf "│ ├──────────┤ ├──────────┤ ├──────────┤ │\n"
|
|
printf "│ │7:%-8s│ │8:%-8s│ │9:%-8s│ │\n" "${DRIVE_MAP[7]:-EMPTY}" "${DRIVE_MAP[8]:-EMPTY}" "${DRIVE_MAP[9]:-EMPTY}"
|
|
printf "│ ├──────────┤ ├──────────┤ ├──────────┤ │\n"
|
|
printf "│ │10:%-7s│ │11:%-7s│ │12:%-7s│ │\n" "${DRIVE_MAP[10]:-EMPTY}" "${DRIVE_MAP[11]:-EMPTY}" "${DRIVE_MAP[12]:-EMPTY}"
|
|
printf "│ ├──────────┤ ├──────────┤ ├──────────┤ │\n"
|
|
printf "│ │13:%-7s│ │14:%-7s│ │15:%-7s│ │\n" "${DRIVE_MAP[13]:-EMPTY}" "${DRIVE_MAP[14]:-EMPTY}" "${DRIVE_MAP[15]:-EMPTY}"
|
|
printf "│ └──────────┘ └──────────┘ └──────────┘ │\n"
|
|
printf "└─────────────────────────────────────────────────────────────────────────┘\n"
|
|
}
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Server-Specific Drive Mappings
|
|
# Maps PCI paths to physical bay numbers for each server
|
|
# Format: "pci-path bay-number"
|
|
#------------------------------------------------------------------------------
|
|
|
|
declare -A SERVER_MAPPINGS=(
|
|
# compute-storage-01 (formerly medium2)
|
|
# Motherboard: B650D4U3-2Q/BCM with AMD SATA controller
|
|
# HBA: LSI SAS3008 at 01:00.0 (mini-SAS HD ports)
|
|
# Cable mapping from user notes:
|
|
# - Mobo SATA: top-right=bay1, bottom-right=bay2, bottom-left=bay3, top-left=bay4
|
|
# - HBA bottom mini-SAS: bays 5,6,7,8
|
|
# - HBA top mini-SAS: bays 9,10
|
|
["compute-storage-01"]="
|
|
pci-0000:0d:00.0-ata-2 1
|
|
pci-0000:0d:00.0-ata-1 2
|
|
pci-0000:0d:00.0-ata-3 3
|
|
pci-0000:0d:00.0-ata-4 4
|
|
pci-0000:01:00.0-sas-phy6-lun-0 5
|
|
pci-0000:01:00.0-sas-phy7-lun-0 6
|
|
pci-0000:01:00.0-sas-phy5-lun-0 7
|
|
pci-0000:01:00.0-sas-phy2-lun-0 8
|
|
pci-0000:01:00.0-sas-phy4-lun-0 9
|
|
pci-0000:01:00.0-sas-phy3-lun-0 10
|
|
pci-0000:0e:00.0-nvme-1 m2-1
|
|
"
|
|
|
|
# compute-storage-gpu-01
|
|
# Motherboard: ASUS PRIME B550-PLUS with AMD SATA controller at 02:00.1
|
|
# 5 SATA ports + 1 M.2 NVMe slot
|
|
# sdf is USB/card reader - not mapped
|
|
["compute-storage-gpu-01"]="
|
|
pci-0000:02:00.1-ata-1 1
|
|
pci-0000:02:00.1-ata-2 2
|
|
pci-0000:02:00.1-ata-3 3
|
|
pci-0000:02:00.1-ata-4 4
|
|
pci-0000:02:00.1-ata-5 5
|
|
pci-0000:0c:00.0-nvme-1 m2-1
|
|
"
|
|
|
|
# storage-01
|
|
# Motherboard: ASRock A320M-HDV R4.0 with AMD SATA controller at 02:00.1
|
|
# 4 SATA ports used (ata-1, ata-2, ata-5, ata-6) - ata-3/4 empty
|
|
["storage-01"]="
|
|
pci-0000:02:00.1-ata-1 1
|
|
pci-0000:02:00.1-ata-2 2
|
|
pci-0000:02:00.1-ata-5 3
|
|
pci-0000:02:00.1-ata-6 4
|
|
"
|
|
|
|
# large1
|
|
# Custom tower with multiple controllers:
|
|
# - HBA: LSI SAS2008 at 10:00.0 (7 drives)
|
|
# - AMD SATA at 16:00.1 (3 drives)
|
|
# - ASMedia SATA at 25:00.0 (2 drives)
|
|
# - 2x NVMe slots
|
|
["large1"]="
|
|
pci-0000:10:00.0-sas-phy0-lun-0 1
|
|
pci-0000:10:00.0-sas-phy1-lun-0 2
|
|
pci-0000:10:00.0-sas-phy3-lun-0 3
|
|
pci-0000:10:00.0-sas-phy4-lun-0 4
|
|
pci-0000:10:00.0-sas-phy5-lun-0 5
|
|
pci-0000:10:00.0-sas-phy6-lun-0 6
|
|
pci-0000:10:00.0-sas-phy7-lun-0 7
|
|
pci-0000:16:00.1-ata-3 8
|
|
pci-0000:16:00.1-ata-7 9
|
|
pci-0000:16:00.1-ata-8 10
|
|
pci-0000:25:00.0-ata-1 11
|
|
pci-0000:25:00.0-ata-2 12
|
|
pci-0000:2a:00.0-nvme-1 m2-1
|
|
pci-0000:26:00.0-nvme-1 m2-2
|
|
"
|
|
|
|
# micro1
|
|
# ZimaBoard 832 - Single board computer
|
|
# 2 SATA ports on rear (currently unused)
|
|
# Boot from onboard eMMC (mmcblk0)
|
|
# SATA controller at 00:12.0
|
|
["micro1"]="
|
|
"
|
|
|
|
# monitor-02
|
|
# ZimaBoard 832 - Single board computer
|
|
# 2 SATA ports on rear (currently unused)
|
|
# Boot from onboard eMMC (mmcblk0)
|
|
# SATA controller would be at a specific PCI address when drives connected
|
|
["monitor-02"]="
|
|
"
|
|
)
|
|
|
|
declare -A CHASSIS_TYPES=(
|
|
["compute-storage-01"]="10bay"
|
|
["compute-storage-gpu-01"]="10bay"
|
|
["storage-01"]="10bay"
|
|
["large1"]="large1"
|
|
["micro1"]="micro" # ZimaBoard 832
|
|
["monitor-02"]="micro" # ZimaBoard 832
|
|
)
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Core Functions
|
|
#------------------------------------------------------------------------------
|
|
|
|
get_storage_controllers() {
|
|
# Returns a formatted list of storage controllers (HBAs, SATA, NVMe)
|
|
lspci 2>/dev/null | grep -iE "SAS|SATA|RAID|Mass storage|NVMe" | while read -r line; do
|
|
pci_addr=$(echo "$line" | awk '{print $1}')
|
|
# Get short description (strip PCI address)
|
|
desc=$(echo "$line" | sed 's/^[0-9a-f:.]\+ //')
|
|
echo " $pci_addr: $desc"
|
|
done
|
|
}
|
|
|
|
build_drive_map() {
|
|
local host=$(hostname)
|
|
declare -A drive_map
|
|
|
|
local mapping=${SERVER_MAPPINGS[$host]}
|
|
|
|
if [[ -n "$mapping" ]]; then
|
|
while read -r path slot; do
|
|
[[ -z "$path" || -z "$slot" ]] && continue
|
|
|
|
if [[ -L "/dev/disk/by-path/$path" ]]; then
|
|
local drive=$(readlink -f "/dev/disk/by-path/$path" | sed 's/.*\///')
|
|
drive_map[$slot]=$drive
|
|
fi
|
|
done <<< "$mapping"
|
|
fi
|
|
|
|
# Make drive_map available globally
|
|
declare -g -A DRIVE_MAP=()
|
|
for key in "${!drive_map[@]}"; do
|
|
DRIVE_MAP[$key]=${drive_map[$key]}
|
|
done
|
|
}
|
|
|
|
get_drive_smart_info() {
|
|
local device=$1
|
|
local smart_info=$(sudo smartctl -A -i -H /dev/$device 2>/dev/null)
|
|
local temp=$(echo "$smart_info" | grep "Temperature" | awk '{print $10}' | head -1)
|
|
local type=$(echo "$smart_info" | grep "Rotation Rate" | grep -q "Solid State" && echo "SSD" || echo "HDD")
|
|
local health=$(echo "$smart_info" | grep "SMART overall-health" | grep -q "PASSED" && echo "✓" || echo "✗")
|
|
local model=$(echo "$smart_info" | grep "Device Model\|Model Number" | cut -d: -f2 | xargs)
|
|
local serial=$(echo "$smart_info" | grep "Serial Number" | awk '{print $3}')
|
|
|
|
echo "$type|$temp°C|$health|$model|$serial"
|
|
}
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Main Display Logic
|
|
#------------------------------------------------------------------------------
|
|
|
|
HOSTNAME=$(hostname)
|
|
CHASSIS_TYPE=${CHASSIS_TYPES[$HOSTNAME]:-"unknown"}
|
|
|
|
# Display chassis layout
|
|
case "$CHASSIS_TYPE" in
|
|
"10bay")
|
|
generate_10bay_layout "$HOSTNAME"
|
|
;;
|
|
"large1")
|
|
generate_large1_layout "$HOSTNAME"
|
|
;;
|
|
"micro")
|
|
generate_micro_layout "$HOSTNAME"
|
|
;;
|
|
*)
|
|
echo "┌─────────────────────────────────────────────────────────┐"
|
|
echo "│ Unknown server: $HOSTNAME"
|
|
echo "│ No chassis mapping defined yet"
|
|
echo "│ Run diagnose-drives.sh to gather PCI path information"
|
|
echo "└─────────────────────────────────────────────────────────┘"
|
|
;;
|
|
esac
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Drive Details Section
|
|
#------------------------------------------------------------------------------
|
|
|
|
echo -e "\n=== Drive Details with SMART Status (by Bay Position) ==="
|
|
printf "%-5s %-15s %-10s %-8s %-8s %-8s %-30s %-20s %-12s %-10s %-10s\n" "BAY" "DEVICE" "SIZE" "TYPE" "TEMP" "HEALTH" "MODEL" "SERIAL" "CEPH OSD" "STATUS" "USAGE"
|
|
echo "----------------------------------------------------------------------------------------------------------------------------------------------------"
|
|
|
|
# Build reverse map: device -> bay
|
|
declare -A DEVICE_TO_BAY
|
|
for bay in "${!DRIVE_MAP[@]}"; do
|
|
device="${DRIVE_MAP[$bay]}"
|
|
if [[ -n "$device" && "$device" != "EMPTY" ]]; then
|
|
DEVICE_TO_BAY[$device]=$bay
|
|
fi
|
|
done
|
|
|
|
# Sort drives by bay position
|
|
for bay in $(printf '%s\n' "${!DRIVE_MAP[@]}" | grep -E '^[0-9]+$' | sort -n); do
|
|
device="${DRIVE_MAP[$bay]}"
|
|
if [[ -n "$device" && "$device" != "EMPTY" && -b "/dev/$device" ]]; then
|
|
size=$(lsblk -d -n -o SIZE "/dev/$device" 2>/dev/null)
|
|
smart_info=$(get_drive_smart_info "$device")
|
|
IFS='|' read -r type temp health model serial <<< "$smart_info"
|
|
|
|
# Check for Ceph OSD
|
|
osd_id=$(ceph-volume lvm list 2>/dev/null | grep -B 20 "/dev/$device" | grep "osd id" | awk '{print "osd."$3}' | head -1)
|
|
|
|
# Get Ceph status if OSD exists
|
|
ceph_status="-"
|
|
if [[ -n "$osd_id" ]]; then
|
|
# Get in/out and up/down status from ceph osd tree
|
|
osd_num=$(echo "$osd_id" | sed 's/osd\.//')
|
|
# Parse ceph osd tree output - column 5 is STATUS (up/down), column 6 is REWEIGHT (1.0 = in, 0 = out)
|
|
tree_line=$(ceph osd tree 2>/dev/null | grep -E "^\s*${osd_num}\s+" | grep "osd.${osd_num}")
|
|
up_status=$(echo "$tree_line" | awk '{print $5}')
|
|
reweight=$(echo "$tree_line" | awk '{print $6}')
|
|
|
|
# Default to unknown if we can't parse
|
|
[[ -z "$up_status" ]] && up_status="unknown"
|
|
[[ -z "$reweight" ]] && reweight="0"
|
|
|
|
# Determine in/out based on reweight (1.0 = in, 0 = out)
|
|
if (( $(echo "$reweight > 0" | bc -l 2>/dev/null || echo 0) )); then
|
|
in_status="in"
|
|
else
|
|
in_status="out"
|
|
fi
|
|
|
|
ceph_status="${up_status}/${in_status}"
|
|
else
|
|
osd_id="-"
|
|
fi
|
|
|
|
# Check if boot drive
|
|
usage="-"
|
|
if mount | grep -q "^/dev/${device}"; then
|
|
mount_point=$(mount | grep "^/dev/${device}" | awk '{print $3}' | head -1)
|
|
if [[ "$mount_point" == "/" ]]; then
|
|
usage="BOOT"
|
|
else
|
|
usage="$mount_point"
|
|
fi
|
|
fi
|
|
|
|
printf "%-5s %-15s %-10s %-8s %-8s %-8s %-30s %-20s %-12s %-10s %-10s\n" "$bay" "/dev/$device" "$size" "$type" "$temp" "$health" "$model" "$serial" "$osd_id" "$ceph_status" "$usage"
|
|
fi
|
|
done
|
|
|
|
# NVMe drives
|
|
nvme_devices=$(lsblk -d -n -o NAME,SIZE | grep "^nvme" 2>/dev/null)
|
|
if [ -n "$nvme_devices" ]; then
|
|
echo -e "\n=== NVMe Drives ==="
|
|
printf "%-15s %-10s %-10s %-40s %-25s\n" "DEVICE" "SIZE" "TYPE" "MODEL" "SERIAL"
|
|
echo "------------------------------------------------------------------------------------------------------"
|
|
echo "$nvme_devices" | while read -r name size; do
|
|
device="/dev/$name"
|
|
# Get model and serial from smartctl for accuracy
|
|
smart_info=$(sudo smartctl -i "$device" 2>/dev/null)
|
|
model=$(echo "$smart_info" | grep "Model Number" | cut -d: -f2 | xargs)
|
|
serial=$(echo "$smart_info" | grep "Serial Number" | cut -d: -f2 | xargs)
|
|
[[ -z "$model" ]] && model="-"
|
|
[[ -z "$serial" ]] && serial="-"
|
|
printf "%-15s %-10s %-10s %-40s %-25s\n" "$device" "$size" "NVMe" "$model" "$serial"
|
|
done
|
|
fi
|
|
|
|
#------------------------------------------------------------------------------
|
|
# Optional sections
|
|
#------------------------------------------------------------------------------
|
|
|
|
# Ceph RBD Devices
|
|
rbd_devices=$(lsblk -d -n -o NAME,SIZE,TYPE 2>/dev/null | grep "rbd" | sort -V)
|
|
if [ -n "$rbd_devices" ]; then
|
|
echo -e "\n=== Ceph RBD Devices ==="
|
|
printf "%-15s %-10s %-10s %-30s\n" "DEVICE" "SIZE" "TYPE" "MOUNTPOINT"
|
|
echo "------------------------------------------------------------"
|
|
echo "$rbd_devices" | while read -r name size type; do
|
|
# Get mountpoint if any
|
|
mountpoint=$(lsblk -n -o MOUNTPOINT "/dev/$name" 2>/dev/null | head -1)
|
|
[[ -z "$mountpoint" ]] && mountpoint="-"
|
|
printf "%-15s %-10s %-10s %-30s\n" "/dev/$name" "$size" "$type" "$mountpoint"
|
|
done
|
|
fi
|
|
|
|
# Show mapping diagnostic info if DEBUG is set
|
|
if [[ -n "$DEBUG" ]]; then
|
|
echo -e "\n=== DEBUG: Drive Mappings ==="
|
|
for key in "${!DRIVE_MAP[@]}"; do
|
|
echo "Bay $key: ${DRIVE_MAP[$key]}"
|
|
done | sort -n
|
|
fi
|