RDK X5 Monitor — 系统监控
操作步骤
1. CPU 状态
# CPU utilisation snapshot: one batch-mode iteration of top, first five lines
top -bn1 | head -n 5
# Current frequency of every core (kHz); grep -H prefixes each value with its
# sysfs path so the core it belongs to is identifiable
grep -H . /sys/devices/system/cpu/cpu*/cpufreq/scaling_cur_freq
# Active cpufreq governor (frequency-scaling policy) of cpu0
cat /sys/devices/system/cpu/cpu0/cpufreq/scaling_governor
2. BPU 算力监控
# BPU utilisation (0-100)
cat /sys/devices/system/bpu/bpu0/ratio
# BPU current frequency (the glob covers whatever devfreq node sits under bpu0)
cat /sys/devices/system/bpu/bpu0/devfreq/*/cur_freq
3. 温度
# SoC temperature in millidegrees Celsius (divide by 1000 to get °C)
cat /sys/class/thermal/thermal_zone0/temp
# BPU temperature (hwmon temp*_input values are also in millidegrees Celsius)
cat /sys/class/hwmon/hwmon0/temp1_input
芯片温度超过 95°C 时会自动降频,极限温度为 105°C。
4. 内存与磁盘
free -h # memory usage, human-readable units
df -h # disk usage per mounted filesystem, human-readable units
5. GPU 频率
# The glob matches every devfreq-managed device, not only the GPU, so each
# current frequency is printed prefixed with its sysfs path; pick the GPU line
# by its device name. Errors are silenced in case no devfreq device exists.
grep -H . /sys/class/devfreq/*/cur_freq 2>/dev/null
6. 网络 IP
# IPv4 address lines only: drop the loopback entry first, then keep "inet" rows
ip -4 addr show | grep -v '127.0.0.1' | grep 'inet'
# Addresses of this host on a single line
hostname -I
7. 一键状态总览
# One-shot status overview.
# Sections run independently instead of being chained with '&&', so a failing
# probe (for example a missing BPU sysfs node) prints N/A rather than silently
# dropping every later section. The subshell keeps temp_milli out of the
# interactive shell.
(
  echo "=== CPU ==="
  top -bn1 | head -n 5
  echo "=== BPU ==="
  cat /sys/devices/system/bpu/bpu0/ratio 2>/dev/null || echo "N/A"
  echo "=== Temp ==="
  if temp_milli=$(cat /sys/class/thermal/thermal_zone0/temp 2>/dev/null); then
    # The node reports millidegrees Celsius; integer division gives whole degrees
    echo "$((temp_milli / 1000))°C"
  else
    echo "N/A"
  fi
  echo "=== Mem ==="
  free -h | head -n 2
  echo "=== Disk ==="
  df -h / | tail -n 1
  echo "=== IP ==="
  hostname -I
)
8. 持续监控(每 2 秒刷新)
# Live view refreshed every 2 seconds: CPU summary line, BPU utilisation,
# SoC temperature in whole °C, and the first two lines of free.
# The command list is single-quoted so the invoking shell does not expand the
# $(...) substitutions; watch re-runs the string on each refresh, so the values
# are re-read every time.
watch -n 2 'echo "CPU: $(top -bn1 | grep Cpu | head -1)" && \
echo "BPU: $(cat /sys/devices/system/bpu/bpu0/ratio 2>/dev/null)%" && \
echo "Temp: $(($(cat /sys/class/thermal/thermal_zone0/temp)/1000))°C" && \
free -h | head -2'
排查故障
| 现象 | 原因 | 解决 |
|---|---|---|
| CPU 100% 持续 | 进程占满 | top 查看高占用进程;kill 或降低负载 |
| 温度 >90°C | 散热不足 | 加装散热片/风扇;降低 BPU 负载 |
| BPU ratio 始终 0 | 无推理任务运行 | 正常现象;启动 AI 推理后会上升 |
| 磁盘满 | 日志或备份过大 | du -sh /var/log/*;sudo apt clean |