-
-
Save fonic/8f38e5e3ce5c8693ae3a23aa1af21fb9 to your computer and use it in GitHub Desktop.
#!/usr/bin/env bash | |
# ------------------------------------------------------------------------- | |
# - | |
# Created by Fonic (https://github.com/fonic) - | |
# Date: 12/29/19 - 02/12/20 - | |
# - | |
# Created for and tested on single-GPU system equipped with NVIDIA - | |
# GeForce RTX 2060 SUPER. For other systems, modifications might be - | |
# required. - | |
# - | |
# Based on: - | |
# https://gist.github.com/frantic1048/41f56fd6328fa83ce6ad5acb3a4c0336 - | |
# https://gist.github.com/hacker1024/c01a773f50769bd8216fa01ea0a1ef33 - | |
# https://techbase.kde.org/Development/Tutorials/Sensors - | |
# - | |
# ------------------------------------------------------------------------- | |
# Globals | |
MAX_GPU_TEMP=100 # maximum GPU temperature in °C | |
MAX_MEM_USED=8192 # maximum memory used in MB | |
MAX_GPU_CLOCK=2100 # maximum GPU clock in MHz | |
MAX_MEM_CLOCK=7000 # maximum memory clock in MHz | |
MAX_FAN_RPM=3000 # maximum fan speed in RPM | |
# Main loop | |
echo "ksysguardd 1.2.0" | |
echo -n "ksysguardd> " | |
last_update=$((${SECONDS} - 1)) | |
while read -r input; do | |
# Update monitor data just in time, but not more often than once per second | |
# NOTE: | |
# nvidia-settings will stop printing data on the first error it encounters. | |
# Thus, queries for [fan:1] have to be placed at the end of the list for the | |
# script to work on systems with only one fan | |
if (( ${SECONDS} < ${last_update} || ${SECONDS} - ${last_update} >= 1 )); then | |
readarray -t lines < <(nvidia-settings -t \ | |
-q [gpu:0]/GPUCoreTemp \ | |
-q [gpu:0]/UsedDedicatedGPUMemory \ | |
-q [gpu:0]/GPUCurrentClockFreqs \ | |
-q [gpu:0]/GPUUtilization \ | |
-q [fan:0]/GPUCurrentFanSpeed \ | |
-q [fan:0]/GPUCurrentFanSpeedRPM \ | |
-q [fan:1]/GPUCurrentFanSpeed \ | |
-q [fan:1]/GPUCurrentFanSpeedRPM \ | |
) | |
gpu_temp="${lines[0]}" | |
mem_used="${lines[1]}" | |
gpu_clock="${lines[2]%,*}" | |
mem_clock="${lines[2]#*,}" | |
re="^graphics=([0-9]+), memory=([0-9]+), video=([0-9]+), PCIe=([0-9]+)$" | |
if [[ "${lines[3]}" =~ ${re} ]]; then | |
gpu_load="${BASH_REMATCH[1]}" | |
mem_load="${BASH_REMATCH[2]}" | |
vpu_load="${BASH_REMATCH[3]}" | |
pcie_load="${BASH_REMATCH[4]}" | |
fi | |
fan0_load="${lines[4]}" | |
fan0_rpm="${lines[5]}" | |
fan1_load="${lines[6]}" | |
fan1_rpm="${lines[7]}" | |
last_update=${SECONDS} | |
fi | |
# Evaluate input, generate output | |
case "${input}" in | |
# List of monitors (format: '<id>\t<data-type>') | |
"monitors") | |
echo -e "gpu_temp\tinteger" | |
echo -e "mem_used\tinteger" | |
echo -e "gpu_clock\tinteger" | |
echo -e "mem_clock\tinteger" | |
echo -e "gpu_load\tinteger" | |
echo -e "mem_load\tinteger" | |
echo -e "vpu_load\tinteger" | |
echo -e "pcie_load\tinteger" | |
echo -e "fan0_load\tinteger" | |
echo -e "fan0_rpm\tinteger" | |
echo -e "fan1_load\tinteger" | |
echo -e "fan1_rpm\tinteger" | |
;; | |
# Monitor info (format: '<label>\t<min-value>\t<max-value>\t<unit>') | |
"gpu_temp?") echo -e "GPU\t0\t${MAX_GPU_TEMP}\t°C"; ;; | |
"mem_used?") echo -e "MEM\t0\t${MAX_MEM_USED}\tMB"; ;; | |
"gpu_clock?") echo -e "GPU\t0\t${MAX_GPU_CLOCK}\tMHz"; ;; | |
"mem_clock?") echo -e "MEM\t0\t${MAX_MEM_CLOCK}\tMHz"; ;; | |
"gpu_load?") echo -e "GPU\t0\t100\t%"; ;; | |
"mem_load?") echo -e "MEM\t0\t100\t%"; ;; | |
"vpu_load?") echo -e "VPU\t0\t100\t%"; ;; | |
"pcie_load?") echo -e "PCIe\t0\t100\t%"; ;; | |
"fan0_load?") echo -e "FAN1\t0\t100\t%"; ;; | |
"fan0_rpm?") echo -e "FAN1\t0\t${MAX_FAN_RPM}\tRPM"; ;; | |
"fan1_load?") echo -e "FAN2\t0\t100\t%"; ;; | |
"fan1_rpm?") echo -e "FAN2\t0\t${MAX_FAN_RPM}\tRPM"; ;; | |
# Monitor data (format: '<value>') | |
"gpu_temp") echo "${gpu_temp}"; ;; | |
"mem_used") echo "${mem_used}"; ;; | |
"gpu_clock") echo "${gpu_clock}"; ;; | |
"mem_clock") echo "${mem_clock}"; ;; | |
"gpu_load") echo "${gpu_load}"; ;; | |
"mem_load") echo "${mem_load}"; ;; | |
"vpu_load") echo "${vpu_load}"; ;; | |
"pcie_load") echo "${pcie_load}"; ;; | |
"fan0_load") echo "${fan0_load}"; ;; | |
"fan0_rpm") echo "${fan0_rpm}"; ;; | |
"fan1_load") echo "${fan1_load}"; ;; | |
"fan1_rpm") echo "${fan1_rpm}"; ;; | |
"exit"|"quit") break; ;; | |
esac | |
# Renew prompt | |
echo -n "ksysguardd> " | |
done |
cool script thank you!
Any chance you could implement reading the Power draw of the GPU?
It can be read using:
nvidia-smi --query-gpu=power.draw --format=csv
but I haven't managed to read it using nvidia-settings (as you do in your script)
@alexanderhelbok: you're welcome.
Just had a quick look at nvidia-smi
. My script could now be completely rewritten to use that instead of nvidia-settings
. Back in 2019 when I initially created the script, nvidia-smi
was still in its infancy and could only query/display a handful of metrics, thus nvidia-settings
was the only way to go.
However, I'm quite certain that I won't rewrite it - KSysGuard is deprecated in favor of Plasma System Monitor anyway, thus the script will become deprecated as well in the foreseeable future.
True fair enough, time to switch to Plasma System Monitor then ^^
True fair enough, time to switch to Plasma System Monitor then ^^
... which already has built-in NVIDIA support, albeit quite limited. I think what Plasma System Monitor can currently monitor for NVIDIA GPUs is exactly what nvidia-smi
used to provide back then. If I find the time, I might consider contributing to Plasma System Monitor and extend NVIDIA support further.
This is seriously cool, thank you!
I wish System Monitor was this extensive, but I might have to switch back for detailed metrics now!
@fubarhouse Thanks, glad you like it. I'm actually still using KSysGuard and this script myself - last time I checked System Monitor wasn't really to my liking.
+1 for: nice!
I grouped some sensors and ended up liking this layout.
https://gist.github.com/BETLOG/85f069c248daa1ccfd8b4996a0bb5b28