58 lines
2.9 KiB
Django/Jinja
58 lines
2.9 KiB
Django/Jinja
#!/bin/bash
|
|
{{ ansible_managed | comment }}
|
|
# This is the 'peak' script; applies most-aggressive amdgpu clock/power/voltage tunables
|
|
#
|
|
# AMDGPU driver/sysfs references:
|
|
# https://01.org/linuxgraphics/gfx-docs/drm/gpu/amdgpu.html
|
|
# https://docs.kernel.org/gpu/amdgpu/thermal.html
|
|
#
|
|
# start by including the 'common' script; determines card/hwmon dir/power profiles/power capability
|
|
. $(dirname "${BASH_SOURCE[0]}")/amdgpu-common.sh
|
|
|
|
{# begin the templated script for 'overclocked' AMD GPU profiles based on the existing tuned profiles #}
|
|
# set the minimum GPU clock - for best performance, this should be near the maximum
|
|
# RX6000 series power management *sucks*
|
|
echo 's 0 {{ gpu_clock_min }}' | tee /sys/class/drm/"${CARD}"/device/pp_od_clk_voltage
|
|
|
|
# set the maximum GPU clock
|
|
echo 's 1 {{ gpu_clock_max }}' | tee /sys/class/drm/"${CARD}"/device/pp_od_clk_voltage
|
|
|
|
# set the GPU *memory* clock
|
|
# normally this would appear disregarded, memory clocked at the minimum allowed by the overdrive (OD) range
|
|
# it follows the core clock; if both 0/1 profiles for _it_ are high enough, the memory will follow
|
|
echo 'm 1 {{ gpumem_clock_static }}' | tee /sys/class/drm/"${CARD}"/device/pp_od_clk_voltage
|
|
{% if gpu_mv_offset is defined %}
|
|
|
|
# offset GPU voltage {{ gpu_mv_offset }}mV
|
|
echo 'vo {{ gpu_mv_offset }}' | tee /sys/class/drm/"${CARD}"/device/pp_od_clk_voltage
|
|
{% endif %}
|
|
|
|
# commit the changes
|
|
echo 'c' | tee /sys/class/drm/"${CARD}"/device/pp_od_clk_voltage
|
|
|
|
# force GPU core and memory into highest clocks (fix flickering and poor power management)
|
|
# set manual control mode
|
|
# allows control via 'pp_dpm_mclk', 'pp_dpm_sclk', 'pp_dpm_pcie', 'pp_dpm_fclk', and 'pp_power_profile_mode' files
|
|
echo 'manual' | tee /sys/class/drm/"${CARD}"/device/power_dpm_force_performance_level
|
|
|
|
# adjust power limit using multiplier against board capability
|
|
POWER_LIM_OC=$(/usr/bin/awk -v m="$POWER_CAP" -v n={{ gpu_power_multi.overclock }} 'BEGIN {printf "%.0f", (m*n)}')
|
|
echo "$POWER_LIM_OC" | tee "${HWMON_DIR}/power1_cap"
|
|
|
|
# pp_dpm_*clk settings are unintuitive, giving profiles that may be used
|
|
echo '1' | tee /sys/class/drm/"${CARD}"/device/pp_dpm_sclk
|
|
echo '3' | tee /sys/class/drm/"${CARD}"/device/pp_dpm_mclk
|
|
echo '2' | tee /sys/class/drm/"${CARD}"/device/pp_dpm_fclk
|
|
echo '2' | tee /sys/class/drm/"${CARD}"/device/pp_dpm_socclk
|
|
|
|
# extract the VR power profile ID number
|
|
PROF_VR_NUM=$(/usr/bin/awk '$0 ~ /VR.*:/ {print $1}' <<< "$PROFILE_MODES")
|
|
|
|
# force 'overclocked' profile to 'VR' power/clock heuristics
|
|
# latency/frame timing seemed favorable with relatively-close minimum clocks
|
|
echo "${PROF_VR_NUM}" | tee /sys/class/drm/"${CARD}"/device/pp_power_profile_mode
|
|
|
|
# note 4/8/2023: instead of 'manual'... try dealing with broken power management, force clocks to high
|
|
# ref: https://gitlab.freedesktop.org/drm/amd/-/issues/1500
|
|
# followup: doesn't work that well in practice, still flaky on clocks/frame times
|
|
#echo 'high' | tee /sys/class/drm/"${CARD}"/device/power_dpm_force_performance_level
|