Some checks failed
Docker image CI / Build and publish Docker image to Docker Hub and GitHub Containers Repository (push) Has been cancelled
151 lines
6.1 KiB
Bash
151 lines
6.1 KiB
Bash
#!/bin/bash
|
|
|
|
# Enable strict bash mode to stop the script if an uninitialized variable is used, if a command fails, or if a command with a pipe fails
|
|
# Not working in some setups : https://github.com/tigerblue77/Dell_iDRAC_fan_controller/issues/48
|
|
# set -euo pipefail
|
|
|
|
source functions.sh
|
|
source constants.sh
|
|
|
|
# Trap the signals for container exit and run graceful_exit function
|
|
trap 'graceful_exit' SIGINT SIGQUIT SIGTERM
|
|
|
|
# Prepare, format and define initial variables
|
|
|
|
# readonly DELL_FRESH_AIR_COMPLIANCE=45
|
|
|
|
# Check if FAN_SPEED variable is in hexadecimal format. If not, convert it to hexadecimal
|
|
if [[ "$FAN_SPEED" == 0x* ]]; then
|
|
readonly DECIMAL_FAN_SPEED=$(convert_hexadecimal_value_to_decimal "$FAN_SPEED")
|
|
readonly HEXADECIMAL_FAN_SPEED="$FAN_SPEED"
|
|
else
|
|
readonly DECIMAL_FAN_SPEED="$FAN_SPEED"
|
|
readonly HEXADECIMAL_FAN_SPEED=$(convert_decimal_value_to_hexadecimal "$FAN_SPEED")
|
|
fi
|
|
|
|
set_iDRAC_login_string "$IDRAC_HOST" "$IDRAC_USERNAME" "$IDRAC_PASSWORD"
|
|
|
|
get_Dell_server_model
|
|
|
|
if [[ ! $SERVER_MANUFACTURER == "DELL" ]]; then
|
|
print_error_and_exit "Your server isn't a Dell product"
|
|
fi
|
|
|
|
# If server model is Gen 14 (*40) or newer
|
|
if [[ $SERVER_MODEL =~ .*[RT][[:space:]]?[0-9][4-9]0.* ]]; then
|
|
readonly DELL_POWEREDGE_GEN_14_OR_NEWER=true
|
|
readonly CPU1_TEMPERATURE_INDEX=2
|
|
readonly CPU2_TEMPERATURE_INDEX=4
|
|
else
|
|
readonly DELL_POWEREDGE_GEN_14_OR_NEWER=false
|
|
readonly CPU1_TEMPERATURE_INDEX=1
|
|
readonly CPU2_TEMPERATURE_INDEX=2
|
|
fi
|
|
|
|
# Log main informations
|
|
echo "Server model: $SERVER_MANUFACTURER $SERVER_MODEL"
|
|
echo "iDRAC/IPMI host: $IDRAC_HOST"
|
|
|
|
# Log the fan speed objective, CPU temperature threshold and check interval
|
|
echo "Fan speed objective: $DECIMAL_FAN_SPEED%"
|
|
echo "CPU temperature threshold: "$CPU_TEMPERATURE_THRESHOLD"°C"
|
|
echo "Check interval: ${CHECK_INTERVAL}s"
|
|
echo ""
|
|
|
|
TABLE_HEADER_PRINT_COUNTER=$TABLE_HEADER_PRINT_INTERVAL
|
|
# Set the flag used to check if the active fan control profile has changed
|
|
IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED=true
|
|
|
|
# Check present sensors
|
|
IS_EXHAUST_TEMPERATURE_SENSOR_PRESENT=true
|
|
IS_CPU2_TEMPERATURE_SENSOR_PRESENT=true
|
|
|
|
# Start timer in background
|
|
sleep "$CHECK_INTERVAL" &
|
|
SLEEP_PROCESS_PID=$!
|
|
|
|
retrieve_temperatures $IS_EXHAUST_TEMPERATURE_SENSOR_PRESENT $IS_CPU2_TEMPERATURE_SENSOR_PRESENT
|
|
|
|
if [ -z "$EXHAUST_TEMPERATURE" ]; then
|
|
echo "No exhaust temperature sensor detected."
|
|
IS_EXHAUST_TEMPERATURE_SENSOR_PRESENT=false
|
|
fi
|
|
if [ -z "$CPU2_TEMPERATURE" ]; then
|
|
echo "No CPU2 temperature sensor detected."
|
|
IS_CPU2_TEMPERATURE_SENSOR_PRESENT=false
|
|
fi
|
|
# Output new line to beautify output if one of the previous conditions have echoed
|
|
if ! $IS_EXHAUST_TEMPERATURE_SENSOR_PRESENT || ! $IS_CPU2_TEMPERATURE_SENSOR_PRESENT; then
|
|
echo ""
|
|
fi
|
|
|
|
#readonly NUMBER_OF_DETECTED_CPUS=(${CPUS_TEMPERATURES//;/ })
|
|
# TODO : write "X CPU sensors detected." and remove previous ifs
|
|
readonly HEADER=$(build_header $NUMBER_OF_DETECTED_CPUS)
|
|
|
|
# Start monitoring
|
|
while true; do
|
|
# Initialize a variable to store the comments displayed when the fan control profile changed
|
|
COMMENT=" -"
|
|
# Check if CPU 1 is overheating then apply Dell default dynamic fan control profile if true
|
|
if CPU1_OVERHEATING; then
|
|
apply_Dell_default_fan_control_profile
|
|
|
|
if ! $IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED; then
|
|
IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED=true
|
|
|
|
# If CPU 2 temperature sensor is present, check if it is overheating too.
|
|
# Do not apply Dell default dynamic fan control profile as it has already been applied before
|
|
if $IS_CPU2_TEMPERATURE_SENSOR_PRESENT && CPU2_OVERHEATING; then
|
|
COMMENT="CPU 1 and CPU 2 temperatures are too high, Dell default dynamic fan control profile applied for safety"
|
|
else
|
|
COMMENT="CPU 1 temperature is too high, Dell default dynamic fan control profile applied for safety"
|
|
fi
|
|
fi
|
|
# If CPU 2 temperature sensor is present, check if it is overheating then apply Dell default dynamic fan control profile if true
|
|
elif $IS_CPU2_TEMPERATURE_SENSOR_PRESENT && CPU2_OVERHEATING; then
|
|
apply_Dell_default_fan_control_profile
|
|
|
|
if ! $IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED; then
|
|
IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED=true
|
|
COMMENT="CPU 2 temperature is too high, Dell default dynamic fan control profile applied for safety"
|
|
fi
|
|
else
|
|
apply_user_fan_control_profile
|
|
|
|
# Check if user fan control profile is applied then apply it if not
|
|
if $IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED; then
|
|
IS_DELL_DEFAULT_FAN_CONTROL_PROFILE_APPLIED=false
|
|
COMMENT="CPU temperature decreased and is now OK (<= $CPU_TEMPERATURE_THRESHOLD°C), user's fan control profile applied."
|
|
fi
|
|
fi
|
|
|
|
# If server model is not Gen 14 (*40) or newer
|
|
if ! $DELL_POWEREDGE_GEN_14_OR_NEWER; then
|
|
# Enable or disable, depending on the user's choice, third-party PCIe card Dell default cooling response
|
|
# No comment will be displayed on the change of this parameter since it is not related to the temperature of any device (CPU, GPU, etc...) but only to the settings made by the user when launching this Docker container
|
|
if "$DISABLE_THIRD_PARTY_PCIE_CARD_DELL_DEFAULT_COOLING_RESPONSE"; then
|
|
disable_third_party_PCIe_card_Dell_default_cooling_response
|
|
THIRD_PARTY_PCIE_CARD_DELL_DEFAULT_COOLING_RESPONSE_STATUS="Disabled"
|
|
else
|
|
enable_third_party_PCIe_card_Dell_default_cooling_response
|
|
THIRD_PARTY_PCIE_CARD_DELL_DEFAULT_COOLING_RESPONSE_STATUS="Enabled"
|
|
fi
|
|
fi
|
|
|
|
# Print temperatures, active fan control profile and comment if any change happened during last time interval
|
|
if [ $TABLE_HEADER_PRINT_COUNTER -eq $TABLE_HEADER_PRINT_INTERVAL ]; then
|
|
printf "%s\n" "$HEADER"
|
|
TABLE_HEADER_PRINT_COUNTER=0
|
|
fi
|
|
print_temperature_array_line "$INLET_TEMPERATURE" "$CPUS_TEMPERATURES" "$EXHAUST_TEMPERATURE" "$CURRENT_FAN_CONTROL_PROFILE" "$THIRD_PARTY_PCIE_CARD_DELL_DEFAULT_COOLING_RESPONSE_STATUS" "$COMMENT"
|
|
((TABLE_HEADER_PRINT_COUNTER++))
|
|
|
|
wait $SLEEP_PROCESS_PID
|
|
|
|
# Start timer in background for next cycle
|
|
sleep "$CHECK_INTERVAL" &
|
|
SLEEP_PROCESS_PID=$!
|
|
|
|
retrieve_temperatures $IS_EXHAUST_TEMPERATURE_SENSOR_PRESENT $IS_CPU2_TEMPERATURE_SENSOR_PRESENT
|
|
done
|