mirror of
https://github.com/systemd/systemd-stable.git
synced 2025-01-25 06:03:40 +03:00
064a5c1438
Compared to PID1 where systemd-oomd has to be the client to PID1 because PID1 is a more privileged process than systemd-oomd, systemd-oomd is the more privileged process compared to a user manager so we have user managers be the client whereas systemd-oomd is now the server. The same varlink protocol is used between user managers and systemd-oomd to deliver ManagedOOM property updates. systemd-oomd now sets up a varlink server that user managers connect to to send ManagedOOM property updates. We also add extra validation to make sure that non-root senders don't send updates for cgroups they don't own. The integration test was extended to repeat the chill/bloat test using a user manager instead of PID1.
125 lines
4.3 KiB
Bash
Executable File
125 lines
4.3 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
set -eux
|
|
set -o pipefail
|
|
|
|
systemd-analyze log-level debug
|
|
systemd-analyze log-target console
|
|
|
|
# Loose checks to ensure the environment has the necessary features for systemd-oomd
|
|
[[ -e /proc/pressure ]] || echo "no PSI" >>/skipped
|
|
cgroup_type="$(stat -fc %T /sys/fs/cgroup/)"
|
|
if [[ "$cgroup_type" != *"cgroup2"* ]] && [[ "$cgroup_type" != *"0x63677270"* ]]; then
|
|
echo "no cgroup2" >>/skipped
|
|
fi
|
|
if [ ! -f /usr/lib/systemd/systemd-oomd ] && [ ! -f /lib/systemd/systemd-oomd ]; then
|
|
echo "no oomd" >>/skipped
|
|
fi
|
|
|
|
if [[ -e /skipped ]]; then
|
|
exit 0
|
|
fi
|
|
|
|
rm -rf /etc/systemd/system/testsuite-55-testbloat.service.d
|
|
|
|
echo "DefaultMemoryPressureDurationSec=2s" >>/etc/systemd/oomd.conf
|
|
|
|
mkdir -p /etc/systemd/system/systemd-oomd.service.d/
|
|
echo -e "[Service]\nEnvironment=SYSTEMD_LOG_LEVEL=debug" >/etc/systemd/system/systemd-oomd.service.d/debug.conf
|
|
|
|
systemctl daemon-reload
|
|
|
|
# if oomd is already running for some reasons, then restart it to make sure the above settings to be applied
|
|
if systemctl is-active systemd-oomd.service; then
|
|
systemctl restart systemd-oomd.service
|
|
fi
|
|
|
|
systemctl start testsuite-55-testchill.service
|
|
systemctl start testsuite-55-testbloat.service
|
|
|
|
# Verify systemd-oomd is monitoring the expected units
|
|
oomctl | grep "/testsuite-55-workload.slice"
|
|
oomctl | grep "20.00%"
|
|
oomctl | grep "Default Memory Pressure Duration: 2s"
|
|
|
|
systemctl status testsuite-55-testchill.service
|
|
|
|
# systemd-oomd watches for elevated pressure for 2 seconds before acting.
|
|
# It can take time to build up pressure so either wait 2 minutes or for the service to fail.
|
|
timeout="$(date -ud "2 minutes" +%s)"
|
|
while [[ $(date -u +%s) -le $timeout ]]; do
|
|
if ! systemctl status testsuite-55-testbloat.service; then
|
|
break
|
|
fi
|
|
sleep 2
|
|
done
|
|
|
|
# testbloat should be killed and testchill should be fine
|
|
if systemctl status testsuite-55-testbloat.service; then exit 42; fi
|
|
if ! systemctl status testsuite-55-testchill.service; then exit 24; fi
|
|
|
|
# Make sure we also work correctly on user units.
|
|
|
|
runas() {
|
|
declare userid=$1
|
|
shift
|
|
# shellcheck disable=SC2016
|
|
su "$userid" -s /bin/sh -c 'XDG_RUNTIME_DIR=/run/user/$UID exec "$@"' -- sh "$@"
|
|
}
|
|
|
|
runas testuser systemctl start --user testsuite-55-testchill.service
|
|
runas testuser systemctl start --user testsuite-55-testbloat.service
|
|
|
|
# Verify systemd-oomd is monitoring the expected units
|
|
oomctl | grep -E "/user.slice.*/testsuite-55-workload.slice"
|
|
oomctl | grep "20.00%"
|
|
oomctl | grep "Default Memory Pressure Duration: 2s"
|
|
|
|
runas testuser systemctl --user status testsuite-55-testchill.service
|
|
|
|
# systemd-oomd watches for elevated pressure for 2 seconds before acting.
|
|
# It can take time to build up pressure so either wait 2 minutes or for the service to fail.
|
|
timeout="$(date -ud "2 minutes" +%s)"
|
|
while [[ $(date -u +%s) -le $timeout ]]; do
|
|
if ! runas testuser systemctl --user status testsuite-55-testbloat.service; then
|
|
break
|
|
fi
|
|
sleep 2
|
|
done
|
|
|
|
# testbloat should be killed and testchill should be fine
|
|
if runas testuser systemctl --user status testsuite-55-testbloat.service; then exit 42; fi
|
|
if ! runas testuser systemctl --user status testsuite-55-testchill.service; then exit 24; fi
|
|
|
|
# only run this portion of the test if we can set xattrs
|
|
if setfattr -n user.xattr_test -v 1 /sys/fs/cgroup/; then
|
|
sleep 120 # wait for systemd-oomd kill cool down and elevated memory pressure to come down
|
|
|
|
mkdir -p /etc/systemd/system/testsuite-55-testbloat.service.d/
|
|
echo "[Service]" >/etc/systemd/system/testsuite-55-testbloat.service.d/override.conf
|
|
echo "ManagedOOMPreference=avoid" >>/etc/systemd/system/testsuite-55-testbloat.service.d/override.conf
|
|
|
|
systemctl daemon-reload
|
|
systemctl start testsuite-55-testchill.service
|
|
systemctl start testsuite-55-testmunch.service
|
|
systemctl start testsuite-55-testbloat.service
|
|
|
|
timeout="$(date -ud "2 minutes" +%s)"
|
|
while [[ "$(date -u +%s)" -le "$timeout" ]]; do
|
|
if ! systemctl status testsuite-55-testmunch.service; then
|
|
break
|
|
fi
|
|
sleep 2
|
|
done
|
|
|
|
# testmunch should be killed since testbloat had the avoid xattr on it
|
|
if ! systemctl status testsuite-55-testbloat.service; then exit 25; fi
|
|
if systemctl status testsuite-55-testmunch.service; then exit 43; fi
|
|
if ! systemctl status testsuite-55-testchill.service; then exit 24; fi
|
|
fi
|
|
|
|
systemd-analyze log-level info
|
|
|
|
echo OK >/testok
|
|
|
|
exit 0
|