forked from ISTI-ansible-roles/ansible-roles
library/roles/rstudio-server: Optionally install script and cron job to kill abuser processes. See https://support.d4science.org/issues/6941
This commit is contained in:
parent
572387dad2
commit
2fddf89a92
|
@ -3,3 +3,7 @@ rstudio_install_server: False
|
||||||
rstudio_enabled: True
|
rstudio_enabled: True
|
||||||
rstudio_file: rstudio-server-0.99.903-amd64.deb
|
rstudio_file: rstudio-server-0.99.903-amd64.deb
|
||||||
rstudio_download_url: 'https://download2.rstudio.org/{{ rstudio_file }}'
|
rstudio_download_url: 'https://download2.rstudio.org/{{ rstudio_file }}'
|
||||||
|
|
||||||
|
rstudio_install_kill_script: True
|
||||||
|
# cron job minutes
|
||||||
|
rstudio_kill_script_frequency: "*/5"
|
||||||
|
|
|
@ -0,0 +1,78 @@
|
||||||
|
#!/bin/bash
|
||||||
|
#
|
||||||
|
# TODO:
|
||||||
|
# - print nagios friendly output into a file
|
||||||
|
# - kill rsession processes older than N days
|
||||||
|
#
|
||||||
|
|
||||||
|
set -e
|
||||||
|
set -o pipefail
|
||||||
|
|
||||||
|
CMD_NAME=$0
|
||||||
|
|
||||||
|
USER_N=
|
||||||
|
USER_SESSION_PID=
|
||||||
|
USER_PROCS_PIDS_ALL=
|
||||||
|
USER_PROCS_TO_KILL=
|
||||||
|
USER_PROCS_PARENTS=
|
||||||
|
USER_PROCS_PARENT_PID=
|
||||||
|
SPARE_MEM=1048576
|
||||||
|
OUT_DIR=$( mktemp -d -t kill-rogue-jobs.XXXXXXXXXX )
|
||||||
|
USER_PROCS_LIST=$OUT_DIR/proclist
|
||||||
|
USER_PROCS_PARENTS=$OUT_DIR/parents
|
||||||
|
|
||||||
|
trap "eval logger '$CMD_NAME: trap intercepted, exiting.' ; cleanup" SIGHUP SIGINT SIGTERM
|
||||||
|
|
||||||
|
function cleanup() {
|
||||||
|
rm -fr $OUT_DIR
|
||||||
|
}
|
||||||
|
|
||||||
|
function find_rogue_processes() {
|
||||||
|
eval logger '$CMD_NAME: find_rogue_processes for user $USER_N'
|
||||||
|
ps -edaf | grep rsession | grep -v grep | grep ${USER_N} | awk '{ print $3 }' | uniq > $USER_PROCS_PARENTS
|
||||||
|
ps -edaf | grep rsession | grep -v grep | grep ${USER_N} | awk '{ print $2 }' | uniq > $USER_PROCS_LIST
|
||||||
|
for parent in $( cat $USER_PROCS_PARENTS ) ; do
|
||||||
|
grep -v $parent $USER_PROCS_LIST > $USER_PROCS_LIST.tmp
|
||||||
|
mv $USER_PROCS_LIST.tmp $USER_PROCS_LIST
|
||||||
|
done
|
||||||
|
USER_PROCS_TO_KILL=$( cat $USER_PROCS_LIST )
|
||||||
|
}
|
||||||
|
|
||||||
|
function exterminate() {
|
||||||
|
eval logger '$CMD_NAME: exterminate killing user $USER_N processes'
|
||||||
|
for pid in $( echo $USER_PROCS_TO_KILL ) ; do
|
||||||
|
kill -15 $pid
|
||||||
|
done
|
||||||
|
}
|
||||||
|
|
||||||
|
USERS_SESSIONS=$( ps -edaf | grep rsession | grep -v defunct | grep -v grep | awk '{ print $10 }' | uniq )
|
||||||
|
|
||||||
|
if [ -z $USERS_SESSIONS ] ; then
|
||||||
|
eval logger '$CMD_NAME: There are no active sessions'
|
||||||
|
exit 0
|
||||||
|
fi
|
||||||
|
NUM_CPUS=$( grep processor /proc/cpuinfo | wc -l )
|
||||||
|
ALLOWED_THREADS=$(( $NUM_CPUS - 1 ))
|
||||||
|
TOTAL_MEM=$( grep MemTotal /proc/meminfo | awk '{ print $2 }' )
|
||||||
|
ALLOWED_USED_MEM=$(( $TOTAL_MEM - $SPARE_MEM ))
|
||||||
|
|
||||||
|
for USER_N in $( echo $USERS_SESSIONS ) ; do
|
||||||
|
USER_PROCS=$( ps -edaf | grep rsession | grep -v grep | grep ${USER_N} | wc -l )
|
||||||
|
USER_MEM=$( ps -eo pid,rss,vsz,args | grep rsession | grep -v grep | grep ${USER_N} | awk '{ print $2}' | paste -sd+ | bc )
|
||||||
|
if [ $USER_PROCS -gt $ALLOWED_THREADS ] || [ $USER_MEM -gt $ALLOWED_USED_MEM ] ; then
|
||||||
|
if [ $USER_PROCS -gt $ALLOWED_THREADS ] ; then
|
||||||
|
eval logger '$CMD_NAME: user $USER_N is running too many processes'
|
||||||
|
fi
|
||||||
|
if [ $USER_MEM -gt $ALLOWED_USED_MEM ] ; then
|
||||||
|
eval logger '$CMD_NAME: user $USER_N is using too much memory'
|
||||||
|
fi
|
||||||
|
find_rogue_processes
|
||||||
|
exterminate
|
||||||
|
else
|
||||||
|
eval logger '$CMD_NAME: we do not need to kill any processes for user $USER_N'
|
||||||
|
fi
|
||||||
|
done
|
||||||
|
|
||||||
|
trap cleanup EXIT
|
||||||
|
exit 0
|
||||||
|
|
|
@ -12,7 +12,6 @@
|
||||||
args:
|
args:
|
||||||
creates: /srv/{{ rstudio_file }}
|
creates: /srv/{{ rstudio_file }}
|
||||||
register: rstudio_download
|
register: rstudio_download
|
||||||
ignore_errors: True
|
|
||||||
|
|
||||||
- name: Install the rstudio server package
|
- name: Install the rstudio server package
|
||||||
command: gdebi -n -q /srv/{{ rstudio_file }}
|
command: gdebi -n -q /srv/{{ rstudio_file }}
|
||||||
|
@ -30,6 +29,16 @@
|
||||||
service: name=rstudio-server state=stopped enabled=no
|
service: name=rstudio-server state=stopped enabled=no
|
||||||
when: not rstudio_enabled
|
when: not rstudio_enabled
|
||||||
|
|
||||||
|
- name: Install a script that kills the abusing job processes
|
||||||
|
copy: src=kill-rogue-jobs dest=/usr/local/bin/kill-rogue-jobs owner=root group=root mode=0755
|
||||||
|
when: rstudio_install_kill_script
|
||||||
|
tags: [ 'rstudio', 'rstudio_server', 'rstudio_kill_rogues' ]
|
||||||
|
|
||||||
|
- name: Install a cron job that kills the abusing jobs
|
||||||
|
cron: name="Kill rogue jobs" job="/usr/local/bin/kill-rogue-jobs" user=root minute="{{ rstudio_kill_script_frequency }}"
|
||||||
|
when: rstudio_install_kill_script
|
||||||
|
tags: [ 'rstudio', 'rstudio_server', 'rstudio_kill_rogues' ]
|
||||||
|
|
||||||
when: rstudio_install_server
|
when: rstudio_install_server
|
||||||
tags: [ 'rstudio', 'rstudio_server' ]
|
tags: [ 'rstudio', 'rstudio_server' ]
|
||||||
|
|
||||||
|
@ -44,5 +53,11 @@
|
||||||
- gdebi
|
- gdebi
|
||||||
- rstudio-server
|
- rstudio-server
|
||||||
|
|
||||||
|
- name: Remove the script that kills the abusing job processes
|
||||||
|
file: dest=/usr/local/bin/kill-rogue-jobs state=absent
|
||||||
|
|
||||||
|
- name: Remove the cron job that kills the abusing jobs
|
||||||
|
cron: name="Kill rogue jobs" job="/usr/local/bin/kill-rogue-jobs" user=root minute="{{ rstudio_kill_script_frequency }}" state=absent
|
||||||
|
|
||||||
when: not rstudio_install_server
|
when: not rstudio_install_server
|
||||||
tags: [ 'rstudio', 'rstudio_server' ]
|
tags: [ 'rstudio', 'rstudio_server' ]
|
||||||
|
|
Loading…
Reference in New Issue