X-Git-Url: http://git.rot13.org/?a=blobdiff_plain;f=recepies%2Flxc%2Flxc-watchdog.sh;h=a68d33bb1ac055acba840e723751d54c8fc3db22;hb=132f2c88b2fb189b6fc60334792e125d470ee8d6;hp=1188db644d43579c68ea515d4ed0aa5a5ec0dbd5;hpb=ac40db6443f92542815501d209280c9376fe5038;p=sysadmin-cookbook diff --git a/recepies/lxc/lxc-watchdog.sh b/recepies/lxc/lxc-watchdog.sh index 1188db6..a68d33b 100755 --- a/recepies/lxc/lxc-watchdog.sh +++ b/recepies/lxc/lxc-watchdog.sh @@ -1,14 +1,25 @@ -#!/bin/sh - -# lxc-watchdog.sh -# -# Dobrica Pavlinusic 2010-03-15 -# -# this script can be used to start/stop Linux containers -# using clever inotify hack to monitor halt/reboot from -# Tony Risinger posted to lxc-users mailing list +#! /bin/sh +### BEGIN INIT INFO +# Provides: lxc-watchdog +# Required-Start: $remote_fs $named $network $time +# Required-Stop: $remote_fs $named $network +# Required-Start: +# Required-Stop: +# Default-Start: 2 3 4 5 +# Default-Stop: 0 1 6 +# Short-Description: Manage Linux Containers startup/shutdown +# Description: Uses clever inotify hack to monitor container's +# halt/reboot events watching /var/run/utmp +### END INIT INFO + +# Author: Dobrica Pavlinusic # +# based on Tony Risinger post to lxc-users mailing list # http://www.mail-archive.com/lxc-users@lists.sourceforge.net/msg00074.html +# +# Install with: +# ln -sf /srv/sysadmin-cookbook/recepies/lxc/lxc-watchdog.sh /etc/init.d/lxc-watchdog +# update-rc.d lxc-watchdog defaults which inotifywait >/dev/null || apt-get install inotify-tools @@ -26,16 +37,18 @@ lxc_exists() { lxc_rootfs() { - grep lxc.rootfs "/var/lib/lxc/$1/config" | cut -d= -f2 | sed 's/^ *//' + grep '^ *lxc\.rootfs *=' "/var/lib/lxc/$1/config" | cut -d= -f2 | sed 's/^ *//' } lxc_status() { - lxc-ls -1 | sort -u | xargs -i lxc-info -n {} | sed "s/'//g" | while read name is status ; do - on_boot=" " - test -s /var/lib/lxc/$name/on_boot && on_boot="on_boot" - echo "$name $status $on_boot $(lxc_rootfs $name)" - done + ( find /var/lib/lxc/ -name "config" | cut -d/ -f5 | sort -u | xargs -i lxc-info -n {} | sed "s/'//g" | while read name is status ; do + boot="-" + hostname=`cat $(lxc_rootfs $name)/etc/hostname` + ip=`grep address $(lxc_rootfs $name)/etc/network/interfaces | sed 's/.*address //'` + test -s /var/lib/lxc/$name/on_boot && boot="boot" + echo "$name $status $boot $(lxc_rootfs $name) $ip $hostname" + done ) | column -t } @@ -46,7 +59,10 @@ cleanup_init_scripts() { $rootfs/etc/rc?.d/*umountfs \ $rootfs/etc/rc?.d/*umountroot \ $rootfs/etc/rc?.d/*hwclock* \ + $rootfs/etc/rc?.d/*udev* \ 2>/dev/null | xargs -i rm -v {} + + echo $1 > $rootfs/etc/hostname } @@ -57,7 +73,7 @@ setup_inittab() { # let container respond to kill -SIGPWR inittab=$rootfs/etc/inittab - if ! grep "$add" ${inittab} >/dev/null ; then + if test -e $inittab && ! grep "$add" ${inittab} >/dev/null ; then grep -v "$remove" ${inittab} > ${inittab}.new echo $add >> ${inittab}.new mv ${inittab}.new ${inittab} @@ -66,6 +82,11 @@ setup_inittab() { } +lxc_log() { + echo `date +%Y-%m-%dT%H:%M:%S` $* +} + + lxc_kill() { name=$1 sig=$2 @@ -75,26 +96,34 @@ lxc_kill() { lxc-info -n $name exit 1 fi - echo "$name kill $sig $init_pid" + lxc_log "$name kill $sig $init_pid" /bin/kill $sig $init_pid } lxc_stop() { + lxc_log "$name stop" lxc_kill $name -SIGPWR lxc-wait -n $name -s STOPPED + lxc_log "$name stoped" # rm -f /var/lib/lxc/${name}/on_boot } lxc_start() { name=$1 + rootfs=$(lxc_rootfs $1) + + if [ ! -e $rootfs ] ; then + echo "ERROR $name rootfs $rootfs not found" + return + fi if ! lxc-info -n $name | grep RUNNING ; then - echo "$name start" + lxc_log "$name start" lxc-start -n $name -o /tmp/${name}.log -d lxc-wait -n $name -s RUNNING lxc-info -n $name - echo $name > /var/lib/lxc/${name}/on_boot + test -f /var/lib/lxc/${name}/on_boot || echo $name > /var/lib/lxc/${name}/on_boot fi } @@ -109,20 +138,20 @@ while true; do if [ "$tasks" -eq 1 ]; then runlevel="$(runlevel ${vps_utmp})" - echo `date +%Y-%m-%dT%H:%M:%S` "$name runlevel $runlevel" + lxc_log "$name runlevel $runlevel" case $runlevel in N*) # nothing for new boot state ;; ??0) - echo "$name halt" + lxc_log "$name halt" lxc-stop -n "${name}" lxc-wait -n ${name} -s STOPPED break ;; ??6) - echo "$name reboot"; + lxc_log "$name reboot"; lxc-stop -n ${name} lxc-wait -n ${name} -s STOPPED lxc-start -d -n ${name} -o /tmp/${name}.log @@ -134,18 +163,23 @@ while true; do ;; esac else - echo "# $name $tasks tasks" + lxc_log "$name $tasks tasks" fi # time of 5 minutes on it JUST IN CASE... inotifywait -qqt 300 ${vps_utmp} done -echo "${name} exited" +lxc_log "$name watchdog exited" } +usage() { + echo "Usage: $0 {start|stop|restart|status|boot|disable} [name name ... ]" >&2 + exit 3 +} + command_on_lxc() { command=$1 shift @@ -157,10 +191,12 @@ case "$command" in start) lxc_exists $1 cleanup_init_scripts $1 - setup_inittab $1 ::power "p0::powerfail:/sbin/init 0" - setup_inittab $1 ::ctrlaltdel "p6::ctrlaltdel:/sbin/init 6" + setup_inittab $1 ":respawn:/sbin/getty.*tty1" "c1:12345:respawn:/sbin/getty 38400 tty1 linux" + setup_inittab $1 "::power" "p0::powerfail:/sbin/init 0" + setup_inittab $1 "::ctrlaltdel" "p6::ctrlaltdel:/sbin/init 6" lxc_start $1 - ( nohup $0 watchdog $1 >> /tmp/$1.log 2>/dev/null ) & + # give container 5 seconds to start more than one process + ( sleep 5 ; nohup $0 watchdog $1 >> /tmp/$1.log 2>/dev/null ) & ;; stop|halt) lxc_exists $1 @@ -172,9 +208,14 @@ reload|force-reload|restart|reboot) watchdog) lxc_watchdog $1 ;; +boot) + echo $1 > /var/lib/lxc/$1/on_boot + ;; +disable) + echo -n > /var/lib/lxc/$1/on_boot + ;; *) - echo "Usage: $0 {start|stop|restart|status}" >&2 - exit 3 + usage ;; esac @@ -182,14 +223,18 @@ esac } command=$1 -shift - +test -z "$command" && usage test "$command" = "status" && lxc_status && exit +shift if [ -z "$1" ] ; then ls /var/lib/lxc/*/on_boot | while read path ; do name=`echo $path | cut -d/ -f5` - command_on_lxc $command $name + if [ "$command" != "start" -o "$command" = "start" -a -s $path ] ; then + command_on_lxc $command $name + else + echo "# skip $command $name" + fi done else while [ ! -z "$1" ] ; do