X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=initscripts%2Fpl_netinit;h=071873cc98fe2c979d7252b44977f3c5088315c4;hb=62296ddf166b02a91a82484d00399605f67630fc;hp=afd4c03902e5ee7e0511c8f0e5db9ec1cf2d3e69;hpb=b5b7d860157f6458aca2d69a30092ecd7fc5a616;p=bootcd.git diff --git a/initscripts/pl_netinit b/initscripts/pl_netinit index afd4c03..071873c 100755 --- a/initscripts/pl_netinit +++ b/initscripts/pl_netinit @@ -1,6 +1,8 @@ #!/bin/sh #-*-shell-script-*- +set -x + # the name of the floppy based network configuration # files (checked first). the name planet.cnf is kept # for backward compatibility with old nodes, and only @@ -56,10 +58,20 @@ IFCONFIG_OUTPUT=/tmp/ifconfig DEFAULT_NET_CONF=0 -net_init_failed() -{ +function net_init_failed() { echo echo $(date "+%H:%M:%S") " pl_netinit: network initialization failed," + echo + echo For forensics + echo + echo ========== lspci beg + /sbin/lspci -n | /bin/grep "Class 0200" + echo ========== lspci end + echo + echo ========== ifconfig beg + /sbin/ifconfig + echo ========== ifconfig end + echo echo $(date "+%H:%M:%S") " pl_netinit: shutting down machine in two hours" /bin/sleep 2h /sbin/shutdown -h now @@ -67,8 +79,7 @@ net_init_failed() } # Function for checking the IP address to see if its sensible. -check_ip() -{ +function check_ip() { case "$*" in "" | *[!0-9.]* | *[!0-9]) return 1 ;; esac @@ -83,8 +94,7 @@ check_ip() # return 1 if found and parsed. if this is the case, DEFAULT_NET_CONF will # be set to 1. For any found configuration file, $USED_NET_CONF will # contain the validated contents -find_node_config() -{ +function find_node_config() { /bin/rm -f $TMP_OLD_FLOPPY_CONF_FILE 2>&1 > /dev/null echo $(date "+%H:%M:%S") " pl_netinit: looking for node configuration file on floppy" @@ -129,7 +139,7 @@ find_node_config() # devices shopt -s nullglob - for device in /sys/block/[hs]d*; do + for device in /sys/block/[hsv]d*; do removable=$(cat $device/removable) if [[ $removable -ne 1 ]]; then continue @@ -286,20 +296,38 @@ if [[ -z "$ETH_DEVICE" ]]; then net_init_failed fi +# within a systemd-driven startup, we often see this stage +# triggered before the network interface is actually exposed +# by udev/kernel +# although of course we have network-online.target +# as a requirement; go figure what systemd actually does.. + +# in any case, let us try to work around that by allowing some delay +# here + +ALLOW=5 +COUNTER=0 +while true; do + if /sbin/ifconfig $ETH_DEVICE >& /dev/null; then + echo "pl_netinit: device present $ETH_DEVICE, proceeding (${COUNTER}s/${ALLOW}s)" + break + fi + echo $(date "+%H:%M:%S") " pl_netinit: waiting for device $ETH_DEVICE,${COUNTER}s/${ALLOW}s" + COUNTER=$(($COUNTER+1)) + [ $COUNTER -ge $ALLOW ] && net_init_failed + sleep 1 +done + # actually check to make sure ifconfig succeeds -/sbin/ifconfig $ETH_DEVICE up 2>&1 > /dev/null -if [[ $? -ne 0 ]]; then + +/sbin/ifconfig $ETH_DEVICE up 2>&1 > /dev/null || { echo $(date "+%H:%M:%S") " pl_netinit: device $ETH_DEVICE does not exist, most likely" echo $(date "+%H:%M:%S") " pl_netinit: this CD does not have hardware support for your" echo $(date "+%H:%M:%S") " pl_netinit: network adapter. please send the following lines" echo $(date "+%H:%M:%S") " pl_netinit: to your PlanetLab support for further assistance" - echo - /sbin/lspci -n | /bin/grep "Class 0200" - echo - net_init_failed -fi +} echo $(date "+%H:%M:%S") " pl_netinit: attempting to start networking" /sbin/service network start @@ -308,4 +336,3 @@ echo $(date "+%H:%M:%S") " pl_netinit: attempting to start networking" /sbin/ifconfig $ETH_DEVICE > $IFCONFIG_OUTPUT echo $(date "+%H:%M:%S") " pl_netinit: network online" -