mirror of
https://github.com/xcat2/xcat-core.git
synced 2025-10-23 23:45:33 +00:00
- zvmdiscovery plugin will not handle findme - do not change the request if there are no temp discovered bmc nodes, to avoid a confusing error message - add more logs, and ignore the `ipmitool sol info` error output
310 lines
14 KiB
Bash
Executable File
310 lines
14 KiB
Bash
Executable File
#!/bin/bash
#Node discovery: collect this node's inventory into an XML "findme" request,
#sign it with /etc/xcat/privkey.pem and keep sending it until /restart shows up.

#tag used for every logger message of this script
log_label="xcat.genesis.dodiscovery"

#the time (seconds since the epoch) when the latest findme request is sent to master
reqtime=0

#the timeout value (seconds) on the waiting for the "processed" response from master
#when the xcatd on master finished the processing of my findme request,
#a "processed" response will be replied
maxresptime=180

#start the minixcatd.awk helper in the background
minixcatd.awk &

#public half of the node key: header/footer lines dropped and all whitespace
#removed, so the key is exported as one single-line string
PUBKEY=$(openssl rsa -in /etc/xcat/privkey.pem -pubout 2>/dev/null | grep -v "PUBLIC KEY" | tr -d ' \t\n')
export PUBKEY

logger -s -t "$log_label" -p local4.info "Beginning node discovery process..."
#Print the NICs (loopback and usb excluded) whose `ip link` line lacks LOWER_UP.
#Names come out one per line with a leading blank, so use the result unquoted.
nics_without_link() {
    ip link | grep mtu | grep -v LOOPBACK | grep -v usb | grep -v ,LOWER_UP | awk -F: '{print $2}'
}

#bring up every NIC that does not report a link yet
for nic in $(nics_without_link); do
    ip link set "$nic" up
done

#poll every 0.1 second, at most 100 times (10 seconds), until every NIC has link.
#The list must be filled in before the loop, otherwise the loop never runs.
NICSTOBRINGUP=$(nics_without_link)
waitforlink=100
while [ -n "$NICSTOBRINGUP" ] && [ "$waitforlink" -gt 0 ]; do
    sleep 0.1
    waitforlink=$((waitforlink - 1))
    NICSTOBRINGUP=$(nics_without_link)
done
if [ -n "$NICSTOBRINGUP" ]; then
    #unquoted echo turns the one-per-line list into a single blank separated line
    logger -s -t "$log_label" -p local4.warning "No link detected on $(echo $NICSTOBRINGUP) after 10 seconds"
fi
#Succeeds when the given NIC has at least one IPv4 address.
nic_has_ipv4() {
    ip -4 -o a show dev "$1" | grep -q inet
}

#only NICs that report a link (LOWER_UP) are waited on; loopback and usb are skipped
NICSGETTINGADDR=$(ip link | grep mtu | grep -v LOOPBACK | grep -v usb | grep ,LOWER_UP | awk -F: '{print $2}')
#blank separated snapshot of the NICs we wait on, only used in the log message below
nicswaited=$(echo $NICSGETTINGADDR)
timewaiting=0
logger -s -t "$log_label" -p local4.info "Waiting for nics to get addresses"
#poll every 0.1 second, at most 700 cycles, until no NIC is left without address
while [ -n "$NICSGETTINGADDR" ] && [ "$timewaiting" != 700 ]; do
    NEWNICSGETTINGADDR=""
    for nic in $NICSGETTINGADDR; do
        if nic_has_ipv4 "$nic"; then
            #print "<nic>|<address>" (prefix length cut off) on stdout
            echo -n "$nic|"
            ip -4 -o addr show dev "$nic" | awk '{print $4}' | sed -e 'sX/.*XX'
        else
            NEWNICSGETTINGADDR="$NEWNICSGETTINGADDR $nic"
        fi
    done
    sleep 0.1
    timewaiting=$((timewaiting+1))
    NICSGETTINGADDR=$NEWNICSGETTINGADDR
done
if [ -n "$NICSGETTINGADDR" ]; then
    #timed out: name exactly the NICs that are still without address
    for nic in $NICSGETTINGADDR; do
        logger -s -t "$log_label" -p local4.warning "No DHCP answer for $nic, ignoring interface..."
    done
elif [ "$timewaiting" -gt 450 ]; then
    logger -s -t "$log_label" -p local4.warning "Obtained an IP address on $nicswaited but it took $timewaiting cycles, you may want to check the spanning tree configuration in the switch."
fi
logger -s -t "$log_label" -p local4.info "Network configuration complete, commencing transmit of discovery packets"

#the master comes from the xcatd=<host>[:<port>] argument in /proc/cmdline;
#every ':' is turned into a blank so that read can split host and port
read -r XCATMASTER XCATPORT < <(sed -n 's/.*xcatd=\([^ ]*\).*/\1/p' /proc/cmdline | tr ':' ' ')
#no port given (or no xcatd= argument at all): use 3001
XCATPORT=${XCATPORT:-3001}
export XCATPORT

#time to make our packet...
while [ ! -r /restart ]; do
|
|
|
|
#remember when this pass through the loop started (seconds since the epoch)
curtime=$(date +%s)

#the existence of "/processing" indicates that my findme request is under processing
if [ -f "/processing" ]; then
    if (( curtime <= reqtime + maxresptime )); then
        #still inside the response window: wait and look again on the next pass
        logger -s -t "$log_label" -p local4.info "My findme request is still under processing, do not send new request"
        sleep 5
    else
        #the response window is over: remove the marker so that the next pass sends a new findme request
        logger -s -t "$log_label" -p local4.info "seems the processing of my findme request cost more than $maxresptime, send new findme request"
        rm -rf /processing
    fi
    continue
fi
#identification values for the packet; "unknown" means "not detected".
#UUID and IAMAVM are reset here as well so that a platform matching neither
#branch below does not report an empty or stale value.
MTM=unknown
SERIAL=unknown
PLATFORM=unknown
UUID=unknown
IAMAVM=0
ARCH=$(uname -m) #32-bit only is old news

#awk program: take the last line matching `pat`, squeeze its whitespace and print
#what stands between the first and the second ':' without the leading blank
cpu_last_value_awk='$0 ~ pat { line = $0 }
END {
    gsub(/[ \t]+/, " ", line)
    sub(/^ /, "", line)
    sub(/ $/, "", line)
    split(line, part, ":")
    sub(/^ /, "", part[2])
    print part[2]
}'

if [ -r /sys/devices/virtual/dmi/id/product_name ]; then #x86
    PRODNAME=$(cat /sys/devices/virtual/dmi/id/product_name)
    if [ "$PRODNAME" = "KVM" ]; then
        IAMAVM=1
        MTM=KVM
    elif [ "$PRODNAME" = "VMware Virtual Platform" ]; then
        IAMAVM=1
        MTM=VMware
    else
        #first choice: the text between '[' and ']' of the DMI product name
        MTM=$(printf '%s\n' "$PRODNAME" | awk -F'[' '{print $2}' | awk -F']' '{print $1}')
        if [ -z "$MTM" ]; then
            #second choice: "<manufacturer>:<product name or part number>" from FRU 0
            if FRU=$(ipmitool fru print 0); then
                MTM=$(echo "$FRU" | awk -F': ' '/Product Manufacturer/ {m=$2} /Product Name|Product Part Number/ {if (n==""||n=="NONE") {n=$2}} END {print m":"n}')
            fi
            if [ -z "$MTM" ] || [ "$MTM" = ":" ]; then
                #last choice: "<sys_vendor>:<product_name>" from DMI
                logger -s -t "$log_label" -p local4.warning "Couldn't find MTM information in FRU, falling back to DMI (MTMS-based discovery may fail)"
                m=$(cat /sys/devices/virtual/dmi/id/sys_vendor)
                n=$PRODNAME
                MTM="$m:$n"
            fi
        fi
        SERIAL=$(cat /sys/devices/virtual/dmi/id/product_serial)
    fi
    CPUCOUNT=$(grep -c "model name" /proc/cpuinfo)
    CPUTYPE=$(awk -v pat='model name' "$cpu_last_value_awk" /proc/cpuinfo)
    #the bytes of the first three UUID fields are reversed
    UUID=$(sed -e 's/\(..\)\(..\)\(..\)\(..\)-\(..\)\(..\)-\(..\)\(..\)/\4\3\2\1-\6\5-\8\7/' /sys/devices/virtual/dmi/id/product_uuid)

elif [ -r /proc/device-tree/model ]; then #POWER
    #cat -vT shows the trailing NUL as "^@"; keep what follows the last ',' and trim it
    MTM=$(cat -vT /proc/device-tree/model | sed -e 's/^.*,//' -e 's/^[\t ]*//' -e 's/[\t ]*\^@//')
    CPUCOUNT=$(grep -c -e "^cpu\s*:" /proc/cpuinfo)
    PLATFORM=$(grep -e "^platform\s*:" /proc/cpuinfo | awk '{print $3}')
    CPUTYPE=$(awk -v pat='^cpu[ \t]*:' "$cpu_last_value_awk" /proc/cpuinfo)
    SERIAL=$(cat -vT /proc/device-tree/system-id | sed -e 's/^.*,//' -e 's/^[\t ]*//' -e 's/[\t ]*\^@//')
    # For POWER servers, the /proc/sys/kernel/random/uuid is changing for each query, so use mtms + mac of first up nic as the UUID
    UUID=unknown

fi
# The MEMORY will look like this: 32099MB (the MemTotal number of /proc/meminfo divided by 1024)
MEMORY=$(awk '/MemTotal/ {printf "%.0fMB\n", $2/1024}' /proc/meminfo)

# The DISKSIZE will look like this: sda:960GB,sdb:960GB,sdc:480GB,sdd:480GB (sorted by major,minor)
# Only /proc/partitions entries whose name does not end in a digit are reported.
DISKSIZE="$(grep -v name /proc/partitions | sort -g -k 1,2 | awk 'BEGIN{sep=""} /[^0-9]$/{printf("%s%s:%.0fGB", sep, $4, $3/1024^2) ; sep=","}')"
logger -s -t "$log_label" -p local4.info "Beginning echo information to discovery packet file..."

#start a new /tmp/discopacket; everything echoed inside the braces goes into it
{
    echo '<xcatrequest>'
    echo "<command>findme</command>"
    echo "<sequential>1</sequential>"
    echo "<arch>$ARCH</arch>"
    if [ "$IAMAVM" = 1 ]; then
        echo "<nodetype>virtual</nodetype>"
    fi
    echo "<cpucount>$CPUCOUNT</cpucount>"
    echo "<cputype>$CPUTYPE</cputype>"
    echo "<memory>$MEMORY</memory>"
    echo "<disksize>$DISKSIZE</disksize>"
    if [ "$UUID" != "unknown" ]; then
        echo "<uuid>$UUID</uuid>"
    fi

    #mtm and serial are left out when they are "unknown" or consist of zeros only
    flag_mtm=${MTM//0/}
    if [ -n "$flag_mtm" ] && [ "$MTM" != "unknown" ]; then
        #unquoted on purpose: echo also squeezes the whitespace; then the dots are removed
        MTM=$(echo $MTM | sed 's/\.//g')
        echo "<mtm>$MTM</mtm>"
    fi
    flag_serial=${SERIAL//0/}
    if [ -n "$flag_serial" ] && [ "$SERIAL" != "unknown" ]; then
        #unquoted on purpose, see mtm above
        SERIAL=$(echo $SERIAL | sed 's/\.//g')
        echo "<serial>$SERIAL</serial>"
    fi
    if [ "$PLATFORM" != "unknown" ]; then
        echo "<platform>$PLATFORM</platform>"
    fi
} > /tmp/discopacket
#channel number taken from the "Payload Channel" line of `ipmitool sol info`;
#error output of that command is ignored
LANCHAN=$(ipmitool sol info 2>/dev/null | awk '/Payload Channel/{print $4}')
#ask for the LAN settings once and reuse the answer below.
#$LANCHAN stays unquoted on purpose: when it is empty no channel argument is passed at all.
LANINFO=$(ipmitool lan print $LANCHAN)

#the BMC address is only reported when its address source is static
IsStatic=$(echo "$LANINFO" | grep 'IP Address Source' | grep 'Static')
if [ -n "$IsStatic" ]; then
    BMCIPADDR=$(echo "$LANINFO" | grep 'IP Address' | grep -v 'IP Address Source' | cut -d ":" -f2 | sed 's/ //')
    if [ -n "$BMCIPADDR" ]; then
        echo "<bmc>$BMCIPADDR</bmc>" >> /tmp/discopacket
    fi
fi

#fields 2-7 of the "MAC Address" line are the six bytes of the MAC
BMCMAC=$(echo "$LANINFO" | grep 'MAC Address' | cut -d ":" -f2-7 | sed 's/ //')
if [ -n "$BMCMAC" ]; then
    echo "<bmcmac>$BMCMAC</bmcmac>" >> /tmp/discopacket
fi

# Check whether the hardware support in-band BMC configuration with the IPMI device
if [ -r /dev/ipmi0 ] || [ -r /dev/ipmi/0 ] || [ -r /dev/ipmidev/0 ]; then
    echo "<bmcinband>1</bmcinband>" >> /tmp/discopacket
fi
#so we have some cases where DMI table explicitly records every function number, and some where only first function is enumerated
#so for each onboard device, we record it. If it is also the first function, we'll seek out other function numbers and append
#if that other function number does not show up in its own dmi type 41 record

#start from an empty list on every pass, otherwise the list grows each time the packet is rebuilt
obdevs=()
if [ -f "/usr/sbin/dmidecode" ]; then
    #read the type 41 records once; they are consulted again for every function found below
    dmi_onboard=$(dmidecode -t 41)
    #the bus address line following each "Type: Ethernet" line; the "--" lines
    #that grep -A1 puts between separate matches are not addresses and are dropped
    for onboard in $(echo "$dmi_onboard" | grep -E '(Type:|Bus Address)' | grep -A1 Ethernet | grep -v Ethernet | grep -v '^--$' | sed -e 's/.*Address: //'); do
        obdevs+=("$onboard")
        if [ "${onboard#*.}" = 0 ]; then
            #function 0: look for further functions of the same device among the network devices
            truncslot=${onboard%.*}
            for obslot in $(grep -F "$truncslot" /sys/class/net/*/device/uevent | sed -e 's/.*=//'); do
                if ! echo "$dmi_onboard" | grep -q -F "$obslot"; then
                    obdevs+=("$obslot")
                fi
            done
        fi
    done
fi
MAC_OF_FIRST_UP_NIC=unknown
#TODO: downed nics, also examine /sys/bus/pci/*/ for more network class devices that might not have driver support
#one <mac> line and one <nic> element is written for every ethernet device whose `ip link` line contains UP (usb0 excluded)
for dev in $(ip link | grep -B1 ether | grep UP | awk '{print $2}' | sed -e 's/://' | grep -v usb0); do
    #per device values: clear all of them so that nothing is inherited from the previous device
    FIRMDESC=""
    ONBOARDINDEX=""
    SLOTNAME=""
    DRIVER=$(grep DRIVER "/sys/class/net/$dev/device/uevent" | awk -F= '{print $2}')
    PCI_SLOT=$(grep PCI_SLOT_NAME "/sys/class/net/$dev/device/uevent" | awk -F= '{print $2}')
    ADDRESS=$(ip -4 -o a show dev "$dev" | awk '/global/{print $4}')
    MAC=$(ip link show dev "$dev" | grep ether | awk '{print $2}' | tr a-f A-F)
    if [ "$MAC_OF_FIRST_UP_NIC" = "unknown" ]; then
        #kept without the colons
        MAC_OF_FIRST_UP_NIC=$(echo "$MAC" | sed -e 's/://g')
    fi

    if [[ -n "$PCI_SLOT" && -f "/usr/sbin/dmidecode" ]]; then
        #designation of the DMI type 9 (slot) record that carries this PCI address
        SLOTNAME=$(dmidecode -t 9 | grep -E '(Designation|Address)' | grep -B1 "$PCI_SLOT" | grep Designation | sed -e 's/.*Designation:[ ]*//')
        if [ -z "$SLOTNAME" ]; then #check for on board device
            #the onboard index is the 1-based position of the PCI address in obdevs
            index=1
            for s in "${obdevs[@]}"; do
                if [ "$s" = "$PCI_SLOT" ]; then
                    ONBOARDINDEX=$index
                    break
                fi
                index=$((index+1))
            done
            if [ -n "$ONBOARDINDEX" ]; then
                FIRMDESC=$(dmidecode -t 41 | grep -E '(Designation|Address)' | grep -B 1 "$PCI_SLOT" | grep Designation | sed -e 's/.*: //')
                if [ -z "$FIRMDESC" ]; then
                    #no record for this function: retry with the address without the function number
                    SHORTPCISLOT=${PCI_SLOT%.*}
                    FIRMDESC=$(dmidecode -t 41 | grep -E '(Designation|Address)' | grep -B 1 "$SHORTPCISLOT" | grep Designation | sed -e 's/.*: //')
                fi
                SLOTNAME="Onboard Ethernet $ONBOARDINDEX"
            fi
        fi
    fi

    #everything echoed inside the braces is appended to the packet
    {
        echo "<mac>$DRIVER|$dev|$MAC|$ADDRESS</mac>"
        echo "<nic>"
        echo " <devname>$dev</devname>"
        echo " <driver>$DRIVER</driver>"
        if [ -n "$ADDRESS" ]; then
            echo " <ip4address>$ADDRESS</ip4address>"
        fi
        echo " <hwaddr>$MAC</hwaddr>"
        if [ -n "$PCI_SLOT" ]; then
            echo " <pcidev>$PCI_SLOT</pcidev>"
        fi
        if [ -n "$SLOTNAME" ]; then
            echo " <location>$SLOTNAME</location>"
        fi
        if [ -n "$ONBOARDINDEX" ]; then
            echo " <onboardeth>$ONBOARDINDEX</onboardeth>"
        fi
        if [ -n "$FIRMDESC" ]; then
            echo " <firmdesc>$FIRMDESC</firmdesc>"
        fi

        #switch information from lldptool; an answer of
        #"Agent instance for device not found" is treated like no answer
        myswitch=$(lldptool -n -i "$dev" -t -V sysName | grep -v 'System Name TLV' | sed -e 's/^ *//')
        if [ -n "$myswitch" ] && [ "$myswitch" != "Agent instance for device not found" ]; then
            echo " <switchname>$myswitch</switchname>"
        fi
        #only lines containing "IP" get here, so no check for the "not found" answer is needed
        for switchaddr in $(lldptool -i "$dev" -n -t -V mngAddr | grep IP | sed -e 's/.*:.//'); do
            echo " <switchaddr>$switchaddr</switchaddr>"
        done
        myswitchdesc=$(lldptool -n -i "$dev" -t -V sysDesc | grep -v 'System Description TLV' | sed -e 's/^ *//')
        if [ -n "$myswitchdesc" ] && [ "$myswitchdesc" != "Agent instance for device not found" ]; then
            echo " <switchdesc>$myswitchdesc</switchdesc>"
        fi
        myport=$(lldptool -n -i "$dev" -t -V portDesc | grep -v 'Port Description TLV' | sed -e 's/^ *//')
        if [ -n "$myport" ] && [ "$myport" != "Agent instance for device not found" ]; then
            echo " <switchport>$myport</switchport>"
        fi

        echo "</nic>"
    } >> /tmp/discopacket
done
#no UUID was found above: build one from mtm, serial and the MAC of the first up nic, in lower case
if [ "$UUID" == "unknown" ]; then
    #unquoted on purpose: echo squeezes the whitespace inside the values
    UUID=$(echo $MTM-$SERIAL-$MAC_OF_FIRST_UP_NIC | tr A-Z a-z)
    echo "<uuid>$UUID</uuid>" >> /tmp/discopacket
fi

#close the request; the sha512sig element stays empty until the signature exists
{
    echo "<xcatpubkey>$PUBKEY</xcatpubkey>" #this is not secure to use by itself, switch sourced pubkey for security
    echo "<sha512sig>"
    echo "</sha512sig>"
    echo "</xcatrequest>"
} >> /tmp/discopacket

#sign the packet as it is now (empty sha512sig element) and base64 encode the signature
openssl dgst -sha512 -out /tmp/discopacket.sha512 -sign /etc/xcat/privkey.pem /tmp/discopacket
openssl enc -e -a -in /tmp/discopacket.sha512 > /tmp/discopacket.b64sig

#copy the packet line by line and put the signature right in front of </sha512sig>.
#read without -r and the unquoted echo are kept on purpose: they strip and squeeze
#the whitespace of every line, and the packet that is sent has always had that form.
while read line; do
    if [ "$line" = "</sha512sig>" ]; then
        cat /tmp/discopacket.b64sig
    fi
    echo $line
done < /tmp/discopacket >> /tmp/discopacket.new
mv /tmp/discopacket.new /tmp/discopacket
logger -s -t "$log_label" -p local4.info "Discovery packet file is ready."

#gzip replaces /tmp/discopacket with /tmp/discopacket.gz; the old archive has to go first
rm -f /tmp/discopacket.gz
gzip -9 /tmp/discopacket
#first target: the master taken from the kernel command line, when there is one
if [ -n "$XCATMASTER" ]; then
    logger -s -t "$log_label" -p local4.info "Sending the discovery packet to xCAT ($XCATMASTER:$XCATPORT)..."
    cat /tmp/discopacket.gz | udpcat.awk "$XCATMASTER" "$XCATPORT" &
fi

#further targets: the servers found on the dhcp-server lines of the dhclient lease file
#NOTE(review): this takes the 4th blank separated field of those lines - confirm that
#this is where the address sits in the lease file written on genesis
#NOTE(review): "sed -s" looks like it was meant to be "sed -e" - confirm
for dhcps in $(grep dhcp-server /var/lib/dhclient/dhclient.leases | awk '{print $4}' | sed -s 's/;//'); do
    logger -s -t "$log_label" -p local4.info "Sending the discovery packet to xCAT ($dhcps:$XCATPORT)..."
    cat /tmp/discopacket.gz | udpcat.awk "$dhcps" "$XCATPORT" &
done

#record the time when the "findme request is sent to master"
reqtime=$(date +%s)
#cat /tmp/discopacket
logger -s -t "$log_label" -p local4.info "Sleeping 5 seconds..."
sleep 5
done
|
|
#the discovery loop has ended because /restart became readable: hand over to /bin/restart
logger -s -t "$log_label" -p local4.info "Restart network interfaces..."
/bin/restart