#!/usr/bin/env perl # IBM(c) 2007 EPL license http://www.eclipse.org/legal/epl-v10.html package xCAT_monitoring::rmcmon; BEGIN { $::XCATROOT = $ENV{'XCATROOT'} ? $ENV{'XCATROOT'} : '/opt/xcat'; } use lib "$::XCATROOT/lib/perl"; use xCAT::NodeRange; use Sys::Hostname; use Socket; use xCAT::Utils; use xCAT::GlobalDef; #print "xCAT_monitoring::rmcmon loaded\n"; 1; #------------------------------------------------------------------------------- =head1 xCAT_monitoring:rmcmon =head2 Package Description xCAT monitoring plugin package to handle RMC monitoring. =cut #------------------------------------------------------------------------------- #-------------------------------------------------------------------------------- =head3 start This function gets called by the monitorctrl module when xcatd starts. It starts the daemons and does necessary startup process for the RMC monitoring. It also queries the RMC for its currently monitored nodes which will, in tern, compared with the nodes in the input parameter. It asks RMC to add or delete nodes according to the comparison so that the nodes monitored by RMC are in sync with the nodes currently in the xCAT cluster. Arguments: monservers --A hash reference keyed by the monitoring server nodes and each value is a ref to an array of [nodes, nodetype, status] arrays monitored by the server. So the format is: {monserver1=>[['node1', 'osi', 'active'], ['node2', 'switch', 'booting']...], ...} Returns: (return code, message) =cut #-------------------------------------------------------------------------------- sub start { print "rmcmon::start called\n"; $noderef=shift; if ($noderef =~ /xCAT_monitoring::rmcmon/) { $noderef=shift; } #TODO: get a list of monservers + nodes and compare them with RMC. remove/add # if necessary. #assume the server is the current node. #check if rsct is installed and running if (! -e "/usr/bin/lsrsrc") { return (1, "RSCT is not is not installed.\n"); } my $result=`/usr/bin/lssrc -s ctrmc`; if ($result !~ /active/) { #restart rmc daemon $result=`startsrc -s ctrmc`; if ($?) { return (1, "rmc deamon cannot be started\n"); } } #get a list of managed nodes $result=`/usr/bin/lsrsrc-api -s IBM.MngNode::::Name`; chomp($result); my @rmc_nodes=split(/\n/, $result); foreach (keys(%$noderef)) { my $server=$_; my $mon_nodes=$noderef->{$_}; foreach(@$mon_nodes) { my $node_pair=$_; my $node=$node_pair->[0]; my $nodetype=$node_pair->[1]; } } #TODO: start condition-response assosciations return (0, "started"); } #-------------------------------------------------------------------------------- =head3 stop This function gets called by the monitorctrl module when xcatd stops. It stops the monitoring on all nodes, stops the daemons and does necessary cleanup process for the RMC monitoring. Arguments: none Returns: (return code, message) =cut #-------------------------------------------------------------------------------- sub stop { print "rmcmon::stop called\n"; #TODO: stop condition-response associtations. return (0, "stopped"); } #-------------------------------------------------------------------------------- =head3 supportNodeStatusMon This function is called by the monitorctrl module to check if RMC can help monitoring and returning the node status. Arguments: none Returns: 1 =cut #-------------------------------------------------------------------------------- sub supportNodeStatusMon { print "rmcmon::supportNodeStatusMon called\n"; return 1; } #-------------------------------------------------------------------------------- =head3 startNodeStatusMon This function is called by the monitorctrl module to tell RMC to start monitoring the node status and feed them back to xCAT. RMC will start setting up the condition/response to monitor the node status changes. Arguments: monservers --A hash reference keyed by the monitoring server nodes and each value is a ref to an array of [nodes, nodetype, status] arrays monitored by the server. So the format is: {monserver1=>[['node1', 'osi', 'active'], ['node2', 'switch', 'booting']...], ...} Returns: (return code, message) =cut #-------------------------------------------------------------------------------- sub startNodeStatusMon { print "rmcmon::startNodeStatusMon called\n"; return (0, "started"); } #-------------------------------------------------------------------------------- =head3 stopNodeStatusMon This function is called by the monitorctrl module to tell RMC to stop feeding the node status info back to xCAT. It will stop the condition/response that is monitoring the node status. Arguments: none Returns: (return code, message) =cut #-------------------------------------------------------------------------------- sub stopNodeStatusMon { print "rmcmon::stopNodeStatusMon called\n"; return (0, "stopped"); } #-------------------------------------------------------------------------------- =head3 addNodes This function gdds the nodes into the RMC cluster. Arguments: nodes --nodes to be added. It is a hash reference keyed by the monitoring server nodes and each value is a ref to an array of [nodes, nodetype, status] arrays monitored by the server. So the format is: {monserver1=>[['node1', 'osi', 'active'], ['node2', 'switch', 'booting']...], ...} verbose -- verbose mode. 1 for yes, 0 for no. Returns: none =cut #-------------------------------------------------------------------------------- sub addNodes { $noderef=shift; if ($noderef =~ /xCAT_monitoring::rmcmon/) { $noderef=shift; } my $VERBOSE=shift; #if ($VERBOSE) { print "rmcmon::addNodes called $noderef=$noderef\n"}; my $ms_host_name=hostname(); chomp($ms_host_name); foreach (keys(%$noderef)) { my $server=$_; #if ($VERBOSE) { print " monitoring server: $server\n";} if ($server ne $ms_host_name) { next; #only handle the nodes which has this node as the monitor server } #check if rsct is installed and running if (! -e "/usr/bin/lsrsrc") { print "RSCT is not installed.\n"; return 1; } my $result=`/usr/bin/lssrc -s ctrmc`; if ($result !~ /active/) { #restart rmc daemon $result=`startsrc -s ctrmc`; if ($?) { print "rmc deamon cannot be started\n"; return 1; } } #enable remote client connection `/usr/bin/rmcctrl -p`; #ms node id, hostname, ip defs my $ms_node_id; my $ms_name,$ms_aliases,$ms_addrtype,$ms_length,@ms_addrs; my $ms_ipaddresses; #if ($VERBOSE) { # print " ms_host_name=$ms_host_name, ms_nam=$ms_name, ms_aliases=$ms_aliases, ms_ip_addr=$ms_ipaddresses, ms_node_id=$ms_node_id\n"; #} my $mon_nodes=$noderef->{$_}; my $first_time=1; foreach(@$mon_nodes) { my $node_pair=$_; my $node=$node_pair->[0]; my $nodetype=$node_pair->[1]; if ((!$nodetype) || ($nodetype =~ /$::NODETYPE_OSI/)) { #RMC deals only with osi type. empty type is treated as osi type #check if the node has already defined $result=`lsrsrc-api -s IBM.MngNode::"Name=\\\"\"$node\\\"\"" 2>&1`; if ($? == 0) { #resource has already defined next; } #TODO: check all nodes at the same time or use the 'status' value in the node `fping -a $node 2> /dev/null`; if ($?) { print "Cannot add the node $node into the RMC domian. The node is inactive.\n"; next; } if ($first_time) { $first_time=0; #enable remote client connection `/usr/bin/rmcctrl -p`; #get ms node id, hostname, ip etc $ms_node_id=`head -n 1 /var/ct/cfg/ct_node_id`; chomp($ms_node_id); ($ms_name,$ms_aliases,$ms_addrtype,$ms_length,@ms_addrs) = gethostbyname($ms_host_name); chomp($ms_name); $ms_ipaddresses="{"; foreach (@ms_addrs) { $ms_ipaddresses .= '"' .inet_ntoa($_) . '",'; } chop($ms_ipaddresses); $ms_ipaddresses .= "}"; } #get info for the node $mn_node_id=`psh $node "head -n 1 /var/ct/cfg/ct_node_id" 2>&1`; $mn_node_id =~ s/.*([0-9 a-g]{16}).*/$1/s; my ($mn_name,$mn_aliases,$mn_addrtype,$mn_length,@mn_addrs) = gethostbyname($node); chomp($mn_name); my $mn_ipaddresses="{"; foreach (@mn_addrs) { $mn_ipaddresses .= '"'.inet_ntoa($_) . '",'; } chop($mn_ipaddresses); $mn_ipaddresses .= "}"; #if ($VERBOSE) { # print " mn_name=$mn_name, mn_aliases=$mn_aliases, mn_ipaddr=$mn_ipaddresses, mn_node_id=$mn_node_id\n"; #} # define resource in IBM.MngNode class on server $result=`mkrsrc-api IBM.MngNode::Name::"$node"::KeyToken::"$node"::IPAddresses::"$mn_ipaddresses"::NodeID::0x$mn_node_id 2>&1`; if ($?) { print "define resource in IBM.MngNode class result=$result\n"; } #copy the configuration script and run it locally $result=`scp $::XCATROOT/sbin/rmcmon/configrmcnode $node:/tmp 2>&1`; if ($?) { print "rmcmon:addNodes: cannot copy the file configrmcnode to node $node\n"; next; } $result=`psh $node /tmp/configrmcnode -a $node $ms_host_name $ms_ipaddresses 0x$ms_node_id 2>&1`; if ($?) { print "$result\n"; } } } } return 0; } #-------------------------------------------------------------------------------- =head3 removeNodes This function removes the nodes from the RMC cluster. Arguments: nodes --nodes to be removed. It is a hash reference keyed by the monitoring server nodes and each value is a ref to an array of [nodes, nodetype, status] arrays monitored by the server. So the format is: {monserver1=>[['node1', 'osi', 'active'], ['node2', 'switch', 'booting']...], ...} verbose -- verbose mode. 1 for yes, 0 for no. Returns: none =cut #-------------------------------------------------------------------------------- sub removeNodes { $noderef=shift; if ($noderef =~ /xCAT_monitoring::rmcmon/) { $noderef=shift; } my $VERBOSE=shift; #if ($VERBOSE) { print "rmcmon::removeNodes called\n"}; my $local_host_name=hostname(); chomp($local_host_name); foreach (keys(%$noderef)) { $server=$_; #print " monitoring server: $server local_host_name=$local_host_name\n"; #only handle the nodes which has this node as the monitor server if ($server ne $local_host_name) {next; } my $mon_nodes=$noderef->{$_}; foreach(@$mon_nodes) { my $node_pair=$_; my $node=$node_pair->[0]; my $nodetype=$node_pair->[1]; if ((!$nodetype) || ($nodetype =~ /$::NODETYPE_OSI/)) { #RMC deals only with osi type. empty type is treated as osi type #remove resource in IBM.MngNode class on server my $result=`rmrsrc-api -s IBM.MngNode::"Name=\\\"\"$node\\\"\"" 2>&1`; if ($?) { print "remove resource in IBM.MngNode class result=$result\n"; } if ($result =~ m/2612-023/) { #resource not found next; } # TODO: check all the nodes together or use the 'status' value #if the node is inactive, forget it `fping -a $node 2> /dev/null`; if ($?) { next; } #copy the configuration script and run it locally $result=`scp $::XCATROOT/sbin/rmcmon/configrmcnode $node:/tmp 2>&1 `; if ($?) { print "rmcmon:removeNodes: cannot copy the file configrmcnode to node $node\n"; next; } $result=`psh --nonodecheck $node /tmp/configrmcnode -d $node 2>&1`; if ($?) { print "$result\n"; } } } } return 0; }