git-svn-id: https://svn.code.sf.net/p/xcat/code/xcat-core/trunk@10816 8638fb3e-16cb-4fca-ae20-7b5d299a9bcd
		
			
				
	
	
		
			1791 lines
		
	
	
		
			56 KiB
		
	
	
	
		
			Perl
		
	
	
	
	
	
			
		
		
	
	
			1791 lines
		
	
	
		
			56 KiB
		
	
	
	
		
			Perl
		
	
	
	
	
	
| #!/usr/bin/env perl
 | |
| # IBM(c) 2007 EPL license http://www.eclipse.org/legal/epl-v10.html
 | |
| package xCAT_monitoring::rmcmon;
 | |
| BEGIN
 | |
| {
 | |
|   $::XCATROOT = $ENV{'XCATROOT'} ? $ENV{'XCATROOT'} : '/opt/xcat';
 | |
| }
 | |
| use lib "$::XCATROOT/lib/perl";
 | |
| use strict;
 | |
| use xCAT::NodeRange;
 | |
| use Sys::Hostname;
 | |
| use Socket;
 | |
| use xCAT::Utils;
 | |
| use xCAT::InstUtils;
 | |
| use xCAT::GlobalDef;
 | |
| use xCAT_monitoring::monitorctrl;
 | |
| use xCAT_monitoring::rmcmetrix;
 | |
| use xCAT::MsgUtils;
 | |
| use xCAT::DBobjUtils;
 | |
| #print "xCAT_monitoring::rmcmon loaded\n";
 | |
| 1;
 | |
| 
 | |
| 
 | |
| #TODO: script to define sensors on the nodes.
 | |
| #TODO: how to push the sensor scripts to nodes?
 | |
| #TODO: monitoring HMC with old RSCT and new RSCT
 | |
| 
 | |
| #-------------------------------------------------------------------------------
 | |
| =head1  xCAT_monitoring:rmcmon  
 | |
| =head2    Package Description
 | |
|   xCAT monitoring plugin package to handle RMC monitoring.
 | |
| =cut
 | |
| #-------------------------------------------------------------------------------
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    start
 | |
|       This function gets called by the monitorctrl module
 | |
|       when xcatd starts and when monstart command is issued by the user. 
 | |
|       It starts the daemons and does necessary startup process for the RMC monitoring.
 | |
|       It also queries the RMC for its currently monitored
 | |
|       nodes which will, in tern, compared with the nodes
 | |
|       in the input parameter. It asks RMC to add or delete
 | |
|       nodes according to the comparison so that the nodes
 | |
|       monitored by RMC are in sync with the nodes currently
 | |
|       in the xCAT cluster.
 | |
|        p_nodes -- a pointer to an arrays of nodes to be monitored. null means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means both localhost and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|       (return code, message) 
 | |
|       if the callback is set, use callback to display the status and error. 
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub start {
 | |
|   print "rmcmon::start called\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
| 
 | |
|   my $localhostname=hostname();
 | |
|     
 | |
|   #assume the server is the current node.
 | |
|   #check if rsct is installed and running
 | |
|   if (! -e "/usr/bin/lsrsrc") {
 | |
|     if ($callback) {
 | |
|       my $rsp={};
 | |
|       $rsp->{data}->[0]="$localhostname: RSCT is not installed.";
 | |
|       $callback->($rsp);
 | |
|     }
 | |
|     return (1, "RSCT is not installed.\n");
 | |
|   }
 | |
| 
 | |
|   my $result;
 | |
|   chomp(my $pid= `/bin/ps -ef | /bin/grep rmcd | /bin/grep -v grep | /bin/awk '{print \$2}'`);
 | |
|   unless($pid){
 | |
|     #restart rmc daemon
 | |
|     $result=`startsrc -s ctrmc`;
 | |
|     if ($?) {
 | |
|       if ($callback) {
 | |
|         my $rsp={};
 | |
|         $rsp->{data}->[0]="$localhostname: RMC deamon cannot be started.";
 | |
|         $callback->($rsp);
 | |
|       }
 | |
|       return (1, "RMC deamon cannot be started\n");
 | |
|     }
 | |
|     `startsrc -s  IBM.MgmtDomainRM`;
 | |
|   }
 | |
| 
 | |
|   #restore the association
 | |
|   if ($callback) { #this is the case when monstart is called, not the xcatd starts
 | |
|     #get all the current 
 | |
|     my %assocHash=();
 | |
|     my $result=`LANG=C /usr/bin/lscondresp -x -D:_:  2>&1`;
 | |
|     if ($?==0) {
 | |
|       chomp($result); 
 | |
|       my @tmp=split('\n', $result);
 | |
|       foreach my $line (@tmp) {
 | |
| 	my @tmp1=split(':_:', $line);
 | |
|         if (@tmp1 < 4) { next; }
 | |
|         my $cond=$tmp1[0];
 | |
|         my $resp=$tmp1[1];
 | |
|         if ($tmp1[3] =~ /Not|not/) { $assocHash{"$cond:_:$resp"}=0; } 
 | |
|         else {$assocHash{"$cond:_:$resp"}=1;}
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     #start the associations that are saved in /var/log/rmcmon
 | |
|     my $isSV=xCAT::Utils->isServiceNode();
 | |
|     my $fname="/var/log/rmcmon";
 | |
|     if (! -f "$fname") { 
 | |
|       if ($isSV) { $fname="$::XCATROOT/lib/perl/xCAT_monitoring/rmc/pred_assoc_sn"; }
 | |
|       else { $fname="$::XCATROOT/lib/perl/xCAT_monitoring/rmc/pred_assoc_mn"; }
 | |
|     }
 | |
|     if (-f "$fname") {
 | |
|       if (open(FILE, "<$fname")) {
 | |
|         while (readline(FILE)) {
 | |
|           chomp($_); 
 | |
| 	  my @tmp1=split(':_:', $_);
 | |
|           if (@tmp1 < 4) { next; }
 | |
|           my $cond=$tmp1[0];
 | |
|           my $resp=$tmp1[1];
 | |
|           if ($tmp1[3] !~ /Not|not/) { #active
 | |
| 	    if ((!exists($assocHash{"$cond:_:$resp"})) || ($assocHash{"$cond:_:$resp"}==0)) {
 | |
| 	      $result=`/usr/bin/startcondresp $cond $resp 2>&1`;
 | |
|               if (($?) && ($result !~ /2618-244|2618-008/)) { #started
 | |
|                 my $rsp={};
 | |
|                 $rsp->{data}->[0]="$localhostname: $result";
 | |
|                 $callback->($rsp);
 | |
| 	      }
 | |
| 	    }
 | |
| 	  } else { #inactive
 | |
| 	    if (!exists($assocHash{"$cond:_:$resp"})) { 
 | |
|               $result=`/usr/bin/mkcondresp $cond $resp  2>&1`; 
 | |
|               if (($?) && ($result !~ /2618-201|2618-008/)) { #resource already defined
 | |
|                 my $rsp={};
 | |
|                 $rsp->{data}->[0]="$localhostname: $result";
 | |
|                 $callback->($rsp);
 | |
| 	      }
 | |
|             } elsif ($assocHash{"$cond:_:$resp"}==1) { 
 | |
|               $result=`/usr/bin/stopcondresp $cond $resp  2>&1`;
 | |
|               if (($?) && ($result !~ /2618-264/)) { #stoped
 | |
|                 my $rsp={};
 | |
|                 $rsp->{data}->[0]="$localhostname: $result";
 | |
|                 $callback->($rsp);
 | |
| 	      }
 | |
|             }
 | |
| 	  }
 | |
|         }
 | |
|         close(FILE);
 | |
|       } 
 | |
|     } 
 | |
|   } #if ($callback)
 | |
|   my $montype = 'event';
 | |
|   my $entry = undef;
 | |
|   my $conftable =  xCAT::Table->new('monsetting');
 | |
|   $entry = $conftable->getAttribs({'name'=>'rmcmon','key'=>'montype'}, 'value');
 | |
|   if($entry){
 | |
| 	  $montype = $entry->{value};
 | |
|   }
 | |
|   $conftable->close;
 | |
| 
 | |
|   my @metrixconf = xCAT_monitoring::rmcmetrix::get_metrix_conf();
 | |
|   if($montype =~ /perf/){
 | |
|     while(@metrixconf){
 | |
|       my ($rsrc, $rname, $attrlist, $minute);
 | |
|       $rsrc  = shift @metrixconf;
 | |
|       $rname = shift @metrixconf;
 | |
|       $attrlist = shift @metrixconf;
 | |
|       $minute = shift @metrixconf;
 | |
|       xCAT::Utils->runcmd("$::XCATROOT/sbin/rmcmon/rmcmetrixmon init $rsrc $rname $attrlist $minute", 0);
 | |
|     }
 | |
|   }
 | |
|   if(xCAT::Utils->isServiceNode()){
 | |
|     xCAT::Utils->runcmd("$::XCATROOT/sbin/rmcmon/rmcmetrixmon init rrdserver", 0);
 | |
|   }
 | |
|   if ($scope) {
 | |
|     #get a list of managed nodes
 | |
|     $result=`/usr/bin/lsrsrc-api -s IBM.MngNode::::Name 2>&1`;  
 | |
|     if ($?) {
 | |
|       if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
|         reportError( $result, $callback); 
 | |
|         return (1,$result);
 | |
|       }
 | |
|       $result='';
 | |
|     }
 | |
|     chomp($result);
 | |
|     my @rmc_nodes=split(/\n/, $result);
 | |
|     
 | |
|     #start the rmc daemons for its children
 | |
|     if (@rmc_nodes > 0) {
 | |
|       my $nodestring=join(',', @rmc_nodes);
 | |
|       $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $nodestring startsrc -s ctrmc 2>&1`;
 | |
|       if (($result) && ($result !~ /0513-029/)) { #0513-029 multiple instance not supported.
 | |
|         reportError( $result, $callback); 
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   if ($callback) {
 | |
|     my $rsp={};
 | |
|     $rsp->{data}->[0]="$localhostname: done.";
 | |
|     $callback->($rsp);
 | |
|   }
 | |
| 
 | |
|   return (0, "started");
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    pingNodeStatus
 | |
|       This function takes an array of nodes and returns their status using fping.
 | |
|     Arguments:
 | |
|        nodes-- an array of nodes.
 | |
|     Returns:
 | |
|        a hash that has the node status. The format is: 
 | |
|           {alive=>[node1, node3,...], unreachable=>[node4, node2...]}
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub pingNodeStatus {
 | |
|   my ($class, @mon_nodes)=@_;
 | |
|   my %status=();
 | |
|   my @active_nodes=();
 | |
|   my @inactive_nodes=();
 | |
|   if ((@mon_nodes)&& (@mon_nodes > 0)) {
 | |
|     #get all the active nodes
 | |
|     my $nodes= join(' ', @mon_nodes);
 | |
|     my $temp=`fping -a $nodes 2> /dev/null`;
 | |
|     chomp($temp);
 | |
|     @active_nodes=split(/\n/, $temp);
 | |
| 
 | |
|     #get all the inactive nodes by substracting the active nodes from all.
 | |
|     my %temp2;
 | |
|     if ((@active_nodes) && ( @active_nodes > 0)) {
 | |
|       foreach(@active_nodes) { $temp2{$_}=1};
 | |
|         foreach(@mon_nodes) {
 | |
|           if (!$temp2{$_}) { push(@inactive_nodes, $_);}
 | |
|         }
 | |
|     }
 | |
|     else {@inactive_nodes=@mon_nodes;}     
 | |
|   }
 | |
| 
 | |
|   $status{$::STATUS_ACTIVE}=\@active_nodes;
 | |
|   $status{$::STATUS_INACTIVE}=\@inactive_nodes;
 | |
|  
 | |
|   return %status;
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    stop
 | |
|       This function gets called when monstop command is issued by the user. 
 | |
|       It stops the monitoring on all nodes, stops the RMC daemons.
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes to be stoped for monitoring. null means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means both monservers and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|       (return code, message) 
 | |
|       if the callback is set, use callback to display the status and error. 
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub stop {
 | |
|   print "rmcmon::stop called\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
| 
 | |
|   my $localhostname=hostname();
 | |
| 
 | |
|   
 | |
|   xCAT::Utils->runcmd("$::XCATROOT/sbin/rmcmon/rmcmetrixmon clean", 0);
 | |
|   if(xCAT::Utils->isServiceNode()){
 | |
|     xCAT::Utils->runcmd("$::XCATROOT/sbin/rmcmon/rmcmetrixmon clean rrdserver", 0);
 | |
|   } 
 | |
|   my $result;
 | |
|   chomp(my $pid= `/bin/ps -ef | /bin/grep rmcd | /bin/grep -v grep | /bin/awk '{print \$2}'`);
 | |
|   if ($pid){
 | |
|     #save all the association in to /var/log/rmcmon
 | |
|     `rm -f /var/log/rmcmon`;
 | |
|     my $result=`LANG=C /usr/bin/lscondresp -x -D:_:  2>&1`;
 | |
|     if ($?==0) {
 | |
|       if (open(FILE, ">/var/log/rmcmon")) {
 | |
|         print FILE $result;
 | |
|         close(FILE);
 | |
|       }
 | |
| 
 | |
|       #stop condition-response associtations
 | |
|       chomp($result); 
 | |
|       my @tmp=split('\n', $result);
 | |
|       foreach my $line (@tmp) {
 | |
| 	my @tmp1=split(':_:', $line);
 | |
|         if (@tmp1 < 4) { next; }
 | |
|         if ($tmp1[3] !~ /Not|not/) {
 | |
| 	  my $result=`/usr/bin/stopcondresp $tmp1[0] $tmp1[1]  2>&1`;
 | |
|           if (($?) && ($result !~ /2618-264/)) { #stoped
 | |
| 	    if ($callback) {
 | |
|               my $rsp={};
 | |
|               $rsp->{data}->[0]="$localhostname: $result";
 | |
|               $callback->($rsp);
 | |
| 	    }
 | |
| 	  }
 | |
|         }
 | |
|       } #foreach
 | |
|     } # if ($pid)
 | |
|   
 | |
|     #restop the rmc daemon
 | |
|     #$result=`stopsrc -s ctrmc`;
 | |
|     #if ($?) {
 | |
|     #  if ($callback) {
 | |
|     #    my $rsp={};
 | |
|     #    $rsp->{data}->[0]="$localhostname: RMC deamon cannot be stopped.";
 | |
|     #    $callback->($rsp);
 | |
|     #  }
 | |
|     #  return (1, "RMC deamon cannot be stopped\n");
 | |
|     #}
 | |
|   }
 | |
| 
 | |
|   if ($scope) {
 | |
|     my $pPairHash=xCAT_monitoring::monitorctrl->getMonServer($noderef);
 | |
|     if (ref($pPairHash) eq 'ARRAY') {
 | |
| 	reportError($pPairHash->[1], $callback);
 | |
| 	return (1, "");	
 | |
|     }
 | |
| 
 | |
|  
 | |
|     #the identification of this node
 | |
|     my @hostinfo=xCAT::Utils->determinehostname();
 | |
|     my $isSV=xCAT::Utils->isServiceNode();
 | |
| 
 | |
|     my %iphash=();
 | |
|     foreach(@hostinfo) {$iphash{$_}=1;}
 | |
|     if (!$isSV) { $iphash{'noservicenode'}=1;}
 | |
| 
 | |
|     foreach my $key (keys (%$pPairHash)) {
 | |
|       my @key_a=split(':', $key);
 | |
|       if (! $iphash{$key_a[0]}) { next;}  
 | |
|       my $mon_nodes=$pPairHash->{$key};
 | |
|       
 | |
|       #figure out what nodes to stop
 | |
|       my @nodes_to_stop=();
 | |
|       if ($mon_nodes) {
 | |
|         foreach(@$mon_nodes) {
 | |
|           my $node=$_->[0];
 | |
|           my $nodetype=$_->[1];
 | |
|           if (($nodetype) && ($nodetype =~ /$::NODETYPE_OSI/)) { 
 | |
| 	    push(@nodes_to_stop, $node);
 | |
|           }  
 | |
|         }     
 | |
|       }
 | |
| 
 | |
|       if (@nodes_to_stop > 0) {
 | |
|         my $nodestring=join(',', @nodes_to_stop);
 | |
|         $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $nodestring "/bin/ps -ef | /bin/grep rmcd | /bin/grep -v grep | /bin/awk '{if (\\\$2>0) system(\\\"stopsrc -s ctrmc\\\")}' 2>&1"`;
 | |
| 
 | |
|         if (($result) && ($result !~ /0513-044/)){ #0513-0544 is normal value
 | |
| 	  reportError($result, $callback);
 | |
|         }
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   return (0, "stopped");
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    config
 | |
|       This function configures the cluster for the given nodes.  
 | |
|       This function is called when moncfg command is issued or when xcatd starts
 | |
|       on the service node. It will configure the cluster to include the given nodes within
 | |
|       the monitoring doamin. 
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes to be added for monitoring. none means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means localhost and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|        (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub config {
 | |
|   #print "rmcmon:config called\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
| 
 | |
|   my $localhostname=hostname();
 | |
|     
 | |
|   #assume the server is the current node.
 | |
|   #check if rsct is installed and running
 | |
|   if (! -e "/usr/bin/lsrsrc") {
 | |
|     if ($callback) {
 | |
|       my $rsp={};
 | |
|       $rsp->{data}->[0]="$localhostname: RSCT is not installed.";
 | |
|       $callback->($rsp);
 | |
|     }
 | |
|     return (1, "RSCT is not installed.\n");
 | |
|   }
 | |
| 
 | |
|   my $result;
 | |
|   chomp(my $pid= `/bin/ps -ef | /bin/grep rmcd | /bin/grep -v grep | /bin/awk '{print \$2}'`);
 | |
|   unless($pid){
 | |
|     #restart rmc daemon
 | |
|     $result=`startsrc -s ctrmc`;
 | |
|     if ($?) {
 | |
|      if ($callback) {
 | |
|        my $rsp={};
 | |
|        $rsp->{data}->[0]="$localhostname: RMC deamon cannot be started.";
 | |
|        $callback->($rsp);
 | |
|      }
 | |
|      return (1, "RMC deamon cannot be started\n");
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   #enable remote client connection
 | |
|   `/usr/bin/rmcctrl -p`;
 | |
|   
 | |
|  
 | |
|   #the identification of this node
 | |
|   my @hostinfo=xCAT::Utils->determinehostname();
 | |
|   my $isSV=xCAT::Utils->isServiceNode();
 | |
|   my %iphash=();
 | |
|   foreach(@hostinfo) {$iphash{$_}=1;}
 | |
|   if (!$isSV) { $iphash{'noservicenode'}=1;}
 | |
| 
 | |
|   #create conditions/responses/sensors on the service node or mn
 | |
|   my $result=`/usr/sbin/rsct/install/bin/ctversion`;
 | |
|   my $rsct_ver;
 | |
|   if (!$?) {
 | |
|       chomp($result);
 | |
|       my @tempa=split(/ /, $result); 
 | |
|       if (@tempa>1) {
 | |
|           $rsct_ver=$tempa[1]; 
 | |
|       }
 | |
|   }
 | |
|   my $version_string;
 | |
|   if ($rsct_ver) {$version_string="RSCT_VER=$rsct_ver"; } 
 | |
| 
 | |
|   my $result;
 | |
|   if ($isSV) {
 | |
|       $result=`$version_string $::XCATROOT/sbin/rmcmon/mkrmcresources $::XCATROOT/lib/perl/xCAT_monitoring/rmc/resources/sn 2>&1`;  } else  {
 | |
| 	  $result=`$version_string $::XCATROOT/sbin/rmcmon/mkrmcresources $::XCATROOT/lib/perl/xCAT_monitoring/rmc/resources/mn 2>&1`;
 | |
|   }      
 | |
|   if ($?) {
 | |
|     my $error= "Error when creating predefined resources on $localhostname:\n$result";
 | |
|     reportError($error, $callback);
 | |
|   }
 | |
|   if(!$isSV){
 | |
|     xCAT::Utils->runcmd("chtab key='rmetrics_IBM.Host' monsetting.name=rmcmon monsetting.value='PctTotalTimeIdle,PctTotalTimeWait,PctTotalTimeUser,PctTotalTimeKernel,PctRealMemFree:1'", 0);
 | |
|     xCAT::Utils->runcmd("chtab key='rmetrics_IBM.EthernetDevice' monsetting.name=rmcmon monsetting.value='RecByteRate,RecPacketRate,XmitByteRate,XmitPacketRate:1'", 0);
 | |
|   }
 | |
| 
 | |
|   my $pPairHash=xCAT_monitoring::monitorctrl->getMonServer($noderef);
 | |
|   if (ref($pPairHash) eq 'ARRAY') {
 | |
|       reportError($pPairHash->[1], $callback);
 | |
|       return (1, "");	
 | |
|   }
 | |
| 
 | |
|   foreach my $key (keys (%$pPairHash)) {
 | |
|     my @key_a=split(':', $key);
 | |
|     if (! $iphash{$key_a[0]}) { next;} 
 | |
|     my $mon_nodes=$pPairHash->{$key};
 | |
| 
 | |
|     my $master=$key_a[1];
 | |
| 
 | |
|     #figure out what nodes to add
 | |
|     my @nodes_to_add=();
 | |
|     my @hmc_nodes=();
 | |
|     if ($mon_nodes) {
 | |
|       foreach(@$mon_nodes) {
 | |
|         my $node=$_->[0];
 | |
|         my $nodetype=$_->[1];
 | |
|         if ($nodetype){ 
 | |
| 	  if ($nodetype =~ /$::NODETYPE_OSI/) { push(@nodes_to_add, $node); }
 | |
| 	  elsif (xCAT::DBobjUtils->getnodetype($node) =~ /$::NODETYPE_HMC/) { push(@hmc_nodes, $node); }
 | |
|         } 
 | |
|       }     
 | |
|     }
 | |
| 
 | |
|     #add new nodes to the RMC cluster
 | |
|     if (@nodes_to_add> 0) {
 | |
|       addNodes(\@nodes_to_add, $master, $scope, $callback, 0);
 | |
|     }
 | |
| 
 | |
|     #add new HMC nodes to the RMC cluster
 | |
|     if (@hmc_nodes > 0) {
 | |
|       addNodes(\@hmc_nodes, $master, $scope, $callback, 1);
 | |
|     }
 | |
|   }
 | |
| 
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    deconfig
 | |
|       This function de-configures the cluster for the given nodes.  
 | |
|       This function is called when mondecfg command is issued by the user. 
 | |
|       It should remove the given nodes from the product for monitoring.
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes to be removed for monitoring. none means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means local host only. 
 | |
|                 2 means both local host and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|        (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub deconfig {
 | |
|   print "rmcmon:deconfig called\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
|   my $localhostname=hostname();
 | |
|   my $pPairHash=xCAT_monitoring::monitorctrl->getMonServer($noderef);
 | |
|   if (ref($pPairHash) eq 'ARRAY') {
 | |
|       reportError($pPairHash->[1], $callback);
 | |
|       return (1, "");	
 | |
|   }
 | |
|  
 | |
|   #the identification of this node
 | |
|   my @hostinfo=xCAT::Utils->determinehostname();
 | |
|   my $isSV=xCAT::Utils->isServiceNode();
 | |
|   my %iphash=();
 | |
|   foreach(@hostinfo) {$iphash{$_}=1;}
 | |
|   if (!$isSV) { $iphash{'noservicenode'}=1;}
 | |
|   if(!$isSV){
 | |
|     xCAT::Utils->runcmd("chtab -d key='rmetrics_IBM.Host' monsetting", 0);
 | |
|     xCAT::Utils->runcmd("chtab -d key='rmetrics_IBM.EthernetDevice' monsetting", 0);
 | |
|   }
 | |
| 
 | |
|   foreach my $key (keys (%$pPairHash)) {
 | |
|     my @key_a=split(':', $key);
 | |
|     if (! $iphash{$key_a[0]}) { next;}  
 | |
|     my $mon_nodes=$pPairHash->{$key};
 | |
| 
 | |
|     my $master=$key_a[1];
 | |
| 
 | |
|     #figure out what nodes to remove
 | |
|     my @nodes_to_rm=();
 | |
|     my @hmc_nodes=();
 | |
|     if ($mon_nodes) {
 | |
|       foreach(@$mon_nodes) {
 | |
|         my $node=$_->[0];
 | |
|         my $nodetype=$_->[1];
 | |
|         if ($nodetype) {
 | |
|           if ($nodetype =~ /$::NODETYPE_OSI/) { push(@nodes_to_rm, $node);}
 | |
| 	  elsif (xCAT::DBobjUtils->getnodetype($node) =~ /$::NODETYPE_HMC/) { push(@hmc_nodes, $node); }
 | |
|         }  
 | |
|       }     
 | |
|     }
 | |
| 
 | |
|     #remove nodes from the RMC cluster
 | |
|     if (@nodes_to_rm > 0) {
 | |
|       removeNodes(\@nodes_to_rm, $master, $scope, $callback, 0);
 | |
|     }
 | |
| 
 | |
|     #remove HMC nodes from the RMC cluster
 | |
|     if (@hmc_nodes > 0) {
 | |
|       removeNodes(\@hmc_nodes, $master, $scope, $callback, 1);
 | |
|     }
 | |
|   } 
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    supportNodeStatusMon
 | |
|     This function is called by the monitorctrl module to check
 | |
|     if RMC can help monitoring and returning the node status.
 | |
|     
 | |
|     Arguments:
 | |
|         none
 | |
|     Returns:
 | |
|          1  
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub supportNodeStatusMon {
 | |
|   #print "rmcmon::supportNodeStatusMon called\n";
 | |
|   return 1;
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3   startNodeStatusMon
 | |
|     This function is called by the monitorctrl module to tell
 | |
|     RMC to start monitoring the node status and feed them back
 | |
|     to xCAT. RMC will start setting up the condition/response 
 | |
|     to monitor the node status changes.  
 | |
| 
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes for monitoring. none means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means local host only. 
 | |
|                 2 means both local host and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|        (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub startNodeStatusMon {
 | |
|   print "rmcmon::startNodeStatusMon\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
| 
 | |
|   my $localhostname=hostname();
 | |
|   my $retcode=0;
 | |
|   my $retmsg="";
 | |
| 
 | |
| 
 | |
|   my $isSV=xCAT::Utils->isServiceNode();
 | |
| 
 | |
|   #get all the nodes status from IBM.MngNode class of local host and 
 | |
|   #the identification of this node
 | |
|   my $pPairHash=xCAT_monitoring::monitorctrl->getMonServer($noderef);
 | |
|   if (ref($pPairHash) eq 'ARRAY') {
 | |
|       reportError($pPairHash->[1], $callback);
 | |
|       return (1, "");	
 | |
|   }
 | |
| 
 | |
|   my @hostinfo=xCAT::Utils->determinehostname();
 | |
|   my %iphash=();
 | |
|   foreach(@hostinfo) {$iphash{$_}=1;}
 | |
|   if (!$isSV) { $iphash{'noservicenode'}=1;}
 | |
| 
 | |
|   my @servicenodes=();
 | |
|   my %status_hash=();
 | |
|   foreach my $key (keys (%$pPairHash)) {
 | |
|     my @key_a=split(':', $key);
 | |
|     if (! $iphash{$key_a[0]}) { next;}
 | |
|     my $mon_nodes=$pPairHash->{$key};
 | |
| 
 | |
|     foreach my $nn(@$mon_nodes) {
 | |
|       my $nodetype=$nn->[1];
 | |
|       if ($nodetype) {
 | |
| 	if (($nodetype =~ /$::NODETYPE_OSI/)|| (xCAT::DBobjUtils->getnodetype($nn->[0]) =~ /$::NODETYPE_HMC/)) {
 | |
|           $status_hash{$nn->[0]}=$nn->[2];
 | |
|         }
 | |
|       }  
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   #get nodestatus from RMC and update the xCAT DB
 | |
|   ($retcode, $retmsg) = saveRMCNodeStatusToxCAT(\%status_hash);
 | |
|   if ($retcode != 0) {
 | |
|     reportError($retmsg, $callback);
 | |
|   }
 | |
| 
 | |
|  #get rsct version
 | |
|   my $result=`/usr/sbin/rsct/install/bin/ctversion`;
 | |
|   my $rsct_ver="0.0.0";
 | |
|   if (!$?) {
 | |
|       chomp($result);
 | |
|       my @tempa=split(/ /, $result); 
 | |
|       if (@tempa>1) {
 | |
|           $rsct_ver=$tempa[1]; 
 | |
|       }
 | |
|   }
 | |
|  
 | |
|   #get setting from the monsetting table
 | |
|   my $batch=0;
 | |
|   if (xCAT::Utils->CheckVersion($rsct_ver, "2.3.5.0") >= 0) {
 | |
|     my %settings=xCAT_monitoring::monitorctrl->getPluginSettings("rmcmon");
 | |
| 
 | |
|     my $batch_string=$settings{'nodeusebatch'};
 | |
|     if ($batch_string  =~ /1|Yes|yes|YES|Y|y/ ) { $batch=1;}   
 | |
|   }
 | |
| 
 | |
|   if ($batch) {
 | |
|       my $result=`startcondresp NodeReachability_B UpdatexCATNodeStatus_B 2>&1`;
 | |
|       if (($?) && ($result !~ /2618-244|2618-008/)) { #started
 | |
| 	  $retcode=$?;
 | |
| 	  $retmsg="Error start node status monitoring: $result";
 | |
| 	  reportError($retmsg, $callback);
 | |
|       }
 | |
|   } else {
 | |
|     if (!$isSV) {
 | |
| 	#start monitoring the status of mn's immediate children
 | |
| 	my $result=`startcondresp NodeReachability UpdatexCATNodeStatus 2>&1`;
 | |
| 	if (($?) && ($result !~ /2618-244|2618-008/)) { #started
 | |
| 	    $retcode=$?;
 | |
| 	    $retmsg="Error start node status monitoring: $result";
 | |
| 	    reportError($retmsg, $callback);
 | |
| 	}
 | |
| 	
 | |
| 	#start monitoring the status of mn's grandchildren via their service nodes
 | |
| 	$result=`startcondresp NodeReachability_H UpdatexCATNodeStatus 2>&1`;
 | |
| 	if (($?) && ($result !~ /2618-244|2618-008/)) { #started
 | |
| 	    $retcode=$?;
 | |
| 	    $retmsg="Error start node status monitoring: $result";
 | |
| 	    reportError($retmsg, $callback);
 | |
| 	}
 | |
|     }
 | |
|   }
 | |
|   return ($retcode, $retmsg);
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3   saveRMCNodeStatusToxCAT
 | |
|     This function gets RMC node status and save them to xCAT database
 | |
| 
 | |
|     Arguments:
 | |
|         $oldstatus a pointer to a hash table that has the current node status
 | |
|         $node  the name of the service node to run RMC command from. If null, get from local host. 
 | |
|     Returns:
 | |
|         (return code, message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub saveRMCNodeStatusToxCAT {
 | |
|   #print "rmcmon::saveRMCNodeStatusToxCAT called\n";
 | |
|   my $retcode=0;
 | |
|   my $retmsg="";
 | |
|   my $statusref=shift;
 | |
|   if ($statusref =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $statusref=shift;
 | |
|   }
 | |
|   my $node=shift;
 | |
| 
 | |
|   my %status_hash=%$statusref;
 | |
| 
 | |
|   #get all the node status from mn's children
 | |
|   my $result;
 | |
|   my @active_nodes=();
 | |
|   my @inactive_nodes=();
 | |
|   if ($node) {
 | |
|     $result=`CT_MANAGEMENT_SCOPE=4 LANG=C /usr/bin/lsrsrc-api -o IBM.MngNode::::$node::Name::Status 2>&1`;
 | |
|   } else {
 | |
|     $result=`CT_MANAGEMENT_SCOPE=1 LANG=C /usr/bin/lsrsrc-api -s IBM.MngNode::::Name::Status 2>&1`;
 | |
|   }
 | |
| 
 | |
|   
 | |
|   if ($result) {
 | |
|     my @lines=split('\n', $result);
 | |
|     #only save the ones that needs to change
 | |
|     foreach (@lines) {
 | |
| 	my @pairs=split('::', $_);
 | |
|         if ($pairs[0] eq "ERROR") {
 | |
| 	  $retmsg .= "$_\n";
 | |
|         }
 | |
|         else {
 | |
|           if ($pairs[1]==1) { 
 | |
|             if ($status_hash{$pairs[0]} ne $::STATUS_ACTIVE) { push @active_nodes,$pairs[0];} 
 | |
|           }
 | |
|           else { 
 | |
|             if ($status_hash{$pairs[0]} ne $::STATUS_INACTIVE) { push @inactive_nodes, $pairs[0];}
 | |
|           }
 | |
|         }   
 | |
|       } 
 | |
|   }
 | |
|   
 | |
| 
 | |
|   my %new_node_status=();
 | |
|   if (@active_nodes>0) {
 | |
|     $new_node_status{$::STATUS_ACTIVE}=\@active_nodes;
 | |
|   } 
 | |
|   if (@inactive_nodes>0) {
 | |
|     $new_node_status{$::STATUS_INACTIVE}=\@inactive_nodes;
 | |
|   }
 | |
|   #only set the node status for the changed ones
 | |
|   if (keys(%new_node_status) > 0) {
 | |
|     xCAT_monitoring::monitorctrl::setNodeStatusAttributes(\%new_node_status);
 | |
|   }  
 | |
| 
 | |
|   if ($retmsg) {$retcode=1;}
 | |
|   else {$retmsg="started";}
 | |
|  
 | |
|   return ($retcode, $retmsg);
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3   stopNodeStatusMon
 | |
|     This function is called by the monitorctrl module to tell
 | |
|     RMC to stop feeding the node status info back to xCAT. It will
 | |
|     stop the condition/response that is monitoring the node status.
 | |
| 
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes for monitoring. none means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means local host only. 
 | |
|                 2 means both local host and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|         (return code, message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub stopNodeStatusMon {
 | |
|   print "rmcmon::stopNodeStatusMon called\n";
 | |
|   my $noderef=shift;
 | |
|   if ($noderef =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $noderef=shift;
 | |
|   }
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
| 
 | |
|   my $retcode=0;
 | |
|   my $retmsg="";
 | |
| 
 | |
|   my $isSV=xCAT::Utils->isServiceNode();
 | |
|   my $localhostname=hostname();
 | |
|  
 | |
|  #get rsct version
 | |
|   my $result=`/usr/sbin/rsct/install/bin/ctversion`;
 | |
|   my $rsct_ver="0.0.0";
 | |
|   if (!$?) {
 | |
|       chomp($result);
 | |
|       my @tempa=split(/ /, $result); 
 | |
|       if (@tempa>1) {
 | |
|           $rsct_ver=$tempa[1]; 
 | |
|       }
 | |
|   }
 | |
|  
 | |
|   #get setting from the monsetting table
 | |
|   my $batch=0;
 | |
|   if (xCAT::Utils->CheckVersion($rsct_ver, "2.3.5.0") >= 0) {
 | |
|     my %settings=xCAT_monitoring::monitorctrl->getPluginSettings("rmcmon");
 | |
| 
 | |
|     my $batch_string=$settings{'nodeusebatch'};
 | |
|     if ($batch_string  =~ /1|Yes|yes|YES|Y|y/ ) { $batch=1;}   
 | |
|   }
 | |
|   if ($batch) {
 | |
|       my $result=`stopcondresp NodeReachability_Batch UpdatexCATNodeStatus_Batch 2>&1`;
 | |
|       if (($?) && ($result !~ /2618-264/)) { #stoped
 | |
| 	  $retcode=$?;
 | |
| 	  $retmsg="Error stop node status monitoring: $result";
 | |
| 	  reportError($retmsg, $callback);
 | |
|       }
 | |
|       
 | |
|   } else {
 | |
|       if ($isSV) { return  ($retcode, $retmsg); }
 | |
| 
 | |
|       #stop monitoring the status of mn's immediate children
 | |
|       my $result=`stopcondresp NodeReachability UpdatexCATNodeStatus 2>&1`;
 | |
|       if (($?) && ($result !~ /2618-264/)) { #stoped
 | |
| 	  $retcode=$?;
 | |
| 	  $retmsg="Error stop node status monitoring: $result";
 | |
| 	  reportError($retmsg, $callback);
 | |
|       }
 | |
|       #stop monitoring the status of mn's grandchildren via their service nodes
 | |
|       $result=`stopcondresp NodeReachability_H UpdatexCATNodeStatus 2>&1`;
 | |
|       if (($?) && ($result !~ /2618-264/)) { #stoped
 | |
| 	  $retcode=$?;
 | |
| 	  $retmsg="Error stop node status monitoring: $result";
 | |
| 	  reportError($retmsg, $callback);
 | |
|       }
 | |
|   }
 | |
| 
 | |
|   return ($retcode, $retmsg);
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3   getNodeID
 | |
|     This function gets the nodeif for the given node.
 | |
| 
 | |
|     Arguments:
 | |
|         node
 | |
|     Returns:
 | |
|         node id for the given node
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getNodeID {
 | |
|   my $node=shift;
 | |
|   if ($node =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $node=shift;
 | |
|   }
 | |
|   my $tab=xCAT::Table->new("mac", -create =>0);
 | |
|   my $tmp=$tab->getNodeAttribs($node, ['mac']);
 | |
|   if (defined($tmp) && ($tmp)) {
 | |
|     my $mac=$tmp->{mac};
 | |
|     $mac =~ s/\|.*//g; #use the first mac
 | |
|     $mac =~ s/\!.*//g; #remove the hostname
 | |
|     $mac =~ s/://g;    #remove :
 | |
|     $mac = "EA" . $mac . "EA";
 | |
|     $tab->close();
 | |
|     return $mac;  
 | |
|   }
 | |
|   $tab->close();
 | |
|   return undef;
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3   getLocalNodeID
 | |
|     This function goes to RMC and gets the nodeid for the local host.
 | |
| 
 | |
|     Arguments:
 | |
|         node
 | |
|     Returns:
 | |
|         node id for the local host.
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getLocalNodeID {
 | |
|   my $node_id=`/usr/sbin/rsct/bin/lsnodeid`;
 | |
|   if ($?==0) {
 | |
|     chomp($node_id);
 | |
|     return $node_id;
 | |
|   } else {
 | |
|     return undef;
 | |
|   }
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    getNodeInfo
 | |
|       This function gets the nodeid, node ip addresses for the given node 
 | |
|     Arguments:
 | |
|        node
 | |
|        flag --- if 0 means normal nodes, if 1 means HMC.  
 | |
|     Returns:
 | |
|        (nodeid, nodeip) if error, nodeid=-1 and nodeip is the error message
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getNodeInfo 
 | |
| {
 | |
|   my $node=shift;
 | |
|   my $flag=shift;
 | |
| 
 | |
|   my @hostinfo=xCAT::Utils->determinehostname();
 | |
|   my %iphash=();
 | |
|   foreach(@hostinfo) {$iphash{$_}=1;}
 | |
| 
 | |
|   my $node_id;
 | |
|   if($iphash{$node}) {
 | |
|     $node_id=getLocalNodeID();
 | |
|   } else { 
 | |
|     if ($flag) { 
 | |
|       my $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot lsnodeid`;
 | |
|       if ($?) {
 | |
| 	return (-1, $result);
 | |
|       } else {
 | |
| 	chomp($result);
 | |
|         my @a=split(' ', $result);
 | |
|         $node_id=$a[1];
 | |
|       }
 | |
|     }
 | |
|     else { $node_id=getNodeID($node);} 
 | |
|   }
 | |
| 
 | |
|   my ($name,$aliases,$addrtype,$length,@addrs) = gethostbyname($node);
 | |
|   chomp($name);
 | |
|   my $ipaddresses="{";
 | |
|   foreach (@addrs) { $ipaddresses .= '"'.inet_ntoa($_) . '",'; }
 | |
|   chop($ipaddresses);
 | |
|   $ipaddresses .= "}";
 | |
| 
 | |
|   return ($node_id, $ipaddresses);
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    reportError
 | |
|       This function writes the error message to the callback, otherwise to syslog. 
 | |
|     Arguments:
 | |
|        error
 | |
|        callback 
 | |
|     Returns:
 | |
|        none
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub reportError 
 | |
| {
 | |
|   my $error=shift;
 | |
|   my $callback=shift;
 | |
|   if ($callback) {
 | |
|     my $rsp={};
 | |
|     $rsp->{data}->[0]=$error;
 | |
|     $callback->($rsp);
 | |
|   } else { xCAT::MsgUtils->message('S', "[mon]: $error\n"); }
 | |
|   return;
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    addNodes
 | |
|       This function adds the nodes into the RMC cluster, it does not check the OSI type and
 | |
|       if the node has already defined. 
 | |
|     Arguments:
 | |
|        nodes --an array of nodes to be added. 
 | |
|        master -- the monitoring master of the node.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means localhost and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|        flag  -- 0 means normal node. 1 means HMC.
 | |
|     Returns:
 | |
|        (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub addNodes {
 | |
|   my $pmon_nodes=shift;
 | |
|   if ($pmon_nodes =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $pmon_nodes=shift;
 | |
|   }
 | |
| 
 | |
|   my @mon_nodes = @$pmon_nodes;
 | |
|   if (@mon_nodes==0) { return (0, "");}
 | |
| 
 | |
|   my $master=shift;
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
|   my $flag=shift;
 | |
|   print "rmcmon.addNodes mon_nodes=@mon_nodes, flag=$flag\n";
 | |
| 
 | |
|   my @hostinfo=xCAT::Utils->determinehostname();
 | |
|   my %iphash=();
 | |
|   foreach(@hostinfo) {$iphash{$_}=1;}
 | |
|   my $localhostname=hostname();
 | |
| 
 | |
|   #find in active nodes
 | |
|   my $inactive_nodes=[];
 | |
|   if ($scope) { 
 | |
|     my %nodes_status=xCAT_monitoring::rmcmon->pingNodeStatus(@mon_nodes); 
 | |
|     $inactive_nodes=$nodes_status{$::STATUS_INACTIVE};
 | |
|     #print "active nodes to add:@$active_nodes\ninactive nodes to add: @$inactive_nodes\n";
 | |
|     if (@$inactive_nodes>0) { 
 | |
|       my $error="The following nodes cannot be added to the RMC cluster because they are inactive:\n  @$inactive_nodes.";
 | |
|       reportError($error, $callback);
 | |
|     }
 | |
|   }
 | |
|   my %inactiveHash=();
 | |
|   foreach(@$inactive_nodes) { $inactiveHash{$_}=1;} 
 | |
| 
 | |
|   #get a list of managed nodes
 | |
|   my $result=`/usr/bin/lsrsrc-api -s IBM.MngNode::::Name 2>&1`;  
 | |
|   if ($?) {
 | |
|     if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
|       reportError($result, $callback);
 | |
|       return (1,$result);
 | |
|     }
 | |
|     $result='';
 | |
|   }
 | |
|   chomp($result);
 | |
|   my @rmc_nodes=split(/\n/, $result);
 | |
|   my %rmcHash=();
 | |
|   foreach (@rmc_nodes) { $rmcHash{$_}=1;}
 | |
| 
 | |
| 
 | |
|   my $ms_host_name=$localhostname;
 | |
|   my $ms_node_id;
 | |
|   my $mn_node_id;
 | |
|   my $ms_ipaddresses;
 | |
|   my $mn_ipaddresses;
 | |
|   my $result;
 | |
|   my $first_time=1;
 | |
|   my @normal_nodes=();
 | |
| 
 | |
|   foreach my $node(@mon_nodes) {
 | |
|     my $mn_node_id_found=0;
 | |
|     my $hmc_ssh_enabled=0;
 | |
|     #get mn info
 | |
|     if ($first_time) {
 | |
|       $first_time=0;
 | |
|       $ms_node_id=getLocalNodeID();
 | |
|       if ($ms_node_id == -1) {
 | |
|         reportError("Cannot get nodeid for $ms_host_name", $callback);
 | |
|         return (1, "Cannot get nodeid for $ms_host_name"); 
 | |
|       }
 | |
|      
 | |
|       $result= xCAT::Utils::toIP( $master );
 | |
|       if ( @$result[0] != 0 ) {
 | |
|         reportError("Cannot resolve $master", $callback);
 | |
|         return (1, "Cannot resolve $master"); 
 | |
|       }
 | |
|       $ms_ipaddresses="{" . @$result[1] . "}";
 | |
|     }
 | |
| 
 | |
|     if (!$rmcHash{$node}) {
 | |
|       #enable ssh for HMC
 | |
|       if ($flag) {
 | |
|         my $result=`XCATBYPASS=Y $::XCATROOT/bin/rspconfig $node sshcfg=enable 2>&1`;
 | |
|         if ($?) {
 | |
|           my $error= "$result";
 | |
|           reportError($error, $callback);
 | |
|           next;
 | |
|         }     
 | |
|         $hmc_ssh_enabled=1;
 | |
|       }
 | |
| 
 | |
|       #get info for the node
 | |
|       ($mn_node_id, $mn_ipaddresses)=getNodeInfo($node, $flag);
 | |
|       if ($mn_node_id == -1) {
 | |
|         reportError($mn_ipaddresses, $callback);
 | |
|         next; 
 | |
|       }
 | |
|       $mn_node_id_found=1;
 | |
| 
 | |
|       # define resource in IBM.MngNode class on server
 | |
|       $result=`mkrsrc-api IBM.MngNode::Name::"$node"::KeyToken::"$node"::IPAddresses::"$mn_ipaddresses"::NodeID::0x$mn_node_id 2>&1`;
 | |
|       if ($?) {
 | |
|         reportError("define resource in IBM.MngNode class result=$result.", $callback);
 | |
|         next; 
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     if ($inactiveHash{$node}) { next;}
 | |
| 
 | |
|     push(@normal_nodes, $node);
 | |
|     if ($scope==0) { next; }
 | |
| 
 | |
|     #copy the configuration script and run it locally
 | |
|     if($iphash{$node}) {
 | |
|       pop(@normal_nodes);
 | |
|       $result=`/usr/bin/mkrsrc-api IBM.MCP::MNName::"$node"::KeyToken::"$master"::IPAddresses::"$ms_ipaddresses"::NodeID::0x$ms_node_id`;      
 | |
|       if ($?) {
 | |
|         reportError($result, $callback);
 | |
|         next;
 | |
|       }
 | |
|     } else {
 | |
|       if ($flag) { #define MCP on HMC
 | |
|         pop(@normal_nodes);
 | |
| 	if (!$hmc_ssh_enabled) {
 | |
|           my $result=`XCATBYPASS=Y $::XCATROOT/bin/rspconfig $node sshcfg=enable 2>&1`;
 | |
|           if ($?) {
 | |
|             my $error= "$result";
 | |
|             reportError($error, $callback);
 | |
|             next;
 | |
|           }
 | |
|         }    
 | |
|         
 | |
| 	#print "hmccmd=XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot \"lsrsrc-api -s IBM.MCP::\\\"NodeID=0x$ms_node_id\\\" 2>&1\"\n";
 | |
|         $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot "lsrsrc-api -s IBM.MCP::\\\"NodeID=0x$ms_node_id\\\" 2>&1"`;
 | |
|         if ($?) {
 | |
|           if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
|             reportError($result, $callback);
 | |
|             next;
 | |
| 	  }  else {
 | |
|             #print "hmccmd2=XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot \"mkrsrc-api IBM.MCP::MNName::\\\"$node\\\"::KeyToken::\\\"$master\\\"::IPAddresses::\\\"$ms_ipaddresses\\\"::NodeID::0x$ms_node_id 2>&1\"\n";
 | |
|             reportError("Configuring $node", $callback); 
 | |
|             $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot "mkrsrc-api IBM.MCP::MNName::\\\"$node\\\"::KeyToken::\\\"$master\\\"::IPAddresses::\\\"$ms_ipaddresses\\\"::NodeID::0x$ms_node_id 2>&1"`;
 | |
|             if ($?) { reportError($result, $callback); }
 | |
| 	  }
 | |
|         }
 | |
| 
 | |
|         #check if hmc node added to management domain successfully
 | |
|         my $n = 6;
 | |
|         while($n > 0){
 | |
|            $result = `/usr/sbin/rsct/bin/rmcdomainstatus -s ctrmc | grep $node`;
 | |
|            if ($result =~ /\s$node\s/){
 | |
|                last;
 | |
|            } else {
 | |
|                sleep 10;
 | |
|                $n = $n - 1;
 | |
|            }
 | |
|         }
 | |
| 
 | |
|         #define AllServiceableEvents_B condition on the HMC
 | |
| 	$result=`CT_MANAGEMENT_SCOPE=3 /usr/bin/mkrsrc-api IBM.Condition::Name::"AllServiceableEvents_B"::ResourceClass::"IBM.Sensor"::EventExpression::"String=?\\\"LSSVCEVENTS_ALL%\\\""::SelectionString::"Name=\\\"CSMServiceableEventSensor\\\""::NodeNameList::{\\\"$node\\\"}::EventBatchingInterval::1::BatchedEventRetentionPeriod::72 2>&1`;
 | |
| 	if (($?) && ($result !~ /2618-201|2618-008|2636-050/)){ 
 | |
| 	    reportError($result, $callback); 
 | |
| 	}
 | |
| 	
 | |
|       }
 | |
|     }
 | |
|   } 
 | |
| 
 | |
|   #let updatenode command to handle the normal nodes as a bulk
 | |
|   if (@normal_nodes>0) {
 | |
|     my $nr=join(',',@normal_nodes);
 | |
|     my $install_root = xCAT::Utils->getInstallDir();
 | |
| 
 | |
|     #get the fanout value
 | |
|     my %settings=xCAT_monitoring::monitorctrl->getPluginSettings("rmcmon");
 | |
| 
 | |
|     my $fanout_string="";
 | |
|     my $fanout_value=$settings{'rfanout'};
 | |
|     if ($fanout_value) { $fanout_string="DSH_FANOUT=$fanout_value";}
 | |
| 
 | |
|     #for local mode, need to referesh the IBM.MCP class to initialize the hb
 | |
|     if ($scope==0) {
 | |
|       #$result=`XCATBYPASS=Y $fanout_string $::XCATROOT/bin/xdsh $nr /usr/bin/refrsrc-api -c IBM.MCP 2>&1"`;
 | |
|       if ($?) { reportError($result, $callback); }
 | |
|       return (0, "ok"); 
 | |
|     }
 | |
| 
 | |
|     #this is remore case
 | |
|     reportError("Configuring the following nodes. It may take a while.\n$nr", $callback);
 | |
|     my $cmd;
 | |
|     my %servernodes = %{xCAT::InstUtils->get_server_nodes($callback, \@normal_nodes)};
 | |
|     # it's possible that the nodes could have diff server names
 | |
|     # do all the nodes for a particular server at once
 | |
|     foreach my $snkey (keys %servernodes) {
 | |
| 	my $nr = join(',', @{$servernodes{$snkey}});
 | |
| 	my $cmd;
 | |
| 	if (xCAT::Utils->isLinux()) {
 | |
| 	    $cmd="XCATBYPASS=Y $fanout_string $::XCATROOT/bin/xdsh $nr -s -e $install_root/postscripts/xcatdsklspost 2 -m $snkey configrmcnode 2>&1";
 | |
| 	    print "$cmd\n";
 | |
| 	}
 | |
| 	else {
 | |
| 	    #use -c 2 here to tell xcataixpost that there is only one postscript, download only it. It applies to AIX only     
 | |
| 	    $cmd="XCATBYPASS=Y $fanout_string $::XCATROOT/bin/xdsh $nr -s -e $install_root/postscripts/xcataixpost -m $snkey -c 2 configrmcnode 2>&1";
 | |
| 	}
 | |
| 	if (! open (CMD, "$cmd |")) {
 | |
| 	    reportError("Cannot run command $cmd", $callback);
 | |
| 	} else {
 | |
| 	    while (<CMD>) {
 | |
| 		chomp;
 | |
| 		my $rsp={};
 | |
| 		$rsp->{data}->[0]="$_";
 | |
| 		$callback->($rsp);
 | |
| 	    }
 | |
| 	    close(CMD);
 | |
| 	}
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   return (0, "ok"); 
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    removeNodes
 | |
|       This function removes the nodes from the RMC cluster.
 | |
|     Arguments:
 | |
|       nodes --a pointer to a array of node names to be removed. 
 | |
|       master -- the master of the nodes.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means localhost and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|        flag  -- 0 means normal node. 1 means HMC.
 | |
|     Returns:
 | |
|       (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub removeNodes {
 | |
|   my $pmon_nodes=shift;
 | |
|   if ($pmon_nodes =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $pmon_nodes=shift;
 | |
|   }
 | |
|   my @mon_nodes = @$pmon_nodes;
 | |
|   if (@mon_nodes==0) { return (0, "");}
 | |
| 
 | |
|   my $master=shift;
 | |
|   my $scope=shift;
 | |
|   my $callback=shift;
 | |
|   my $flag=shift;
 | |
| 
 | |
|   print "rmcmon.removeNodes mon_nodes=@mon_nodes, flag=$flag\n";
 | |
| 
 | |
|   my $localhostname=hostname();
 | |
|   my $ms_host_name=$localhostname;
 | |
|   my $ms_node_id;
 | |
|   my $result;
 | |
|   my $first_time=1;
 | |
|   my @normal_nodes=();
 | |
|  
 | |
|   #find in active nodes
 | |
|   my $inactive_nodes=[];
 | |
|   if ($scope) { 
 | |
|     my %nodes_status=xCAT_monitoring::rmcmon->pingNodeStatus(@mon_nodes); 
 | |
|     $inactive_nodes=$nodes_status{$::STATUS_INACTIVE};
 | |
|     #print "active nodes to add:@$active_nodes\ninactive nodes to add: @$inactive_nodes\n";
 | |
|     if (@$inactive_nodes>0) { 
 | |
|       my $error="The following nodes cannot be removed from the RMC cluster because they are inactive:\n  @$inactive_nodes.";
 | |
|       reportError($error, $callback);
 | |
|     }
 | |
|   }
 | |
|   my %inactiveHash=();
 | |
|   foreach(@$inactive_nodes) { $inactiveHash{$_}=1;} 
 | |
| 
 | |
|   #get a list of managed nodes
 | |
|   my $result=`/usr/bin/lsrsrc-api -s IBM.MngNode::::Name 2>&1`;  
 | |
|   if ($?) {
 | |
|     if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
|       reportError($result, $callback);
 | |
|       return (1,$result);
 | |
|     }
 | |
|     $result='';
 | |
|   }
 | |
|   chomp($result);
 | |
|   my @rmc_nodes=split(/\n/, $result);
 | |
|   my %rmcHash=();
 | |
|   foreach (@rmc_nodes) { $rmcHash{$_}=1;}
 | |
| 
 | |
|   #print "rmcmon::removeNodes_noChecking get called with @mon_nodes\n";
 | |
| 
 | |
|   foreach my $node (@mon_nodes) {
 | |
|     if ($rmcHash{$node}) {
 | |
| 	my $result=0;
 | |
| 	if ($flag && $scope && (!$inactiveHash{$node})) {  #remove AllServiceableEvents_B condition for HMC
 | |
| 	    $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot "lsrsrc-api -s IBM.Condition::\\\"Name='AllServiceableEvents_B'\\\" 2>&1"`;
 | |
| 	    if ($?) {
 | |
| 		if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
| 		    reportError($result, $callback); 
 | |
| 		} 
 | |
| 	    }
 | |
| 	    $result=`/usr/bin/rmcondition -f AllServiceableEvents_B:$node 2>&1`;
 | |
| 	    if ($?) { reportError($result, $callback); }
 | |
| 	}
 | |
|     
 | |
| 
 | |
|       #remove resource in IBM.MngNode class on server
 | |
|       $result=`rmrsrc-api -s IBM.MngNode::"Name=\\\"\"$node\\\"\"" 2>&1`;
 | |
|       if ($?) {  
 | |
|         if ($result =~ m/2612-023/) { #resource not found
 | |
|          next;
 | |
|         }
 | |
|         reportError("Remove resource in IBM.MngNode class result=$result.", $callback);
 | |
|       }
 | |
|     }
 | |
| 
 | |
|     if ($scope==0) { next; }
 | |
|     if ($inactiveHash{$node}) { next;}
 | |
| 
 | |
|     if ($ms_host_name eq $node) {
 | |
|       $result= `/usr/bin/rmrsrc-api -s IBM.MCP::"MNName=\\\"\"$node\\\"\"" 2>&1`;
 | |
|       if ($?) { reportError($result, $callback); }
 | |
|     } else {
 | |
|       #get mn info
 | |
|       if ($first_time) {
 | |
|         $ms_node_id=getLocalNodeID();
 | |
|         if ($ms_node_id == -1) {
 | |
|           reportError("Cannot get nodeid for $ms_host_name", $callback);
 | |
|           return (1, "Cannot get nodeid for $ms_host_name"); 
 | |
|         }
 | |
|         $first_time=0;
 | |
|       }
 | |
| 
 | |
|       if ($flag) { #hmc nodes
 | |
| 	#remove the MCP
 | |
|         $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot "lsrsrc-api -s IBM.MCP::\\\"NodeID=0x$ms_node_id\\\" 2>&1"`;
 | |
|         if ($?) {
 | |
|           if ($result !~ /2612-023/) {#2612-023 no resources found error
 | |
|             reportError($result, $callback); 
 | |
| 	  } 
 | |
| 	  next;
 | |
|         }
 | |
|         $result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $node -l hscroot "rmrsrc-api -s IBM.MCP::\\\"NodeID=0x$ms_node_id\\\" 2>&1"`;
 | |
|         if ($?) { reportError($result, $callback); }
 | |
| 
 | |
|       } else { #normal nodes
 | |
|         push(@normal_nodes, $node);
 | |
|       }
 | |
|     }
 | |
|   }   
 | |
| 
 | |
|   #let updatenode command to handle the normal nodes as a bulk
 | |
|   if (@normal_nodes>0) {
 | |
|     my $nr=join(',',@normal_nodes); 
 | |
| 
 | |
|     my %settings=xCAT_monitoring::monitorctrl->getPluginSettings("rmcmon");
 | |
| 
 | |
|     my $fanout_string="";
 | |
|     my $fanout_value=$settings{'rfanout'};
 | |
|     if ($fanout_value) { $fanout_string="DSH_FANOUT=$fanout_value";}
 | |
| 
 | |
|     #copy the configuration script and run it locally
 | |
|     $result=`XCATBYPASS=Y $fanout_string $::XCATROOT/bin/xdcp $nr $::XCATROOT/sbin/rmcmon/configrmcnode /tmp 2>&1 `;
 | |
|     if ($?) {
 | |
|       reportError("$result", $callback);
 | |
|     }
 | |
| 
 | |
|     reportError("De-configuring the following nodes. It may take a while.\n$nr", $callback); 
 | |
|     my $cmd="XCATBYPASS=Y $fanout_string $::XCATROOT/bin/xdsh $nr -s MS_NODEID=$ms_node_id /tmp/configrmcnode -1 2>&1";
 | |
|     if (! open (CMD1, "$cmd |")) {
 | |
|       reportError("Cannot run command $cmd", $callback);
 | |
|     } else {
 | |
|       while (<CMD1>) {
 | |
| 	chomp;
 | |
|         my $rsp={};
 | |
|         $rsp->{data}->[0]="$_";
 | |
|         $callback->($rsp);
 | |
|       }
 | |
|       close(CMD1);
 | |
|     }
 | |
| 
 | |
|     #$result=`XCATBYPASS=Y $::XCATROOT/bin/xdsh $nr MS_NODEID=$ms_node_id /tmp/configrmcnode -1 2>&1`;
 | |
|     #if ($?) { reportError($result, $callback);  }
 | |
|   }    
 | |
| 
 | |
|   return (0, "ok");
 | |
| }
 | |
| 
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    processSettingChanges
 | |
|       This function gets called when the setting for this monitoring plugin 
 | |
|       has been changed in the monsetting table.
 | |
|     Arguments:
 | |
|        none.
 | |
|     Returns:
 | |
|         0 for successful.
 | |
|         non-0 for not successful.
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub processSettingChanges {
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    getDiscription
 | |
|       This function returns the detailed description of the plugin inluding the
 | |
|      valid values for its settings in the monsetting tabel. 
 | |
|      Arguments:
 | |
|         none
 | |
|     Returns:
 | |
|         The description.
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getDescription {
 | |
|   return 
 | |
| "  Description:
 | |
|     rmcmon uses IBM's Resource Monitoring and Control (RMC) component 
 | |
|     of Reliable Scalable Cluster Technology (RSCT) to monitor the 
 | |
|     xCAT cluster. RMC has built-in resources such as CPU, memory, 
 | |
|     process, network, file system etc for monitoring. RMC can also be 
 | |
|     used to provide node liveness status monitoring and performance monitoring for xCAT. 
 | |
|     RMC is good for threadhold monitoring. xCAT automatically sets up the 
 | |
|     monitoring domain for RMC during node deployment time. And if performance
 | |
|     monitoring is enabled, xCAT monitoring will collect and consolidate performance
 | |
|     data based on montype&rmetrics setting, and then store to RRD database. 
 | |
|   Settings:
 | |
|     rfanout -- indicating the fanout number for configuring or deconfiguring 
 | |
|         remote nodes.
 | |
|     nodeusebatch -- use RMC event batching function when doing node status monitoring.
 | |
|     montype -- indicating type of performance monitoring, the value could be 
 | |
|                \"event\" : event monitoring (default),
 | |
| 	       \"perf\" : performance monitoring,
 | |
|                \"event,perf\" or \"perf,event\" : both.
 | |
|     rmetrics -- defines resource class,resouce names, attributes and sample interval for 
 | |
|                 performance monitoring. 
 | |
| 		Syntax of key: rmetrics_resource class For example: rmetrics_IBM.Processor
 | |
| 		Syntax of value: [resource names]attribute names:sample interval
 | |
| 		The unit of sample interval is minute.
 | |
| 		For example:
 | |
| 		  [proc0,proc1]PctTimeIdle,PctTimeWait,PctTimeKernel,PctTimeUser:5
 | |
| 				  
 | |
| ";
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    getNodeConfData
 | |
|       This function gets a list of configuration data that is needed by setting up
 | |
|     node monitoring.  These data-value pairs will be used as environmental variables 
 | |
|     on the given node.
 | |
|     Arguments:
 | |
|         node  
 | |
|         pointer to a hash that will take the data.
 | |
|     Returns:
 | |
|         none
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getNodeConfData {
 | |
|   #check if rsct is installed or not
 | |
|   if (! -e "/usr/bin/lsrsrc") {
 | |
|     return;
 | |
|   }
 | |
| 
 | |
|   my $node=shift;
 | |
|   if ($node =~ /xCAT_monitoring::rmcmon/) {
 | |
|     $node=shift;
 | |
|   }
 | |
|   my $ref_ret=shift;
 | |
| 
 | |
|   #get node ids for RMC monitoring
 | |
|   my $nodeid=xCAT_monitoring::rmcmon->getNodeID($node);
 | |
|   if (defined($nodeid)) {
 | |
|     $ref_ret->{NODEID}=$nodeid;
 | |
|   }
 | |
|   my $ms_nodeid=xCAT_monitoring::rmcmon->getLocalNodeID();
 | |
|   if (defined($ms_nodeid)) {
 | |
|     $ref_ret->{MS_NODEID}=$ms_nodeid;
 | |
|   }
 | |
|   return;
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    getPostscripts
 | |
|       This function returns the postscripts needed for the nodes and for the servicd
 | |
|       nodes. 
 | |
|      Arguments:
 | |
|         none
 | |
|     Returns:
 | |
|      The the postscripts. It a pointer to an array with the node group names as the keys
 | |
|     and the comma separated poscript names as the value. For example:
 | |
|     {service=>"cmd1,cmd2", xcatdefaults=>"cmd3,cmd4"} where xcatdefults is a group
 | |
|     of all nodes including the service nodes.
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub getPostscripts {
 | |
|   my $ret={};
 | |
|   $ret->{xcatdefaults}="configrmcnode";
 | |
|   return $ret;
 | |
| }
 | |
| 
 | |
| sub showmetrix($rrddir, $attrs, $start_time, $end_time)
 | |
| {
 | |
| 	my($rrddir, $attrs, $start_time, $end_time) = @_;
 | |
| 	my $result = [];
 | |
| 	my $output = undef;
 | |
| 	my @files = ();
 | |
| 	my $file = undef;
 | |
| 	my @attrlist = split /,/,$attrs;
 | |
| 	my $attr = undef;
 | |
| 	my $line = undef;
 | |
| 	my @namelist = ();
 | |
| 	my @timelist = ();
 | |
| 	my %hash = {};
 | |
| 	my $name = undef;
 | |
| 	my $timestamp = undef;
 | |
| 	my $sum = undef;
 | |
| 	my $num = undef;
 | |
| 	my $remote = undef;
 | |
| 
 | |
| 	if($rrddir =~ /:/){
 | |
| 		($remote,$rrddir) = split /:/,$rrddir;
 | |
| 	}
 | |
| 	
 | |
| 	foreach $attr (@attrlist) {
 | |
| 		@namelist = ();
 | |
| 		@timelist = ();
 | |
| 		%hash = {};
 | |
| 		if($remote){
 | |
| 			$output = xCAT::Utils->runcmd("xdsh $remote 'ls -A /var/rrd/$rrddir/$attr*'", 0);
 | |
| 			if($::RUNCMD_RC != 0){
 | |
| 				return $result;
 | |
| 			}
 | |
| 			$output =~ s/(\S+): \/var\/rrd\//''/;
 | |
| 		} else {
 | |
| 			$output = xCAT::Utils->runcmd("ls -A $rrddir/$attr*", 0);
 | |
| 		}
 | |
| 		@files = split /\n/, $output;
 | |
| 		foreach $file (@files) {
 | |
| 			if($file =~ /$attr\.rrd$/){
 | |
| 				$name = "$attr";
 | |
| 			} elsif ($file =~ /${attr}_(\S+)\.rrd$/) {
 | |
| 				$name = $1;
 | |
| 			}
 | |
| 			push @namelist, $name;
 | |
| 			if($remote){
 | |
| 				$output = xCAT_monitoring::rrdutil::RRD_fetch($file, $start_time, $end_time, $remote);
 | |
| 			} else {
 | |
| 				$output = xCAT_monitoring::rrdutil::RRD_fetch($file, $start_time, $end_time);
 | |
| 			}
 | |
| 			$line = pop(@$output);
 | |
| 			if($line =~ /ERROR/){
 | |
| 				push @$result, $line;
 | |
| 				next;
 | |
| 			} else {
 | |
| 				push @$output, $line;
 | |
| 			}
 | |
| 			foreach $line (@$output){
 | |
| 				if($line =~ /[NaNQ|nan]/){
 | |
| 					next;
 | |
| 				} elsif ($line =~ /^(\d+): (\S+) (\S+)/){
 | |
| 					$timestamp = $1;
 | |
| 					$sum = $2;
 | |
| 					$num = $3;
 | |
| 					if(! grep {/$timestamp/} @timelist){
 | |
| 						push @timelist, $timestamp;
 | |
| 					}
 | |
| 					$hash{$name}{$timestamp} = sprintf "%.4f", $sum;
 | |
| 				} elsif ($line =~ /^(\d+): (\S+)/){
 | |
| 					$timestamp = $1;
 | |
| 					$sum = $2;
 | |
| 					if(! grep {/$timestamp/} @timelist){
 | |
| 						push @timelist, $timestamp;
 | |
| 					}
 | |
| 					$hash{$name}{$timestamp} = sprintf "%.4f", $sum;
 | |
| 				}
 | |
| 			}
 | |
| 		}
 | |
| 		$line = join "\t", (@namelist);
 | |
| 		$line = "                          ".$line;
 | |
| 		push @$result, $line;
 | |
| 		@timelist = sort @timelist;
 | |
| 		foreach $timestamp (@timelist){
 | |
| 			$line = localtime($timestamp)."  ";
 | |
| 			foreach $name (@namelist){
 | |
| 				if(exists $hash{$name}{$timestamp}){
 | |
| 					$line =$line."$hash{$name}{$timestamp}\t";
 | |
| 				} else {
 | |
| 					$line = $line."-\t";
 | |
| 				}
 | |
| 			}
 | |
| 			push @$result, $line;
 | |
| 		}
 | |
| 	}
 | |
| 	
 | |
| 	return $result;
 | |
| 
 | |
| }
 | |
| 
 | |
| sub showeventlog
 | |
| {
 | |
|   my @result = ();
 | |
|   my ($table, $node,$attrs,$start_time,$end_time,$where) = @_;
 | |
| 
 | |
|   my $need_filter = 0;  #need second search to sql
 | |
|   my @attr = ();
 | |
|   my @attrkey = ();
 | |
|   my @severity = ('Informational', 'Warning', 'Critical');
 | |
| 
 | |
|   if(!$attrs){
 | |
|     @attrkey = ('eventtype','monitor','monnode','application',
 | |
|                'component','id','severity','message','rawdata','comments');
 | |
|   } else {
 | |
|     @attrkey = split /,/, $attrs;
 | |
|   }
 | |
|   
 | |
|   #node 
 | |
|   push @attr, "node==$node";
 | |
|   #plugin
 | |
|   push @attr, "application==RMC";
 | |
|   #where
 | |
|   if(defined($where)){
 | |
|     foreach my $a (@$where){
 | |
|       if($a =~ /severity([!=><]+)(\w+)/){
 | |
|         my $op = $1;
 | |
|         my $sev = $2;
 | |
|         if(($op eq '==')||($op eq '!=')){
 | |
|           push @attr, $a;
 | |
|         } elsif($op eq '>=') {
 | |
|           foreach my $s (@severity){
 | |
|             if($sev =~ /^$s$/i){
 | |
|               last; 
 | |
|             }
 | |
|             push @attr, "severity!=$s"; 
 | |
|           }
 | |
|         } elsif($op eq '<=') {
 | |
|           my $s = pop @severity;
 | |
|           while($s !~ /^$sev$/i){
 | |
|             push @attr, "severity!=$s";
 | |
|             $s = pop @severity;
 | |
|           }
 | |
|         } elsif($op eq '>') {
 | |
|           foreach my $s (@severity){
 | |
|             if($sev =~ /^$s$/i){
 | |
|               push @attr, "severity!=$s";
 | |
|               last;
 | |
|             }
 | |
|           }
 | |
|         } elsif($op eq '<') {
 | |
|           my $s = pop @severity;
 | |
|           while($sev !~ /^$s$/i){
 | |
|             push @attr, "severity!=$s";
 | |
|             $s = pop @severity;
 | |
|           }
 | |
|           push @attr, "severity!=$s";
 | |
|         } 
 | |
|       } else {
 | |
|         push @attr, $a;
 | |
|       }
 | |
|     } 
 | |
|   }
 | |
|   #eventtime
 | |
|   my ($s_sec,$s_min,$s_hour,$s_mday,$s_mon,$s_year) = localtime($start_time);
 | |
|   my ($e_sec,$e_min,$e_hour,$e_mday,$e_mon,$e_year) = localtime($end_time);
 | |
|   my $tmp = sprintf("eventtime>=%04d-%02d-%02d %02d:%02d:%02d",$s_year+1900,$s_mon+1,$s_mday,$s_hour,$s_min,$s_sec);
 | |
|   push @attr, $tmp;
 | |
|   $tmp = sprintf("eventtime<=%04d-%02d-%02d %02d:%02d:%02d",$e_year+1900,$e_mon+1,$e_mday,$e_hour,$e_min,$e_sec);
 | |
|   push @attr, $tmp;
 | |
| 
 | |
|   my @r = $table->getAllAttribsWhere(\@attr, 'eventtime', @attrkey);
 | |
| 
 | |
|   push @result, (join ",", @attrkey);
 | |
|   $result[0] = "eventtime,$result[0]";
 | |
|   foreach my $entry (@r){
 | |
|     my $str = "\'$entry->{eventtime}\'";
 | |
|     foreach my $a (@attrkey){
 | |
|       $str = $str. ",\'$entry->{$a}\'";
 | |
|     }
 | |
|     push @result, $str;
 | |
|   }
 | |
|   return \@result;
 | |
|   
 | |
| }
 | |
| 
 | |
| #--------------------------------------------------------------------------------
 | |
| =head3    show
 | |
|       This function configures the cluster for the given nodes.  
 | |
|       This function is called when moncfg command is issued or when xcatd starts
 | |
|       on the service node. It will configure the cluster to include the given nodes within
 | |
|       the monitoring doamin. 
 | |
|     Arguments:
 | |
|        p_nodes -- a pointer to an arrays of nodes to be added for monitoring. none means all.
 | |
|        scope -- the action scope, it indicates the node type the action will take place.
 | |
|                 0 means localhost only. 
 | |
|                 2 means localhost and nodes, 
 | |
|        callback -- the callback pointer for error and status displaying. It can be null.
 | |
|     Returns:
 | |
|        (error code, error message)
 | |
| =cut
 | |
| #--------------------------------------------------------------------------------
 | |
| sub show 
 | |
| {
 | |
|   print "rmcmon:show called\n";
 | |
|   no strict 'refs';
 | |
|   my ($noderef, $sum, $time, $attrs, $pe, $where,$callback) = @_;
 | |
|   my @monnodes = ();
 | |
|   my $rsp = {};
 | |
|   my $localhostname=hostname();
 | |
|   my $start_time = undef;
 | |
|   my $end_time = undef;
 | |
|   my $node = undef;
 | |
|   my $output = undef;
 | |
|   my $rrddir = undef;
 | |
| 
 | |
|   $end_time = `date +%s`;
 | |
|   if($time =~ /(\d+)-(\d+)/){
 | |
|     $start_time = $end_time - $1 * 60;
 | |
|     $end_time = $end_time - $2 * 60;
 | |
|   } else {
 | |
|     $start_time = $end_time - $time * 60;
 | |
|   }
 | |
|   
 | |
|   foreach $node (@$noderef){
 | |
|     my $table = xCAT::Table->new('nodetype');
 | |
|     my $entry = $table->getNodeAttribs($node, ['nodetype']);
 | |
|     if($entry && ($entry->{nodetype} =~ /$::NODETYPE_OSI/)){
 | |
|       push @monnodes, $node;
 | |
|     }
 | |
|   }
 | |
|   
 | |
|   #the identification of this node
 | |
|   my $isSV=xCAT::Utils->isServiceNode();
 | |
| 
 | |
|   if(!$isSV && ($sum&0x2)){
 | |
|     push @monnodes, $localhostname;
 | |
|   }
 | |
|   $sum &= 0x1;
 | |
| 
 | |
|   if($pe =~ /p/){
 | |
|   if($sum){
 | |
|     foreach $node (@monnodes){
 | |
|       if($node eq $localhostname){
 | |
| 	$rrddir = "/var/rrd/cluster";
 | |
| 	my @metrixconf = xCAT_monitoring::rmcmetrix::get_metrix_conf();
 | |
| 	my $rmetrixcmd = undef;
 | |
|   	while(@metrixconf){
 | |
| 	  my ($rsrc, $rname, $attrlist, $minute);
 | |
| 	  $rsrc  = shift @metrixconf;
 | |
| 	  $rname = shift @metrixconf;
 | |
| 	  $attrlist = shift @metrixconf;
 | |
| 	  $minute = shift @metrixconf;
 | |
| 	  $rmetrixcmd = "/opt/xcat/sbin/rmcmon/rmcmetrixmon sum $rsrc $attrlist $minute";
 | |
| 	  xCAT::Utils->runcmd($rmetrixcmd, 0);
 | |
|         }
 | |
|       }	elsif(xCAT::Utils->isSN($node)){
 | |
| 	$rrddir = "$node:summary";
 | |
|       } else {
 | |
|         $rrddir = "/var/rrd/$node";
 | |
|       }
 | |
|       $output = &showmetrix($rrddir, $attrs, $start_time, $end_time);
 | |
|       push @{$rsp->{data}}, "\n$node-summary:";
 | |
|       push @{$rsp->{data}}, @$output;
 | |
|     }
 | |
|   } else {
 | |
|     foreach $node (@monnodes){
 | |
|       $rrddir = "/var/rrd/$node";
 | |
|       $output = &showmetrix($rrddir, $attrs, $start_time, $end_time);
 | |
|       push @{$rsp->{data}}, "\n$node:";
 | |
|       push @{$rsp->{data}}, @$output;
 | |
|     }
 | |
|   }
 | |
|   } elsif($pe =~ /e/){
 | |
|     my $eventtable =xCAT::Table->new("eventlog", -create =>0);
 | |
|     if (!$eventtable) {
 | |
|       push @{$rsp->{data}}, "Error:Can't open table eventlog!";
 | |
|       return -1;
 | |
|     }
 | |
|     foreach $node (@monnodes){
 | |
|       push @{$rsp->{data}}, "\n$node:";
 | |
|       $output = showeventlog($eventtable,$node,$attrs,$start_time,$end_time,$where);
 | |
|       push @{$rsp->{data}}, @$output;
 | |
|     }
 | |
|     $eventtable->close();
 | |
|   }
 | |
|   $callback->($rsp);
 | |
|   return (0, "");
 | |
| }
 | |
| 
 |