Subversion Repositories havirt

Rev

Rev 29 | Details | Compare with Previous | Last modification | View Log | RSS feed

Rev Author Line No. Line
3 rodolico 1
#!/usr/bin/env perl
2
 
3
# All functions related to manipulating a specific node
4
# part of havirt.
5
 
4 rodolico 6
# Copyright 2024 Daily Data, Inc.
7
# 
8
# Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following 
9
# conditions are met:
10
#
11
#   Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer.
12
#   Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer 
13
#   in the documentation and/or other materials provided with the distribution.
14
#   Neither the name of the copyright holder nor the names of its contributors may be used to endorse or promote products derived
15
#   from this software without specific prior written permission.
16
# 
17
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT
18
# NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL
19
# THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20
# (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
21
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
22
# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
23
 
3 rodolico 24
# v0.0.1 20240602 RWR
25
# Initial setup
26 rodolico 26
#
27
# v1.2.0 20240826 RWR
28
# Added some code to migrate domains if node placed in maintenance mode
29
# Added a lot of 'verbose' print lines, and modified for new flag structure
30
#
38 rodolico 31
# v1.2.1 20240828 RWR
32
# Fixed node maintenance, adding scanning and fixing some bugs with
33
# the migration code
3 rodolico 34
 
35
package node;
36
 
37
use warnings;
38
use strict;  
39
 
4 rodolico 40
# define the version number
41
# see https://metacpan.org/pod/release/JPEACOCK/version-0.97/lib/version.pod
42
use version;
38 rodolico 43
our $VERSION = version->declare("1.2.1");
3 rodolico 44
 
4 rodolico 45
 
46
use Data::Dumper;
47
 
3 rodolico 48
use Exporter;
49
 
50
our @ISA = qw( Exporter );
51
our @EXPORT = qw( 
5 rodolico 52
                  &node &list &update &scan &add
3 rodolico 53
                );
54
 
4 rodolico 55
# Translation table: label printed by 'virsh nodeinfo' => key under which
# update() stores the value in the status database. Labels not listed here
# are stored under their original name.
my %conversion = (
   # processor description
   'CPU model'          => 'cpu_model',
   'CPU frequency'      => 'clock',
   # processor topology
   'CPU(s)'             => 'cpu_count',
   'CPU socket(s)'      => 'cpu_socket',
   'Core(s) per socket' => 'cpu_cores',
   'Thread(s) per core' => 'threads_per_core',
   'NUMA cell(s)'       => 'numa_cells',
   # memory
   'Memory size'        => 'memory',
);
3 rodolico 66
 
9 rodolico 67
# Build the help screen for the 'node' module.
# Takes no arguments.
# Returns one string: every usage/description line followed by a newline.
sub help {
   my @usage = (
      "node update [nodename|-t nodename]",
      "\tUpdates capabilities on one or more nodes, default is all nodes",
      "node list [--format|-f screen|tsv]",
      "\tLists all nodes with some statistics about them as screen or tsv (default screen)",
      "node scan [nodename|-t nodename]",
      "\tUpdates list of domains on one or more existing nodes, default is all nodes",
      "node maintenance nodename [on|off --target=targetNode]",
      "\ton - set maintenance flag; no domains can be started/migrated to node",
      "\t     target must be set with the --target flag",
      "\toff - Allows domains to be migrated/started on node",
      "\tnothing - displays current maintenance flag",
      "\tNote: a node with any domains running can not have maintenance mode turned on",
   );
   # terminate each entry individually instead of join + trailing newline
   return join( '', map { "$_\n" } @usage );
}
84
 
85
 
5 rodolico 86
# Lists every node in the status database together with all attributes
# stored for it (the values gathered by update() plus flags such as
# 'maintenance').
#
# Takes no arguments. Refreshes $main::statusDB through main::readDB, builds
# a header row and one data row per node (nodes sorted by name), passes both
# to main::report as array references and returns whatever main::report returns.
#
# The columns are the union of the attribute names of ALL nodes, and every
# row is emitted in header order with '' for an attribute a node lacks.
# Previously the header came from the first node only while each row used
# its own keys, so nodes with differing attributes produced shifted columns.
# With no nodes at all, both header and data are empty.
sub list {
   &main::readDB();
   my $nodes = $main::statusDB->{'node'} || {};

   # collect every attribute name used by any node
   my %columnSeen;
   foreach my $node ( keys %$nodes ) {
      $columnSeen{$_} = 1 foreach keys %{ $nodes->{$node} };
   }
   my @columns = sort keys %columnSeen;

   # 'Node' always leads the header, but only when there is something to show
   my @header = %$nodes ? ( 'Node', @columns ) : ();

   my @data;
   foreach my $node ( sort keys %$nodes ) {
      my $info = $nodes->{$node};
      push @data, [ $node, map { exists $info->{$_} ? $info->{$_} : '' } @columns ];
   }
   return &main::report( \@header, \@data );
}
108
 
5 rodolico 109
# Get hardware information about one or more nodes by running
# 'virsh nodeinfo' on each and storing the result in
# $main::statusDB->{'node'}->{nodename}. Really only needs to be done when a
# node is first defined, or if there is a hardware upgrade.
#
# Parameters: a list of node names. The value of the --target flag
#    ($main::config->{'flags'}->{'target'}) is appended when set. When the
#    resulting list is empty, every node already in the database is used.
# Returns: the string "Node has been updated\n" followed by the commands that
#    would have been run (dryrun flag only), newline separated.
# Side effects: opens the database through main::readDB(1) and writes it
#    back with main::writeDB. The write also happens on a dry run.
#
# Fix: the command output is now actually captured. The original statement
# "my $return, `$command`;" declared the variable and threw the output away,
# so no node information was ever stored. Output lines that are not of the
# form "key: value" are skipped instead of producing undef warnings.
sub update {
   &main::readDB( 1 ); # open and lock so we can write to it later
   my $flags = $main::config->{'flags'} || {};
   my @return;
   my @requiredFields = ( 'maintenance' );

   # work on a copy of the arguments rather than modifying @_
   my @targets = @_;
   push @targets, $flags->{'target'} if $flags->{'target'};
   @targets = keys %{$main::statusDB->{'node'}} unless @targets;

   while ( my $nodename = shift @targets ) {
      print "Updating $nodename\n" if $flags->{'debug'} || $flags->{'verbose'};
      my $command = &main::makeCommand($nodename, "virsh nodeinfo" );
      if ( $flags->{'dryrun'} ) {
         # only report what would have been executed
         push @return, $command;
         next;
      }
      my $output = `$command`;
      $output = '' unless defined $output; # backticks yield undef if the command could not be run
      print "Output of [$command] is\n" . $output if $flags->{'debug'};
      foreach my $line ( split( "\n", $output ) ) {
         # limit of 2 keeps a value intact even if it contains ': ' itself
         my ($key, $value) = split( /:\s+/, $line, 2 );
         next unless defined $key && length $key && defined $value;
         # "2400 MHz", "16384 KiB" and the like: keep only the number
         $value = $1 if $value =~ m/^(\d+)\s+[a-z]+$/i;
         $key = $conversion{$key} if exists( $conversion{$key} );
         $main::statusDB->{'node'}->{$nodename}->{$key} = $value;
      }
      # make sure fields other code relies on exist, without clobbering them
      foreach my $field ( @requiredFields ) {
         $main::statusDB->{'node'}->{$nodename}->{$field} = ''
            unless defined ( $main::statusDB->{'node'}->{$nodename}->{$field} );
      }
   } # while
   print "main::statusDB->{'node'} state after update\n" . Dumper( $main::statusDB->{'node'} ) if $flags->{'debug'};
   &main::writeDB();
   return "Node has been updated\n" . join( "\n", @return ) . "\n";
}
149
 
5 rodolico 150
 
151
# Entry point for 'node scan'. All of the work is delegated: the arguments
# are handed to main::scan and its result is returned as is.
# Per the original notes, that scan determines which domains are running on
# one or more nodes (all nodes unless -t limits it) and is meant to be run
# every few minutes on one of the servers; main::scan is not visible from
# this file, so verify the details there.
sub scan {
   my @requested = @_;
   return &main::scan( @requested );
}
4 rodolico 157
 
3 rodolico 158
 
5 rodolico 159
# Add a new node. Adding is simply an update of a node that is not in the
# database yet, so the arguments go straight to update() and its result
# is returned.
sub add {
   my @nodes = @_;
   return update( @nodes );
}
163
 
25 rodolico 164
# Show or change the maintenance flag of a node.
#
# Parameters:
#    $node   - name of the node; must already exist in $main::statusDB->{'node'}
#    $action - 'on', 'off' (case insensitive) or nothing to just display
# Returns: a string starting with "Maintenance set to On|Off\n", followed by
#    any messages gathered on the way (migration output, errors). For a
#    missing or unknown node only an error message is returned.
#
# 'on': if domains are running on the node they are migrated to the node
# given by the --target flag first. A migration must be followed by a forced
# scan, which locks the database, so the database is first read shared and
# only read exclusively (readDB(1)) immediately before the flag is changed
# and written. It is a kludge, but it works. If domains are still running
# after the migration attempt the flag is left alone.
#
# Fixes over the previous version:
#  - an unknown or missing node name is rejected; it used to be autovivified
#    and written to the database as a phantom node
#  - only 'off' turns maintenance off; any other unrecognised action (a typo,
#    for instance) is reported instead of silently being treated as 'off'
#  - an undefined debug flag no longer causes "uninitialized" warnings
sub maintenance {
   my ( $node, $action ) = @_;
   my $flags   = $main::config->{'flags'} || {};
   my $debug   = $flags->{'debug'} || 0;
   my $verbose = $flags->{'verbose'};
   &main::readDB();

   unless ( defined $node && length $node && exists $main::statusDB->{'node'}->{$node} ) {
      return "Node [" . ( defined $node ? $node : '' ) . "] is not a known node, maintenance flag not changed\n";
   }

   my @return;
   if ( $action ) {
      print "Found action [$action] in node.pm:maintenance\n" if $debug > 1;
      my $wanted = lc( $action );
      if ( $wanted eq 'on' ) {
         my @running = keys %{ $main::statusDB->{'nodePopulation'}->{$node}->{'running'} };
         if ( @running ) {
            # we've requested maintenance mode, but there are domains running on the node
            print "Found domains on $node in node.pm:maintenance\n" if $debug > 1;
            print "Trying to migrate domains off of $node before doing maintenance\n" if $verbose || $debug > 1;
            push @return, &migrateAllDomains( $node, $flags->{'target'}, @running );
            print "Finished migration attempt, forcing a scan\n" if $debug > 1;
            &main::forceScan();
         }
         # look again: the forced scan above is expected to have refreshed the population
         if ( keys %{ $main::statusDB->{'nodePopulation'}->{$node}->{'running'} } ) {
            print "Still found running domains on $node, aborting\n" if $debug > 1;
            push @return,  "Can not mark $node in maintenance mode with running domains";
         } else {
            print "Marking $node as under maintenance\n" if $verbose || $debug;
            &main::readDB(1);
            $main::statusDB->{'node'}->{$node}->{'maintenance'} = 1;
            &main::writeDB();
         }
      } elsif ( $wanted eq 'off' ) {
         print "Marking $node as Online\n" if $verbose || $debug;
         &main::readDB(1);
         $main::statusDB->{'node'}->{$node}->{'maintenance'} = 0;
         &main::writeDB();
      } else {
         push @return, "Unknown action [$action], expected on or off; maintenance flag not changed";
      }
   }
   &main::readDB();
   print Dumper( $main::statusDB ) if $debug > 2;
   return "Maintenance set to " . ( $main::statusDB->{'node'}->{$node}->{'maintenance'} ? 'On' : 'Off' ) . "\n" .
          ( @return ? join( "\n", @return ) . "\n" : '');
}
208
 
25 rodolico 209
 
210
# Migrate a set of domains from one node to another.
#
# Parameters: $from (source node), $to (destination node), then the names
#    of the domains to migrate.
# Returns: when main::validateResources reports a problem for the
#    destination, a message saying the migration can not be done together
#    with that error; otherwise whatever main::migrate returned for each
#    domain, chomped and newline separated, with a trailing newline.
sub migrateAllDomains {
   my ( $from, $to, @domains ) = @_;
   my $flags = $main::config->{'flags'};

   if ( $flags->{'debug'} ) {
      print "In node.pm:migrateAllDomains, migrating\n" . join( "\n", @domains ) . "\nto $to\n";
   }
   if ( $flags->{'verbose'} ) {
      print "Checking for available resources on $to before migrating\n";
   }

   # a true value from validateResources is the reason the move is refused
   my $error = &main::validateResources( $to, @domains );
   return "We can not migrate all of the domains on $from to $to\n$error\n" if $error;

   my @commands;
   foreach my $domain ( @domains ) {
      last unless $domain;   # an empty/false name ends the list
      push @commands, &main::migrate( $domain, $to );
   }
   chomp @commands;
   return join( "\n", @commands ) . "\n";
}
228
 
229