diff options
Diffstat (limited to 'ctdb/utils')
-rw-r--r-- | ctdb/utils/nagios/README | 56 | ||||
-rw-r--r-- | ctdb/utils/nagios/check_ctdb | 279 | ||||
-rw-r--r-- | ctdb/utils/ping_pong/ping_pong.c | 251 | ||||
-rw-r--r-- | ctdb/utils/pmda/Install | 36 | ||||
-rw-r--r-- | ctdb/utils/pmda/README | 84 | ||||
-rw-r--r-- | ctdb/utils/pmda/Remove | 29 | ||||
-rw-r--r-- | ctdb/utils/pmda/config.m4 | 32 | ||||
-rw-r--r-- | ctdb/utils/pmda/domain.h | 19 | ||||
-rw-r--r-- | ctdb/utils/pmda/help | 106 | ||||
-rw-r--r-- | ctdb/utils/pmda/pmda_ctdb.c | 595 | ||||
-rw-r--r-- | ctdb/utils/pmda/pmns | 73 | ||||
-rw-r--r-- | ctdb/utils/pmda/root | 10 | ||||
-rw-r--r-- | ctdb/utils/scsi_io/scsi_io.c | 1152 | ||||
-rw-r--r-- | ctdb/utils/smnotify/smnotify.c | 150 | ||||
-rw-r--r-- | ctdb/utils/smnotify/smnotify.x | 21 |
15 files changed, 2893 insertions, 0 deletions
diff --git a/ctdb/utils/nagios/README b/ctdb/utils/nagios/README new file mode 100644 index 00000000000..99fa6dc328d --- /dev/null +++ b/ctdb/utils/nagios/README @@ -0,0 +1,56 @@ +check_ctdb 0.3 + +This nagios plugin is free software, and comes with ABSOLUTELY NO WARRANTY. +It may be used, redistributed and/or modified under the terms of the GNU +General Public Licence (see http://www.fsf.org/licensing/licenses/gpl.txt). + +CTDB plugin + +Usage: check_ctdb -i <info> + [ -t <timeout> ] [ -w <warn_range> ] [ -c <crit_range> ] + [ -H <host> ] [-s] [ -l <login_name> ] + [ -V ] [ -h ] + + -?, --usage + Print usage information + -h, --help + Print detailed help screen + -V, --version + Print version information + --extra-opts=[section][@file] + Read options from an ini file. See http://nagiosplugins.org/extra-opts for usage + -i, --info=<info> + Information: One of scriptstatus or ping. + -H, --hostname=<login_name> + Host name or IP Address. + -s, --sudo + Use sudo. + -l, --login=<host> + The user to log in as on the remote machine. + -w, --warning=THRESHOLD + Warning threshold. See + http://nagiosplug.sourceforge.net/developer-guidelines.html#THRESHOLDFORMAT + for the threshold format. + -c, --critical=THRESHOLD + Critical threshold. See + http://nagiosplug.sourceforge.net/developer-guidelines.html#THRESHOLDFORMAT + for the threshold format. + -t, --timeout=INTEGER + Seconds before plugin times out (default: 30) + -v, --verbose + Show details for command-line debugging (can repeat up to 3 times) +Supported commands: + * scriptstatus : + check the ctdb scriptstatus command and return CRITICAL if one of the + scripts fails. + Perfdata count the number of scripts by state (ok, disabled, error, + total). + * ping : + check the ctdb ping command. + Perfdata count the number of nodes, the total ping time and the number + of clients. + Thresholds are checked against the number of nodes. + + +Copyright (c) 2011 Nantes Metropole + diff --git a/ctdb/utils/nagios/check_ctdb b/ctdb/utils/nagios/check_ctdb new file mode 100644 index 00000000000..837a0a4539a --- /dev/null +++ b/ctdb/utils/nagios/check_ctdb @@ -0,0 +1,279 @@ +#!/usr/bin/perl -w +# Nagios plugin to monitor CTDB (Clustered Trivial Database) +# +# License: GPL +# Copyright (c) 2011 Nantes Metropole +# Author: Mathieu Parent <math.parent@gmail.com> +# Contributor(s): - +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License version 2 as +# published by the Free Software Foundation. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with this program. If not, see <http://www.gnu.org/licenses/>. +# + +use strict; +use warnings; +use vars qw($PROGNAME $VERSION $output $values $result); +use Nagios::Plugin; +use File::Basename; + +$PROGNAME = basename($0); +$VERSION = '0.4'; + +my $np = Nagios::Plugin->new( + usage => "Usage: %s -i <info>\n" + . " [ -t <timeout> ] [ -w <warn_range> ] [ -c <crit_range> ]\n" + . " [ -H <host> ] [-s] [ -l <login_name> ]\n" + . ' [ -V ] [ -h ]', + version => $VERSION, + plugin => $PROGNAME, + shortname => uc($PROGNAME), + blurb => 'CTDB plugin', + extra => "Supported commands:\n" + . " * scriptstatus :\n" + . " check the ctdb scriptstatus command and return CRITICAL if one of the\n" + . " scripts fails.\n" + . " Perfdata count the number of scripts by state (ok, disabled, error,\n" + . " total).\n" + . " * ping :\n" + . " check the ctdb ping command.\n" + . " Perfdata count the number of nodes, the total ping time and the number\n" + . " of clients.\n" + . " Thresholds are checked against the number of nodes.\n" + . "\n\nCopyright (c) 2011 Nantes Metropole", + timeout => 30, +); + +$np->add_arg( + spec => 'info|i=s', + help => "-i, --info=<info>\n" + . ' Information: One of scriptstatus or ping.', + required => 1, +); + +$np->add_arg( + spec => 'hostname|H=s', + help => "-H, --hostname=<login_name>\n" + . ' Host name or IP Address.', + required => 0, +); + +$np->add_arg( + spec => 'sudo|s', + help => "-s, --sudo\n" + . ' Use sudo.', + required => 0, +); + +$np->add_arg( + spec => 'login|l=s', + help => "-l, --login=<host>\n" + . ' The user to log in as on the remote machine.', + required => 0, +); + +$np->add_arg( + spec => 'warning|w=s', + help => "-w, --warning=THRESHOLD\n" + . " Warning threshold. See\n" + . " http://nagiosplug.sourceforge.net/developer-guidelines.html#THRESHOLDFORMAT\n" + . ' for the threshold format.', + required => 0, +); + +$np->add_arg( + spec => 'critical|c=s', + help => "-c, --critical=THRESHOLD\n" + . " Critical threshold. See\n" + . " http://nagiosplug.sourceforge.net/developer-guidelines.html#THRESHOLDFORMAT\n" + . ' for the threshold format.', + required => 0, +); + +$np->getopts; + +my $info = $np->opts->info; +my $hostname = $np->opts->hostname; +my $login = $np->opts->login; +my $sudo = $np->opts->sudo; +my $warning = $np->opts->warning; +my $critical = $np->opts->critical; +my $percw; +my $percc; + +$output = ""; + +if (defined($critical)) +{ + ($percc, $critical) = check_percantage($critical); + $critical = undef if ($critical eq ''); +} + +if (defined($warning)) +{ + ($percw, $warning) = check_percantage($warning); + $warning = undef if ($warning eq ''); +} + +$np->set_thresholds(critical => $critical, warning => $warning); + +my $stderr; + +sub safe_open_command { + unshift @_, "sudo" if $sudo; + if ($hostname) { + unshift @_, $hostname; + unshift @_, "-l", $login if $login; + unshift @_, "ssh"; + } + open(OLDERR, ">&", \*STDERR) or die "Can't dup STDERR: $!"; + $stderr = ""; + close STDERR; + open(STDERR, ">>", \$stderr) or die "Can't open STDERR: $!"; + if ($np->opts->verbose) { + print "Executing: @_\n"; + } + if (!open(PIPE, '-|', @_)) { + $result = CRITICAL; + $output .= "Cannot open command '@_': $! ($stderr). "; + # restore STDERR + open(STDERR, ">", \*OLDERR) or die "Can't dup OLDERR: $!"; + } +} + +sub safe_close_command { + close(PIPE); + + if ($? == -1) { + $result = CRITICAL; + $output .= "failed to execute: $!. "; + } elsif ($? & 127) { + $result = CRITICAL; + $output .= sprintf("child died with signal %d, %s coredump. ", + ($? & 127), ($? & 128) ? 'with' : 'without'); + } elsif ($? >> 8) { + if (($? >> 8) == 255) { + # ctdb returns -1=255 if any node is disconnected + $result = WARNING; + $output .= sprintf("child exited with value %d. ", $? >> 8) if $output eq ""; + } else { + $result = CRITICAL; + $output .= sprintf("child exited with value %d. ", $? >> 8); + } + } + # restore STDERR + open(STDERR, ">&OLDERR") or die "Can't dup OLDERR: $!"; +} + +# main : + +if ($info eq "scriptstatus") { + $result = OK; + safe_open_command('ctdb', '-Y', 'scriptstatus'); + if ($result == OK) { + my $script_count = 0; + my $ok_script_count = 0; + my $disabled_script_count = 0; + my $error_script_count = 0; + while (<PIPE>) { + next if $. == 1; # Header + $script_count++; + chop; + my ($col0, $type, $name, $code, $status, $start, $end, @error) = split(":"); + if ($col0 ne '') { + # Old version, before 30 Aug 2011 and commit a779d83a6213 + ($type, $name, $code, $status, $start, $end, @error) = ($col0, $type, $name, $code, $status, $start, $end, @error); + } + my $error = join(':', @error); + if ($error ne "") { + $output = "$output ;; " if $output; + $output = "$output$name ($status=$code): $error "; + if ($result != CRITICAL) { + $result = WARNING; + } + } + if ($status eq "OK") { + $ok_script_count++; + next; + } + if ($status eq "DISABLED") { + $disabled_script_count++; + next; + } + $error_script_count++; + $result = WARNING; + } + safe_close_command(); + $np->add_perfdata(label => "ok", value => $ok_script_count, uom => '', + min => 0, max => $script_count); + $np->add_perfdata(label => "disabled", value => $disabled_script_count, uom => '', + min => 0, max => $script_count); + $np->add_perfdata(label => "error", value => $error_script_count, uom => '', + min => 0, max => $script_count, warning => '0', critical => '0'); + $np->add_perfdata(label => "total", value => $script_count, uom => '', + min => 0, max => $script_count); + if ($result == OK) { + $result = $np->check_threshold(check => $error_script_count, warning => '0', critical => '0'); + } + } + $np->nagios_exit($result, $output); +} elsif ($info eq "ping") { + # Get expected nodes count + $result = OK; + safe_open_command('cat', '/etc/ctdb/nodes'); + 1 while( <PIPE> ); + my $max_nodes_count = $.; + safe_close_command(); + # ctdb ping + $result = OK; + safe_open_command('ctdb', '-n', 'all', 'ping'); + if ($result == OK) { + my $nodes_count = 0; + my $time_total = 0.0; + my $clients_count = 0; + while (<PIPE>) { + chop; + if ($_ =~ /^response from (\d+) time=([0-9.]+) sec \((\d+) clients\)$/) { + my ($node_id, $time, $clients) = ($1,$2,$3); + $nodes_count += 1; + $time_total += $time; + $clients_count += $clients; + } elsif ($_ =~ /^Unable to get ping response from node (\d+)$/) { + # + } else { + $result = CRITICAL; + $output .= "'$_' doesn't match regexp. " + } + } + $output .= sprintf("%d missing nodes. ", $max_nodes_count - $nodes_count) if $nodes_count < $max_nodes_count; + safe_close_command(); + $np->add_perfdata(label => "nodes", value => $nodes_count, uom => '', + min => 0, max => $max_nodes_count, warning => $warning, critical => $critical); + $np->add_perfdata(label => "ping_time", value => $time_total, uom => 's', + min => 0, max => undef); + $np->add_perfdata(label => "clients", value => $clients_count, uom => '', + min => 0, max => undef); + if ($result == OK) { + $result = $np->check_threshold(check => $nodes_count); + } + } + $np->nagios_exit($result, $output); +} else { + $np->nagios_exit(UNKNOWN, "Unknown command: '$info'"); +} + +sub check_percantage +{ + my ($number) = shift(@_); + my $perc = $number =~ s/\%//; + return ($perc, $number); +} + diff --git a/ctdb/utils/ping_pong/ping_pong.c b/ctdb/utils/ping_pong/ping_pong.c new file mode 100644 index 00000000000..16f58d8af2b --- /dev/null +++ b/ctdb/utils/ping_pong/ping_pong.c @@ -0,0 +1,251 @@ +/* + A ping-pong fcntl byte range lock test + + Copyright (C) Andrew Tridgell 2002 + Copyright (C) Michael Adam 2012 + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program; if not, see <http://www.gnu.org/licenses/>. +*/ + +/* + This measures the ping-pong byte range lock latency. It is + especially useful on a cluster of nodes sharing a common lock + manager as it will give some indication of the lock managers + performance under stress. + + tridge@samba.org, February 2002 + +*/ + +#define _XOPEN_SOURCE 500 + +#include <stdio.h> +#include <stdlib.h> +#include <sys/time.h> +#include <time.h> +#include <errno.h> +#include <string.h> +#include <unistd.h> +#include <fcntl.h> +#include <sys/mman.h> + +static struct timeval tp1,tp2; + +static int do_reads, do_writes, use_mmap, do_check; + +static void start_timer(void) +{ + gettimeofday(&tp1,NULL); +} + +static double end_timer(void) +{ + gettimeofday(&tp2,NULL); + return (tp2.tv_sec + (tp2.tv_usec*1.0e-6)) - + (tp1.tv_sec + (tp1.tv_usec*1.0e-6)); +} + +/* lock a byte range in a open file */ +static int lock_range(int fd, int offset, int len) +{ + struct flock lock; + + lock.l_type = F_WRLCK; + lock.l_whence = SEEK_SET; + lock.l_start = offset; + lock.l_len = len; + lock.l_pid = 0; + + return fcntl(fd,F_SETLKW,&lock); +} + +/* check whether we could place a lock */ +int check_lock(int fd, int offset, int len) +{ + struct flock lock; + int ret; + + lock.l_type = F_WRLCK; + lock.l_whence = SEEK_SET; + lock.l_start = offset; + lock.l_len = len; + lock.l_pid = 0; + + ret = fcntl(fd, F_GETLK, &lock); + if (ret != 0) { + printf("error calling fcntl F_GETLCK: %s\n", strerror(errno)); + return -1; + } + + if (lock.l_type == F_UNLCK) { + /* we would be able to place the lock */ + return 0; + } + + /* we would not be able to place lock */ + printf("check_lock failed: lock held: " + "pid='%d', type='%d', start='%d', len='%d'\n", + (int)lock.l_pid, (int)lock.l_type, (int)lock.l_start, (int)lock.l_len); + return 1; +} + +/* unlock a byte range in a open file */ +static int unlock_range(int fd, int offset, int len) +{ + struct flock lock; + + lock.l_type = F_UNLCK; + lock.l_whence = SEEK_SET; + lock.l_start = offset; + lock.l_len = len; + lock.l_pid = 0; + + return fcntl(fd,F_SETLKW,&lock); +} + +/* run the ping pong test on fd */ +static void ping_pong(int fd, int num_locks) +{ + unsigned count = 0; + int i=0, loops=0; + unsigned char *val; + unsigned char incr=0, last_incr=0; + unsigned char *p = NULL; + int ret; + + ret = ftruncate(fd, num_locks+1); + if (ret == -1) { + printf("ftruncate failed: %s\n", strerror(errno)); + return; + } + + if (use_mmap) { + p = mmap(NULL, num_locks+1, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0); + if (p == MAP_FAILED) { + printf("mmap failed: %s\n", strerror(errno)); + return; + } + } + + val = (unsigned char *)calloc(num_locks+1, sizeof(unsigned char)); + if (val == NULL) { + printf("calloc failed\n"); + return; + } + + start_timer(); + + lock_range(fd, 0, 1); + i = 0; + + while (1) { + if (lock_range(fd, (i+1) % num_locks, 1) != 0) { + printf("lock at %d failed! - %s\n", + (i+1) % num_locks, strerror(errno)); + } + if (do_check) { + ret = check_lock(fd, i, 1); + } + if (do_reads) { + unsigned char c; + if (use_mmap) { + c = p[i]; + } else if (pread(fd, &c, 1, i) != 1) { + printf("read failed at %d\n", i); + } + incr = c - val[i]; + val[i] = c; + } + if (do_writes) { + char c = val[i] + 1; + if (use_mmap) { + p[i] = c; + } else if (pwrite(fd, &c, 1, i) != 1) { + printf("write failed at %d\n", i); + } + } + if (unlock_range(fd, i, 1) != 0) { + printf("unlock at %d failed! - %s\n", + i, strerror(errno)); + } + i = (i+1) % num_locks; + count++; + if (loops > num_locks && incr != last_incr) { + last_incr = incr; + printf("data increment = %u\n", incr); + fflush(stdout); + } + if (end_timer() > 1.0) { + printf("%8u locks/sec\r", + (unsigned)(2*count/end_timer())); + fflush(stdout); + start_timer(); + count=0; + } + loops++; + } +} + +int main(int argc, char *argv[]) +{ + char *fname; + int fd, num_locks; + int c; + + while ((c = getopt(argc, argv, "rwmc")) != -1) { + switch (c){ + case 'w': + do_writes = 1; + break; + case 'r': + do_reads = 1; + break; + case 'm': + use_mmap = 1; + break; + case 'c': + do_check = 1; + break; + default: + fprintf(stderr, "Unknown option '%c'\n", c); + exit(1); + } + } + + argv += optind; + argc -= optind; + + if (argc < 2) { + printf("ping_pong [options] <file> <num_locks>\n"); + printf(" -r do reads\n"); + printf(" -w do writes\n"); + printf(" -m use mmap\n"); + printf(" -c check locks\n"); + exit(1); + } + + fname = argv[0]; + num_locks = atoi(argv[1]); + if (num_locks <= 0) { + printf("num_locks should be > 0\n"); + exit(1); + } + + fd = open(fname, O_CREAT|O_RDWR, 0600); + if (fd == -1) exit(1); + + ping_pong(fd, num_locks); + + return 0; +} diff --git a/ctdb/utils/pmda/Install b/ctdb/utils/pmda/Install new file mode 100644 index 00000000000..a56a63506a8 --- /dev/null +++ b/ctdb/utils/pmda/Install @@ -0,0 +1,36 @@ +#! /bin/sh +# +# Copyright (c) 1997 Silicon Graphics, Inc. All Rights Reserved. +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU General Public License as published by the +# Free Software Foundation; either version 2 of the License, or (at your +# option) any later version. +# +# This program is distributed in the hope that it will be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +# for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +# +# Install the ctdb PMDA and/or PMNS +# + +. $PCP_DIR/etc/pcp.env +. $PCP_SHARE_DIR/lib/pmdaproc.sh + +iam=ctdb +pmda_interface=2 + +# runs as daemon and only supports pipe IPC +daemon_opt=true +dso_opt=false +pipe_opt=true +socket_opt=false + +pmdaSetup +pmdaInstall +exit 0 diff --git a/ctdb/utils/pmda/README b/ctdb/utils/pmda/README new file mode 100644 index 00000000000..f8dbbbccac4 --- /dev/null +++ b/ctdb/utils/pmda/README @@ -0,0 +1,84 @@ +CTDB PMDA +=========== + +This PMDA extracts metrics from the locally running ctdbd daemon for +export to PMCD. + +Note: + This PMDA may be remade from source and hence requires IDO (or + more specifically a C compiler) to be installed. + + Uses of make(1) may fail (without removing or clobbering files) + if the C compiler cannot be found. This is most likely to + happen when running the PMDA ./Install script. + + The only remedial action is to install the C compiler, or + hand-craft changes to the Makefile. + +Metrics +======= + +The file ./help contains descriptions for all of the metrics exported +by this PMDA. + +Once the PMDA has been installed, the following command will list all +the available metrics and their explanatory "help" text: + + $ pminfo -fT ctdb + +Installation +============ + + + # cd $PCP_PMDAS_DIR/ctdb + + + Check that there is no clash in the Performance Metrics Domain + defined in ./domain.h and the other PMDAs currently in use (see + $PCP_PMCDCONF_PATH). If there is, edit ./domain.h to choose another + domain number. + + + Then simply use + + # ./Install + + and choose both the "collector" and "monitor" installation + configuration options. + + You will be prompted to choose either a daemon implementation + or a DSO implementation of the PMDA, and in the case of the daemon + variant to select an IPC method -- everything else is automated + +De-installation +=============== + + + Simply use + + # cd $PCP_PMDAS_DIR/ctdb + # ./Remove + +Troubleshooting +=============== + + + After installing or restarting the agent, the PMCD log file + ($PCP_LOG_DIR/pmcd/pmcd.log) and the PMDA log file + ($PCP_LOG_DIR/pmcd/pmda_ctdb.log) should be checked for any warnings + or errors. + + +Adding a New Metric +=================== + +This section walks through the development task of adding a new metric to the +CTDB PMDA. + + + Define the metric in the pmns file with a unique metric id. See the pmns(4) + man page for details. + + + Add a description of the metric to the help file. + + + Taking note of the previously assigned metric id, add a new entry to the + metrictab structure in pmda_ctdb.c. See the pmdaInit(3) man page for + details. + + + Ensure the counter is already a member of the ctdb_statistics structure. + Finally, add code to pmda_ctdb_fetch_cb() to handle fetch requests for the + newly defined metric. diff --git a/ctdb/utils/pmda/Remove b/ctdb/utils/pmda/Remove new file mode 100644 index 00000000000..7d1c509e50e --- /dev/null +++ b/ctdb/utils/pmda/Remove @@ -0,0 +1,29 @@ +#! /bin/sh +# +# Copyright (c) 1997 Silicon Graphics, Inc. All Rights Reserved. +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU General Public License as published by the +# Free Software Foundation; either version 2 of the License, or (at your +# option) any later version. +# +# This program is distributed in the hope that it will be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +# for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +# +# Remove the ctdb PMDA +# + +. $PCP_DIR/etc/pcp.env +. $PCP_SHARE_DIR/lib/pmdaproc.sh + +iam=ctdb + +pmdaSetup +pmdaRemove +exit 0 diff --git a/ctdb/utils/pmda/config.m4 b/ctdb/utils/pmda/config.m4 new file mode 100644 index 00000000000..6b3fbb0ea14 --- /dev/null +++ b/ctdb/utils/pmda/config.m4 @@ -0,0 +1,32 @@ +AC_ARG_ENABLE(pmda, +AS_HELP_STRING([--enable-pmda], [Turn on PCP pmda support (default=no)])) + +HAVE_PMDA=no + +if eval "test x$enable_pmda = xyes"; then + HAVE_PMDA=yes + + AC_CHECK_HEADERS(pcp/pmapi.h pcp/impl.h pcp/pmda.h, [], + [AC_MSG_ERROR([Missing PCP pmda headers])], + [[#ifdef HAVE_PCP_PMAPI_H + # include <pcp/pmapi.h> + #endif + #ifdef HAVE_PCP_IMPL_H + # include <pcp/impl.h> + #endif + #ifdef HAVE_PCP_PMDA_H + # include <pcp/pmda.h> + #endif + ]]) +fi + +if test x"$HAVE_PMDA" = x"yes"; then + CTDB_PMDA=bin/pmdactdb + CTDB_PMDA_INSTALL=install_pmda +else + CTDB_PMDA= + CTDB_PMDA_INSTALL= +fi + +AC_SUBST(CTDB_PMDA) +AC_SUBST(CTDB_PMDA_INSTALL) diff --git a/ctdb/utils/pmda/domain.h b/ctdb/utils/pmda/domain.h new file mode 100644 index 00000000000..0bed7fef599 --- /dev/null +++ b/ctdb/utils/pmda/domain.h @@ -0,0 +1,19 @@ +/* domain.h + * + * Copyright (c) 2004-2009 Silicon Graphics, Inc. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ +#define CTDB 110 diff --git a/ctdb/utils/pmda/help b/ctdb/utils/pmda/help new file mode 100644 index 00000000000..0e9984eab3a --- /dev/null +++ b/ctdb/utils/pmda/help @@ -0,0 +1,106 @@ +# +# Copyright (c) 2000-2004 Silicon Graphics, Inc. All Rights Reserved. +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU General Public License as published by the +# Free Software Foundation; either version 2 of the License, or (at your +# option) any later version. +# +# This program is distributed in the hope that it will be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License +# for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA +# +# ctdb PMDA help file in the ASCII format +# +# lines beginning with a # are ignored +# lines beginning @ introduce a new entry of the form +# @ metric_name oneline-text +# help test goes +# here over multiple lines +# ... +# +# the metric_name is decoded against the default PMNS -- as a special case, +# a name of the form NNN.MM (for numeric NNN and MM) is interpreted as an +# instance domain identification, and the text describes the instance domain +# +# blank lines before the @ line are ignored +# + +@ ctdb.num_clients number of clients connected to ctdbd + +@ ctdb.frozen whether any databases are frozen + +@ ctdb.recovering whether recovery is active + +@ ctdb.client_packets_sent number of packets sent to all clients + +@ ctdb.client_packets_recv number of packets received from all clients + +@ ctdb.node_packets_sent number of packets sent to other nodes + +@ ctdb.node_packets_recv number of packets received from other nodes + +@ ctdb.keepalive_packets_sent number of keepalive packets sent to other nodes + +@ ctdb.keepalive_packets_recv number of keepalive packets received from other nodes + +@ ctdb.node.req_call number of node CTDB_REQ_CALL packets handled + +@ ctdb.node.reply_call number of node CTDB_REPLY_CALL packets handled + +@ ctdb.node.req_dmaster number of node CTDB_REQ_DMASTER packets handled + +@ ctdb.node.reply_dmaster number of node CTDB_REPLY_DMASTER packets handled + +@ ctdb.node.reply_error number of node CTDB_REPLY_ERROR packets handled + +@ ctdb.node.req_message number of node CTDB_REQ_MESSAGE packets handled + +@ ctdb.node.req_control number of node CTDB_REQ_CONTROL packets handled + +@ ctdb.node.reply_control number of node CTDB_REPLY_CONTROL packets handled + +@ ctdb.client.req_call number of client CTDB_REQ_CALL packets handled + +@ ctdb.client.req_message number of client CTDB_REQ_MESSAGE packets handled + +@ ctdb.client.req_control number of client CTDB_REQ_CONTROL packets handled + +@ ctdb.timeouts.call (counter not implemented) number of call timeouts + +@ ctdb.timeouts.control number of node control message request timeouts awaiting reply + +@ ctdb.timeouts.traverse number of database traversal timeouts + +@ ctdb.total_calls total number of client ctdb request calls received + +@ ctdb.pending_calls total number of client ctdb request calls in progress + +@ ctdb.lockwait_calls number of tdb chainlock lockwait calls + +@ ctdb.pending_lockwait_calls number of lockwait calls waiting for a lock + +@ ctdb.childwrite_calls number of childwrite calls + +@ ctdb.pending_childwrite_calls number of childwrite calls in progress + +@ ctdb.memory_used total size of the ctdbd null talloc pool + +@ ctdb.max_hop_count maximum hops performed by a CTDB_REQ_CALL packet + +@ ctdb.max_reclock_ctdbd maximum recovery lock latency during setrecmode + +@ ctdb.max_reclock_recd maximum recovery lock latency as reported by the recovery process + +@ ctdb.max_call_latency maximum time spent handling a client request call + +@ ctdb.max_lockwait_latency maximum time spent waiting for a tdb chainlock + +@ ctdb.max_childwrite_latency maximum time spent performing a childwrite + +@ ctdb.num_recoveries number of recoveries finished diff --git a/ctdb/utils/pmda/pmda_ctdb.c b/ctdb/utils/pmda/pmda_ctdb.c new file mode 100644 index 00000000000..e8033bea25e --- /dev/null +++ b/ctdb/utils/pmda/pmda_ctdb.c @@ -0,0 +1,595 @@ +/* + * CTDB Performance Metrics Domain Agent (PMDA) for Performance Co-Pilot (PCP) + * + * Copyright (c) 1995,2004 Silicon Graphics, Inc. All Rights Reserved. + * Copyright (c) 2011 David Disseldorp + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation; either version 2 of the License, or (at your + * option) any later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +#include <pcp/pmapi.h> +#include <pcp/impl.h> +#include <pcp/pmda.h> +#include "../../include/includes.h" +#include "../../include/ctdb.h" +#include "../../include/ctdb_private.h" +#include "../../include/ctdb_protocol.h" +#include "domain.h" + +/* + * CTDB PMDA + * + * This PMDA connects to the locally running ctdbd daemon and pulls + * statistics for export via PCP. The ctdbd Unix domain socket path can be + * specified with the CTDB_SOCKET environment variable, otherwise the default + * path is used. + */ + +/* + * All metrics supported in this PMDA - one table entry for each. + * The 4th field specifies the serial number of the instance domain + * for the metric, and must be either PM_INDOM_NULL (denoting a + * metric that only ever has a single value), or the serial number + * of one of the instance domains declared in the instance domain table + * (i.e. in indomtab, above). + */ +static pmdaMetric metrictab[] = { + /* num_clients */ + { NULL, { PMDA_PMID(0,0), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* frozen */ + { NULL, { PMDA_PMID(1,2), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* recovering */ + { NULL, { PMDA_PMID(3,3), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* client_packets_sent */ + { NULL, { PMDA_PMID(4,4), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* client_packets_recv */ + { NULL, { PMDA_PMID(5,5), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* node_packets_sent */ + { NULL, { PMDA_PMID(6,6), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* node_packets_recv */ + { NULL, { PMDA_PMID(7,7), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* keepalive_packets_sent */ + { NULL, { PMDA_PMID(8,8), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* keepalive_packets_recv */ + { NULL, { PMDA_PMID(9,9), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_call */ + { NULL, { PMDA_PMID(10,10), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* reply_call */ + { NULL, { PMDA_PMID(10,11), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_dmaster */ + { NULL, { PMDA_PMID(10,12), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* reply_dmaster */ + { NULL, { PMDA_PMID(10,13), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* reply_error */ + { NULL, { PMDA_PMID(10,14), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_message */ + { NULL, { PMDA_PMID(10,15), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_control */ + { NULL, { PMDA_PMID(10,16), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* reply_control */ + { NULL, { PMDA_PMID(10,17), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_call */ + { NULL, { PMDA_PMID(11,18), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_message */ + { NULL, { PMDA_PMID(11,19), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* req_control */ + { NULL, { PMDA_PMID(11,20), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* call */ + { NULL, { PMDA_PMID(12,21), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,0) }, }, + /* control */ + { NULL, { PMDA_PMID(12,22), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,0) }, }, + /* traverse */ + { NULL, { PMDA_PMID(12,23), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,0) }, }, + /* total_calls */ + { NULL, { PMDA_PMID(13,24), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* pending_calls */ + { NULL, { PMDA_PMID(14,25), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* locks.num_calls */ + { NULL, { PMDA_PMID(15,27), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* locks.pending_calls */ + { NULL, { PMDA_PMID(16,27), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* childwrite_calls */ + { NULL, { PMDA_PMID(17,28), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_COUNTER, + PMDA_PMUNITS(0,0,1,0,0,PM_COUNT_ONE) }, }, + /* pending_childwrite_calls */ + { NULL, { PMDA_PMID(18,29), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* memory_used */ + { NULL, { PMDA_PMID(19,30), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(1,0,0,PM_SPACE_BYTE,0,0) }, }, + /* max_hop_count */ + { NULL, { PMDA_PMID(20,31), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, + /* max_reclock_ctdbd */ + { NULL, { PMDA_PMID(21,32), PM_TYPE_DOUBLE, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,1,0,0,PM_TIME_SEC,0) }, }, + /* max_reclock_recd */ + { NULL, { PMDA_PMID(22,33), PM_TYPE_DOUBLE, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,1,0,0,PM_TIME_SEC,0) }, }, + /* max_call_latency */ + { NULL, { PMDA_PMID(23,34), PM_TYPE_DOUBLE, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,1,0,0,PM_TIME_SEC,0) }, }, + /* locks.latency.max */ + { NULL, { PMDA_PMID(24,35), PM_TYPE_DOUBLE, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,1,0,0,PM_TIME_SEC,0) }, }, + /* childwrite_latency.max */ + { NULL, { PMDA_PMID(25,36), PM_TYPE_DOUBLE, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,1,0,0,PM_TIME_SEC,0) }, }, + /* num_recoveries */ + { NULL, { PMDA_PMID(26,37), PM_TYPE_U32, PM_INDOM_NULL, PM_SEM_INSTANT, + PMDA_PMUNITS(0,0,0,0,0,0) }, }, +}; + +static struct event_context *ev; +static struct ctdb_context *ctdb; +static struct ctdb_statistics *stats; + +static void +pmda_ctdb_q_read_cb(uint8_t *data, size_t cnt, void *args) +{ + if (cnt == 0) { + fprintf(stderr, "ctdbd unreachable\n"); + /* cleanup on request timeout */ + return; + } + + ctdb_client_read_cb(data, cnt, args); +} + + +static int +pmda_ctdb_daemon_connect(void) +{ + const char *socket_name; + int ret; + struct sockaddr_un addr; + + ev = event_context_init(NULL); + if (ev == NULL) { + fprintf(stderr, "Failed to init event ctx\n"); + return -1; + } + + ctdb = ctdb_init(ev); + if (ctdb == NULL) { + fprintf(stderr, "Failed to init ctdb\n"); + goto err_ev; + } + + socket_name = getenv("CTDB_SOCKET"); + if (socket_name == NULL) { + socket_name = CTDB_PATH; + } + + ret = ctdb_set_socketname(ctdb, socket_name); + if (ret == -1) { + fprintf(stderr, "ctdb_set_socketname failed - %s\n", + ctdb_errstr(ctdb)); + goto err_ctdb; + } + + /* + * ctdb_socket_connect() sets a default queue callback handler that + * calls exit() if ctdbd is unavailable on recv, use our own wrapper to + * work around this + */ + + memset(&addr, 0, sizeof(addr)); + addr.sun_family = AF_UNIX; + strncpy(addr.sun_path, ctdb->daemon.name, sizeof(addr.sun_path)); + + ctdb->daemon.sd = socket(AF_UNIX, SOCK_STREAM, 0); + if (ctdb->daemon.sd == -1) { + fprintf(stderr, "Failed to open client socket\n"); + goto err_ctdb; + } + + set_nonblocking(ctdb->daemon.sd); + set_close_on_exec(ctdb->daemon.sd); + + if (connect(ctdb->daemon.sd, (struct sockaddr *)&addr, sizeof(addr)) == -1) { + fprintf(stderr, "Failed to connect to ctdb daemon via %s\n", + ctdb->daemon.name); + goto err_sd; + } + + ctdb->daemon.queue = ctdb_queue_setup(ctdb, ctdb, ctdb->daemon.sd, + CTDB_DS_ALIGNMENT, + pmda_ctdb_q_read_cb, ctdb, + "to-ctdbd"); + if (ctdb->daemon.queue == NULL) { + fprintf(stderr, "Failed to setup queue\n"); + goto err_sd; + } + + ctdb->pnn = ctdb_ctrl_getpnn(ctdb, timeval_current_ofs(3, 0), + CTDB_CURRENT_NODE); + if (ctdb->pnn == (uint32_t)-1) { + fprintf(stderr, "Failed to get ctdb pnn\n"); + goto err_sd; + } + + return 0; +err_sd: + close(ctdb->daemon.sd); +err_ctdb: + talloc_free(ctdb); +err_ev: + talloc_free(ev); + ctdb = NULL; + return -1; +} + +static void +pmda_ctdb_daemon_disconnect(void) +{ + if (ctdb->methods) { + ctdb->methods->shutdown(ctdb); + } + + if (ctdb->daemon.sd != -1) { + close(ctdb->daemon.sd); + } + + talloc_free(ctdb); + talloc_free(ev); + ctdb = NULL; +} + +static int +fill_node(unsigned int item, pmAtomValue *atom) +{ + switch (item) { + case 10: + atom->ul = stats->node.req_call; + break; + case 11: + atom->ul = stats->node.reply_call; + break; + case 12: + atom->ul = stats->node.req_dmaster; + break; + case 13: + atom->ul = stats->node.reply_dmaster; + break; + case 14: + atom->ul = stats->node.reply_error; + break; + case 15: + atom->ul = stats->node.req_message; + break; + case 16: + atom->ul = stats->node.req_control; + break; + case 17: + atom->ul = stats->node.reply_control; + break; + default: + return PM_ERR_PMID; + } + + return 0; +} + +static int +fill_client(unsigned int item, pmAtomValue *atom) +{ + switch (item) { + case 18: + atom->ul = stats->client.req_call; + break; + case 19: + atom->ul = stats->client.req_message; + break; + case 20: + atom->ul = stats->client.req_control; + break; + default: + return PM_ERR_PMID; + } + + return 0; +} + +static int +fill_timeout(unsigned int item, pmAtomValue *atom) +{ + switch (item) { + case 21: + atom->ul = stats->timeouts.call; + break; + case 22: + atom->ul = stats->timeouts.control; + break; + case 23: + atom->ul = stats->timeouts.traverse; + break; + default: + return PM_ERR_PMID; + } + + return 0; +} + +/* + * callback provided to pmdaFetch + */ +static int +pmda_ctdb_fetch_cb(pmdaMetric *mdesc, unsigned int inst, pmAtomValue *atom) +{ + int ret; + __pmID_int *id = (__pmID_int *)&(mdesc->m_desc.pmid); + + if (inst != PM_IN_NULL) { + return PM_ERR_INST; + } + + if (stats == NULL) { + fprintf(stderr, "stats not available\n"); + ret = PM_ERR_VALUE; + goto err_out; + } + + + switch (id->cluster) { + case 0: + atom->ul = stats->num_clients; + break; + case 1: + atom->ul = stats->frozen; + break; + case 3: + atom->ul = stats->recovering; + break; + case 4: + atom->ul = stats->client_packets_sent; + break; + case 5: + atom->ul = stats->client_packets_recv; + break; + case 6: + atom->ul = stats->node_packets_sent; + break; + case 7: + atom->ul = stats->node_packets_recv; + break; + case 8: + atom->ul = stats->keepalive_packets_sent; + break; + case 9: + atom->ul = stats->keepalive_packets_recv; + break; + case 10: + ret = fill_node(id->item, atom); + if (ret) { + goto err_out; + } + break; + case 11: + ret = fill_client(id->item, atom); + if (ret) { + goto err_out; + } + break; + case 12: + ret = fill_timeout(id->item, atom); + if (ret) { + goto err_out; + } + break; + case 13: + atom->ul = stats->total_calls; + break; + case 14: + atom->ul = stats->pending_calls; + break; + case 15: + atom->ul = stats->locks.num_calls; + break; + case 16: + atom->ul = stats->locks.num_pending; + break; + case 17: + atom->ul = stats->childwrite_calls; + break; + case 18: + atom->ul = stats->pending_childwrite_calls; + break; + case 19: + atom->ul = stats->memory_used; + break; + case 20: + atom->ul = stats->max_hop_count; + break; + case 21: + atom->d = stats->reclock.ctdbd.max; + break; + case 22: + atom->d = stats->reclock.recd.max; + break; + case 23: + atom->d = stats->call_latency.max; + break; + case 24: + atom->d = stats->locks.latency.max; + break; + case 25: + atom->d = stats->childwrite_latency.max; + break; + case 26: + atom->d = stats->num_recoveries; + break; + default: + return PM_ERR_PMID; + } + + ret = 0; +err_out: + return ret; +} + +/* + * This routine is called once for each pmFetch(3) operation, so is a + * good place to do once-per-fetch functions, such as value caching or + * instance domain evaluation. + */ +static int +pmda_ctdb_fetch(int numpmid, pmID pmidlist[], pmResult **resp, pmdaExt *pmda) +{ + int ret; + TDB_DATA data; + int32_t res; + struct timeval ctdb_timeout; + + if (ctdb == NULL) { + fprintf(stderr, "attempting reconnect to ctdbd\n"); + ret = pmda_ctdb_daemon_connect(); + if (ret < 0) { + fprintf(stderr, "reconnect failed\n"); + return PM_ERR_VALUE; + } + } + + ctdb_timeout = timeval_current_ofs(1, 0); + ret = ctdb_control(ctdb, ctdb->pnn, 0, + CTDB_CONTROL_STATISTICS, 0, tdb_null, + ctdb, &data, &res, &ctdb_timeout, NULL); + + if (ret != 0 || res != 0) { + fprintf(stderr, "ctdb control for statistics failed, reconnecting\n"); + pmda_ctdb_daemon_disconnect(); + ret = PM_ERR_VALUE; + goto err_out; + } + + stats = (struct ctdb_statistics *)data.dptr; + + if (data.dsize != sizeof(struct ctdb_statistics)) { + fprintf(stderr, "incorrect statistics size %zu - not %zu\n", + data.dsize, sizeof(struct ctdb_statistics)); + ret = PM_ERR_VALUE; + goto err_stats; + } + + ret = pmdaFetch(numpmid, pmidlist, resp, pmda); + +err_stats: + talloc_free(stats); +err_out: + return ret; +} + +/* + * Initialise the agent + */ +void +pmda_ctdb_init(pmdaInterface *dp) +{ + if (dp->status != 0) { + return; + } + + dp->version.two.fetch = pmda_ctdb_fetch; + pmdaSetFetchCallBack(dp, pmda_ctdb_fetch_cb); + + pmdaInit(dp, NULL, 0, metrictab, + (sizeof(metrictab) / sizeof(metrictab[0]))); +} + +static char * +helpfile(void) +{ + static char buf[MAXPATHLEN]; + + if (!buf[0]) { + snprintf(buf, sizeof(buf), "%s/ctdb/help", + pmGetConfig("PCP_PMDAS_DIR")); + } + return buf; +} + +static void +usage(void) +{ + fprintf(stderr, "Usage: %s [options]\n\n", pmProgname); + fputs("Options:\n" + " -d domain use domain (numeric) for metrics domain of PMDA\n" + " -l logfile write log into logfile rather than using default log name\n" + "\nExactly one of the following options may appear:\n" + " -i port expect PMCD to connect on given inet port (number or name)\n" + " -p expect PMCD to supply stdin/stdout (pipe)\n" + " -u socket expect PMCD to connect on given unix domain socket\n", + stderr); + exit(1); +} + +/* + * Set up the agent if running as a daemon. + */ +int +main(int argc, char **argv) +{ + int err = 0; + char log_file[] = "pmda_ctdb.log"; + pmdaInterface dispatch; + + __pmSetProgname(argv[0]); + + pmdaDaemon(&dispatch, PMDA_INTERFACE_2, pmProgname, CTDB, + log_file, helpfile()); + + if (pmdaGetOpt(argc, argv, "d:i:l:pu:?", &dispatch, &err) != EOF) { + err++; + } + + if (err) { + usage(); + } + + pmdaOpenLog(&dispatch); + pmda_ctdb_init(&dispatch); + pmdaConnect(&dispatch); + pmdaMain(&dispatch); + + exit(0); +} + diff --git a/ctdb/utils/pmda/pmns b/ctdb/utils/pmda/pmns new file mode 100644 index 00000000000..dc7e3ac2bfa --- /dev/null +++ b/ctdb/utils/pmda/pmns @@ -0,0 +1,73 @@ +/* + * Metrics for CTDB PMDA + * + * Copyright (c) 2000-2004 Silicon Graphics, Inc. All Rights Reserved. + * Copyright (c) 2011 David Disseldorp + * + * This program is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License as published by the + * Free Software Foundation; either version 2 of the License, or (at your + * option) any later version. + * + * This program is distributed in the hope that it will be useful, but + * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY + * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * for more details. + * + * You should have received a copy of the GNU General Public License along + * with this program; if not, write to the Free Software Foundation, Inc., + * 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA + */ + +ctdb { + num_clients CTDB:0:0 + frozen CTDB:0:1 + recovering CTDB:0:2 + client_packets_sent CTDB:0:3 + client_packets_recv CTDB:0:4 + node_packets_sent CTDB:0:5 + node_packets_recv CTDB:0:6 + keepalive_packets_sent CTDB:0:7 + keepalive_packets_recv CTDB:0:8 + node + client + timeouts + total_calls CTDB:0:9 + pending_calls CTDB:0:10 + lockwait_calls CTDB:0:11 + pending_lockwait_calls CTDB:0:12 + childwrite_calls CTDB:0:13 + pending_childwrite_calls CTDB:0:14 + memory_used CTDB:0:15 + max_hop_count CTDB:0:16 + max_reclock_ctdbd CTDB:0:17 + max_reclock_recd CTDB:0:18 + max_call_latency CTDB:0:19 + max_lockwait_latency CTDB:0:20 + max_childwrite_latency CTDB:0:21 + num_recoveries CTDB:0:22 +} + +ctdb.node { + req_call CTDB:1:0 + reply_call CTDB:1:1 + req_dmaster CTDB:1:2 + reply_dmaster CTDB:1:3 + reply_error CTDB:1:4 + req_message CTDB:1:5 + req_control CTDB:1:6 + reply_control CTDB:1:7 +} + +ctdb.client { + req_call CTDB:2:0 + req_message CTDB:2:1 + req_control CTDB:2:2 +} + +ctdb.timeouts { + call CTDB:3:0 + control CTDB:3:1 + traverse CTDB:3:2 +} + diff --git a/ctdb/utils/pmda/root b/ctdb/utils/pmda/root new file mode 100644 index 00000000000..ff036ed7fbd --- /dev/null +++ b/ctdb/utils/pmda/root @@ -0,0 +1,10 @@ +/* + * fake "root" for validating the local PMNS subtree + */ + +#include <stdpmid> + +root { ctdb } + +#include "pmns" + diff --git a/ctdb/utils/scsi_io/scsi_io.c b/ctdb/utils/scsi_io/scsi_io.c new file mode 100644 index 00000000000..1a4fe0ef699 --- /dev/null +++ b/ctdb/utils/scsi_io/scsi_io.c @@ -0,0 +1,1152 @@ +/* a tool to open a scsi device and issue some useful commands + such as INQUIRY and helpers to call various PERSISTENT RESERVATION + functions + + Copyright ronnie sahlberg 2007 + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program; if not, see <http://www.gnu.org/licenses/>. +*/ + +/* very incomplete and needs to be enhanced with noice command line options + to drive it. + we need access to an array that supports the PERSISTENT RESERVATION cdb's + before we can proceed +*/ +/* scsi bugs: + INQUIRY takes a 2 byte allocation_length parameter but it appears that + it only looks at the low byte. If you specify 0x00ff all is well + but if you specify 0x0100 it gets confused and returnes garbage data + for (e.g) SupportedVPDPages. Same goes for UnitSerialNumber and probably all + other inq pages as well. + +*/ + +#include <unistd.h> +#include <fcntl.h> +#include <stdio.h> +#include <string.h> +#include <errno.h> +#include <sys/ioctl.h> +#include <scsi/sg.h> +#include "popt.h" + + +#define SCSI_TIMEOUT 5000 /* ms */ + +static char *command = NULL; +static char *device = NULL; +static char *key = NULL; +static char *rmkey = NULL; +static int scope = -1; +static int type = -1; + +const char *sensetable[16]={ + "no sense", + "recovered error", + "not ready", + "medium error", + "hardware error", + "illegal request", + "unit attention", + "data protect", + "blank check", + "vendor specific", + "copy aborted", + "aboreted command", + "unknown", + "unknown", + "unknown", + "unknown" +}; + +int scsi_io(int fd, unsigned char *cdb, unsigned char cdb_size, int xfer_dir, unsigned char *data, unsigned int *data_size, unsigned char *sense, unsigned int *sense_len) +{ + sg_io_hdr_t io_hdr; + + memset(&io_hdr, 0, sizeof(sg_io_hdr_t)); + io_hdr.interface_id = 'S'; + + /* CDB */ + io_hdr.cmdp = cdb; + io_hdr.cmd_len = cdb_size; + + /* Where to store the sense_data, if there was an error */ + io_hdr.sbp = sense; + io_hdr.mx_sb_len = *sense_len; + *sense_len=0; + + /* Transfer direction, either in or out. Linux does not yet + support bidirectional SCSI transfers ? + */ + io_hdr.dxfer_direction = xfer_dir; + + /* Where to store the DATA IN/OUT from the device and how big the + buffer is + */ + io_hdr.dxferp = data; + io_hdr.dxfer_len = *data_size; + + /* SCSI timeout in ms */ + io_hdr.timeout = SCSI_TIMEOUT; + + + if(ioctl(fd, SG_IO, &io_hdr) < 0){ + perror("SG_IO ioctl failed"); + return -1; + } + + /* now for the error processing */ + if((io_hdr.info & SG_INFO_OK_MASK) != SG_INFO_OK){ + if(io_hdr.sb_len_wr > 0){ + *sense_len=io_hdr.sb_len_wr; + return 0; + } + } + if(io_hdr.masked_status){ + printf("status=0x%x\n", io_hdr.status); + printf("masked_status=0x%x\n", io_hdr.masked_status); + return -2; + } + if(io_hdr.host_status){ + printf("host_status=0x%x\n", io_hdr.host_status); + return -3; + } + if(io_hdr.driver_status){ + printf("driver_status=0x%x\n", io_hdr.driver_status); + return -4; + } + +#if 0 +{int i; +printf("CDB:\n"); +for(i=0;i<cdb_size;i++){printf("0x%02x ",cdb[i]);if((i%8)==7)printf("\n");} +printf("\n"); +} +{int i; +printf("DATA:\n"); +for(i=0;i<96;i++){printf("0x%02x ",data[i]);if((i%8)==7)printf("\n");} +printf("\n"); +} +#endif + + return 0; +} + +typedef struct _value_string_t { + int value; + const char *string; +} value_string_t; + + + +value_string_t peripheral_device_types[] = { + {0, "SBC : Direct Access Block device"}, + {1, "SSC : Sequential Access Device"}, + {5, "MMC : Multimedia Device"}, + {17,"OSD : Object Based Storage"}, + {0,NULL} +}; + +value_string_t scsi_versions[] = { + {0, "No conformance to any standard claimed"}, + {3, "SPC"}, + {4, "SPC-2"}, + {5, "SPC-3"}, + {0,NULL} +}; + +value_string_t vpd_pages[] = { + {0x00, "Supported VPD Pages"}, + {0x80, "Unit Serial number"}, + {0x83, "Device Identification"}, + {0,NULL} +}; + +const char *val_to_str(value_string_t *vs, int v) +{ + while(vs && vs->string){ + if(vs->value==v){ + return vs->string; + } + vs++; + } + return ""; +} + +void print_sense_data(unsigned char *sense, int sense_len) +{ + int i; + unsigned char asc, ascq; + + printf("Device returned sense information\n"); + if(sense[0]==0x70){ + printf("filemark:%d eom:%d ili:%d sense-key:0x%02x (%s)\n", + !!(sense[2]&0x80), + !!(sense[2]&0x40), + !!(sense[2]&0x20), + sense[2]&0x0f, + sensetable[sense[2]&0x0f]); + printf("command specific info: 0x%02x 0x%02x 0x%02x 0x%02x\n", + sense[8],sense[9],sense[10],sense[11]); + + asc=sense[12]; + printf("additional sense code:0x%02x\n", asc); + + ascq=sense[13]; + printf("additional sense code qualifier:0x%02x\n", ascq); + + printf("field replacable unit code:0x%02x\n", sense[14]); + + if((asc==0x20)&&(ascq==0x00)) + printf("INVALID COMMAND OPERATION CODE\n"); + } + + printf("Sense data:\n"); + for(i=0;i<sense_len;i++){ + printf("0x%02x ", sense[i]); + if((i%8)==7)printf("\n"); + } + printf("\n"); +} + +int scsi_inquiry(int fd) +{ + unsigned char cdb[]={0x12,0,0,0,0,0}; + + unsigned int data_size=96; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + + int res, i; + + cdb[3]=(data_size>>8)&0xff; + cdb[4]=data_size&0xff; + + + printf("Standard INQUIRY Data:\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* Peripheral Qualifier */ + printf("Peripheral Qualifier:%c%c%cb\n", + '0'+!!(data[0]&0x80), + '0'+!!(data[0]&0x40), + '0'+!!(data[0]&0x20)); + + /* Peripheral Device Type */ + printf("Peripheral Device Type: 0x%02x (%s)\n", + data[0]&0x1f, + val_to_str(peripheral_device_types, data[0]&0x1f)); + + /* RMB */ + printf("RMB: %s device\n", data[1]&0x80?"REMOVABLE":"NON-REMOVABLE"); + + /* SCSI Version */ + printf("SCSI Version: 0x%02x (%s)\n", + data[2], + val_to_str(scsi_versions, data[2])); + + /* NormACA, HiSUP, Response Data Format */ + printf("NormACA:%d HiSup:%d ResponseDataFormat:%d\n", + !!(data[3]&0x20), + !!(data[3]&0x10), + data[3]&0x0f); + + switch(data[3]&0x0f){ + /*SPC-2/SPC-3/SPC-4*/ + case 2: + /*SPC (not strictly correct but we print it like 2 anyway)*/ + case 1: + /* SCCS ... */ + printf("SCCS:%d ACC:%d TPGS:%c%cb 3PC:%d PROTECT:%d\n", + !!(data[5]&0x80), + !!(data[5]&0x40), + '0'+!!(data[5]&0x20), + '0'+!!(data[5]&0x10), + !!(data[5]&0x08), + !!(data[5]&0x01)); + + /* Encserv ... */ + printf("Encserv:%d VS:%d MultiP:%d ADDR16:%d\n", + !!(data[6]&0x40), + !!(data[6]&0x20), + !!(data[6]&0x10), + !!(data[6]&0x01)); + + /* WBUS16 ... */ + printf("WBUS16:%d SYNC:%d CmdQue:%d VS:%d\n", + !!(data[7]&0x20), + !!(data[7]&0x10), + !!(data[7]&0x02), + !!(data[7]&0x01)); + + + /* T10 vendor Identification */ + printf("Vendor:"); + for(i=0;i<8;i++)printf("%c",data[8+i]);printf("\n"); + + /* Product Identification */ + printf("Product:"); + for(i=0;i<16;i++)printf("%c",data[16+i]);printf("\n"); + + /* Product Revision Level */ + printf("Product Revision:"); + for(i=0;i<4;i++)printf("%c",data[32+i]);printf("\n"); + + break; + } + + return 0; +} + +int scsi_inquiry_supported_vpd_pages(int fd) +{ + unsigned char cdb[]={0x12,0x01,0,0,0,0}; + + unsigned int data_size=0xff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + + int res, pl, i; + + cdb[3]=(data_size>>8)&0xff; + cdb[4]=data_size&0xff; + + + printf("INQUIRY Supported VPD Pages:\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* Page Length */ + pl=data[3]; + + /* Pages */ + for(i=4;i<(pl+4);i++){ + printf("Page:%02xh (%s)\n", + data[i], + val_to_str(vpd_pages, data[i])); + } + + return 0; +} + +int scsi_inquiry_unit_serial_number(int fd) +{ + unsigned char cdb[]={0x12,0x01,0x80,0,0,0}; + + unsigned int data_size=0x00ff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + + int res, pl, i; + + cdb[3]=(data_size>>8)&0xff; + cdb[4]=data_size&0xff; + + + printf("INQUIRY Unit Serial Number:\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* Page Length */ + pl=data[3]; + + /* Unit Serial Number */ + printf("Unit Serial Number:"); + for(i=4;i<(pl+4);i++)printf("%c",data[i]&0xff);printf("\n"); + + return 0; +} + +int scsi_persistent_reserve_in_read_keys(int fd) +{ + unsigned char cdb[]={0x5e,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=0x00ff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=0; + int res, i; + unsigned long prgeneration, additional_length; + + cdb[1]=service_action; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + + printf("PRESISTENT RESERVE IN: READ KEYS\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* PRGeneration */ + prgeneration=data[0]; + prgeneration<<=8;prgeneration|=data[1]; + prgeneration<<=8;prgeneration|=data[2]; + prgeneration<<=8;prgeneration|=data[3]; + printf("PRGeneration:%lu\n", prgeneration); + + /* Additional Length */ + additional_length=data[4]; + additional_length<<=8;additional_length|=data[5]; + additional_length<<=8;additional_length|=data[6]; + additional_length<<=8;additional_length|=data[7]; + printf("Additional Length:%lu\n", additional_length); + + /* print the registered keys */ + for(i=0;i<additional_length;i+=8){ + printf("Key:%02x%02x%02x%02x%02x%02x%02x%02x\n", + data[i+8], + data[i+9], + data[i+10], + data[i+11], + data[i+12], + data[i+13], + data[i+14], + data[i+15]); + } + + return 0; +} + +int scsi_persistent_reserve_in_read_reservation(int fd) +{ + unsigned char cdb[]={0x5e,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=0x00ff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=1; + int res; + unsigned long prgeneration, additional_length; + + cdb[1]=service_action; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + + printf("PRESISTENT RESERVE IN: READ RESERVATION\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* PRGeneration */ + prgeneration=data[0]; + prgeneration<<=8;prgeneration|=data[1]; + prgeneration<<=8;prgeneration|=data[2]; + prgeneration<<=8;prgeneration|=data[3]; + printf("PRGeneration:%lu\n", prgeneration); + + /* Additional Length */ + additional_length=data[4]; + additional_length<<=8;additional_length|=data[5]; + additional_length<<=8;additional_length|=data[6]; + additional_length<<=8;additional_length|=data[7]; + printf("Additional Length:%lu\n", additional_length); + + if(additional_length==16){ + printf("Key:%02x%02x%02x%02x%02x%02x%02x%02x\n", + data[8], + data[9], + data[10], + data[11], + data[12], + data[13], + data[14], + data[15]); + printf("Scope:%xh Type:%xh\n",data[21]>>4,data[21]&0x0f); + } + + return 0; +} + +int scsi_persistent_reserve_in_report_capabilities(int fd) +{ + unsigned char cdb[]={0x5e,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=0x00ff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=2; + int res; + unsigned short length, type_mask; + + cdb[1]=service_action; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + + printf("PRESISTENT RESERVE IN: REPORT CAPABILITIES\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* Length */ + length=data[0]; + length<<=8;length|=data[1]; + printf("Length:%d\n", length); + + /* CRH ... */ + printf("CRH:%d SIP_C:%d ATP_C:%d PTPL_C:%d\n", + !!(data[2]&0x10), + !!(data[2]&0x08), + !!(data[2]&0x04), + !!(data[2]&0x01)); + + /* TMV ... */ + printf("TMV:%d ALLOW_COMMANDS:%c%c%cb PTPL_A:%d\n", + !!(data[3]&0x80), + '0'+(!!(data[3]&0x40)), + '0'+(!!(data[3]&0x20)), + '0'+(!!(data[3]&0x10)), + !!(data[3]&0x01)); + + /* Persistent Reservation Type Mask */ + type_mask=data[4]; + type_mask<<=8;type_mask|=data[5]; + printf("Presistent Reservation Type Mask:0x%04x\n", type_mask); + printf("WR_EX_AR:%d EX_AC_RO:%d WR_EX_RO:%d EX_AC:%d WR_EX:%d EX_AC_AR:%d\n", + !!(data[4]&0x80), + !!(data[4]&0x40), + !!(data[4]&0x20), + !!(data[4]&0x08), + !!(data[4]&0x02), + !!(data[4]&0x01)); + + return 0; +} + +int scsi_persistent_reserve_in_read_full_status(int fd) +{ + unsigned char cdb[]={0x5e,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=0x00ff; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=3; + int res; + unsigned long prgeneration, additional_length; + + cdb[1]=service_action; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + + printf("PRESISTENT RESERVE IN: READ FULL STATUS\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_FROM_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + /* PRGeneration */ + prgeneration=data[0]; + prgeneration<<=8;prgeneration|=data[1]; + prgeneration<<=8;prgeneration|=data[2]; + prgeneration<<=8;prgeneration|=data[3]; + printf("PRGeneration:%lu\n", prgeneration); + + /* Additional Length */ + additional_length=data[4]; + additional_length<<=8;additional_length|=data[5]; + additional_length<<=8;additional_length|=data[6]; + additional_length<<=8;additional_length|=data[7]; + printf("Additional Length:%lu\n", additional_length); + +/*XXX*/ + + return 0; +} + +int scsi_persistent_reserve_out_clear(int fd) +{ + unsigned char cdb[]={0x5f,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=24; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=3; + int res; + + long long k; + + if (scope==-1) { + printf("Must specify scope\n"); + printf("scsi_io --device=<DEVICE> --command=clear --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (type==-1) { + printf("Must specify type\n"); + printf("scsi_io --device=<DEVICE> --command=clear --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (!key) { + printf("Must specify key\n"); + printf("scsi_io --device=<DEVICE> --command=clear --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + + sscanf(key, "%llx", &k); + cdb[1]=service_action; + cdb[2]=(scope<<4)|type; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + memset(data, 0, data_size); + + /* Reservation Key */ + data[0]=(k>>56)&0xff; + data[1]=(k>>48)&0xff; + data[2]=(k>>40)&0xff; + data[3]=(k>>32)&0xff; + data[4]=(k>>24)&0xff; + data[5]=(k>>16)&0xff; + data[6]=(k>> 8)&0xff; + data[7]=(k )&0xff; + + /* Service Action Key */ + data[8]=0; + data[9]=0; + data[10]=0; + data[11]=0; + data[12]=0; + data[13]=0; + data[14]=0; + data[15]=0; + + /* Spec_ip_ti=0 all_tg_pt=1 aptpl=0 */ + data[20]=0x04; + + printf("PRESISTENT RESERVE IN: CLEAR\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_TO_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + return 0; +} + +int scsi_persistent_reserve_out_reserve(int fd) +{ + unsigned char cdb[]={0x5f,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=24; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=1; + int res; + long long k; + + if (scope==-1) { + printf("Must specify scope\n"); + printf("scsi_io --device=<DEVICE> --command=reserve --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (type==-1) { + printf("Must specify type\n"); + printf("scsi_io --device=<DEVICE> --command=reserve --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (!key) { + printf("Must specify key\n"); + printf("scsi_io --device=<DEVICE> --command=reserve --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + + sscanf(key, "%llx", &k); + + + cdb[1]=service_action; + cdb[2]=(scope<<4)|type; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + memset(data, 0, data_size); + + /* Reservation Key */ + data[0]=(k>>56)&0xff; + data[1]=(k>>48)&0xff; + data[2]=(k>>40)&0xff; + data[3]=(k>>32)&0xff; + data[4]=(k>>24)&0xff; + data[5]=(k>>16)&0xff; + data[6]=(k>> 8)&0xff; + data[7]=(k )&0xff; + + /* Service Action Key */ + data[8]=0; + data[9]=0; + data[10]=0; + data[11]=0; + data[12]=0; + data[13]=0; + data[14]=0; + data[15]=0; + + /* Spec_ip_ti=0 all_tg_pt=1 aptpl=0 */ + data[20]=0x04; + + printf("PRESISTENT RESERVE IN: RESERVE\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_TO_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + return 0; +} + +int scsi_persistent_reserve_out_preempt(int fd) +{ + unsigned char cdb[]={0x5f,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=24; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=4; + int res; + long long k; + + if (scope==-1) { + printf("Must specify scope\n"); + printf("scsi_io --device=<DEVICE> --command=preempt --scope=<SCOPE> --type=<TYPE> --key=<KEY> --rmkey=<KEY>\n"); + _exit(10); + } + if (type==-1) { + printf("Must specify type\n"); + printf("scsi_io --device=<DEVICE> --command=preempt --scope=<SCOPE> --type=<TYPE> --key=<KEY> --rmkey=<KEY>\n"); + _exit(10); + } + if (!key) { + printf("Must specify key\n"); + printf("scsi_io --device=<DEVICE> --command=preempt --scope=<SCOPE> --type=<TYPE> --key=<KEY> --rmkey=<KEY>\n"); + _exit(10); + } + if (!rmkey) { + printf("Must specify rmkey\n"); + printf("scsi_io --device=<DEVICE> --command=preempt --scope=<SCOPE> --type=<TYPE> --key=<KEY> --rmkey=<KEY>\n"); + _exit(10); + } + + + + cdb[1]=service_action; + cdb[2]=(scope<<4)|type; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + memset(data, 0, data_size); + + /* Reservation Key */ + sscanf(key, "%llx", &k); + data[0]=(k>>56)&0xff; + data[1]=(k>>48)&0xff; + data[2]=(k>>40)&0xff; + data[3]=(k>>32)&0xff; + data[4]=(k>>24)&0xff; + data[5]=(k>>16)&0xff; + data[6]=(k>> 8)&0xff; + data[7]=(k )&0xff; + + /* Service Action Key */ + sscanf(rmkey, "%llx", &k); + data[8] =(k>>56)&0xff; + data[9] =(k>>48)&0xff; + data[10]=(k>>40)&0xff; + data[11]=(k>>32)&0xff; + data[12]=(k>>24)&0xff; + data[13]=(k>>16)&0xff; + data[14]=(k>> 8)&0xff; + data[15]=(k )&0xff; + + /* Spec_ip_ti=0 all_tg_pt=1 aptpl=0 */ + data[20]=0x04; + + printf("PRESISTENT RESERVE IN: RESERVE\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_TO_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + return 0; +} + +int scsi_persistent_reserve_out_register_and_ignore_existing_key(int fd) +{ + unsigned char cdb[]={0x5f,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=24; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=6; + int res; + long long k; + + if (scope==-1) { + printf("Must specify scope\n"); + printf("scsi_io --device=<DEVICE> --command=registerkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (type==-1) { + printf("Must specify type\n"); + printf("scsi_io --device=<DEVICE> --command=registerkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (!key) { + printf("Must specify key\n"); + printf("scsi_io --device=<DEVICE> --command=registerkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + + sscanf(key, "%llx", &k); + + cdb[1]=service_action; + cdb[2]=(scope<<4)|type; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + memset(data, 0, data_size); + + /* Reservation Key */ + data[0]=0; + data[1]=0; + data[2]=0; + data[3]=0; + data[4]=0; + data[5]=0; + data[6]=0; + data[7]=0; + + /* Service Action Key */ + data[8] =(k>>56)&0xff; + data[9] =(k>>48)&0xff; + data[10]=(k>>40)&0xff; + data[11]=(k>>32)&0xff; + data[12]=(k>>24)&0xff; + data[13]=(k>>16)&0xff; + data[14]=(k>> 8)&0xff; + data[15]=(k )&0xff; + + /* Spec_ip_ti=0 all_tg_pt=1 aptpl=0 */ + data[20]=0x04; + + printf("PRESISTENT RESERVE IN: REGISTER AND IGNORE EXISTING KEY\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_TO_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + return 0; +} + +int scsi_persistent_reserve_out_unregister_key(int fd) +{ + unsigned char cdb[]={0x5f,0,0,0,0,0,0,0,0,0}; + + unsigned int data_size=24; + unsigned char data[data_size]; + + unsigned int sense_len=32; + unsigned char sense[sense_len]; + unsigned char service_action=6; + int res; + long long k; + + if (scope==-1) { + printf("Must specify scope\n"); + printf("scsi_io --device=<DEVICE> --command=unregisterkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (type==-1) { + printf("Must specify type\n"); + printf("scsi_io --device=<DEVICE> --command=unregisterkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + if (!key) { + printf("Must specify key\n"); + printf("scsi_io --device=<DEVICE> --command=unregisterkey --scope=<SCOPE> --type=<TYPE> --key=<KEY>\n"); + _exit(10); + } + + sscanf(key, "%llx", &k); + + cdb[1]=service_action; + cdb[2]=(scope<<4)|type; + cdb[7]=(data_size>>8)&0xff; + cdb[8]=data_size&0xff; + + memset(data, 0, data_size); + + /* Reservation Key */ + data[0]=(k>>56)&0xff; + data[1]=(k>>48)&0xff; + data[2]=(k>>40)&0xff; + data[3]=(k>>32)&0xff; + data[4]=(k>>24)&0xff; + data[5]=(k>>16)&0xff; + data[6]=(k>> 8)&0xff; + data[7]=(k )&0xff; + + /* Service Action Key */ + data[8]=0; + data[9]=0; + data[10]=0; + data[11]=0; + data[12]=0; + data[13]=0; + data[14]=0; + data[15]=0; + + /* Spec_ip_ti=0 all_tg_pt=1 aptpl=0 */ + data[20]=0x04; + + printf("PRESISTENT RESERVE IN: UNREGISTER KEY\n"); + + res=scsi_io(fd, cdb, sizeof(cdb), SG_DXFER_TO_DEV, data, &data_size, sense, &sense_len); + if(res){ + printf("SCSI_IO failed\n"); + return -1; + } + if(sense_len){ + print_sense_data(sense, sense_len); + return -1; + } + + return 0; +} + + + + +int open_scsi_device(const char *dev) +{ + int fd, vers; + + if((fd=open(dev, O_RDWR))<0){ + printf("ERROR could not open device %s\n", dev); + return -1; + } + if ((ioctl(fd, SG_GET_VERSION_NUM, &vers) < 0) || (vers < 30000)) { + printf("/dev is not an sg device, or old sg driver\n"); + close(fd); + return -1; + } + + return fd; +} + +typedef int (*scsi_func_t)(int fd); +typedef struct _cmds_t { + const char *cmd; + scsi_func_t func; + const char *comment; +} cmds_t; +cmds_t cmds[] = { + {"inq", scsi_inquiry, "Standard INQUIRY output"}, + {"vpd", scsi_inquiry_supported_vpd_pages, "Supported VPD Pages"}, + {"usn", scsi_inquiry_unit_serial_number, "Unit serial number"}, + {"readkeys", scsi_persistent_reserve_in_read_keys, "Read SCSI Reservation Keys"}, + {"readrsvr", scsi_persistent_reserve_in_read_reservation, "Read SCSI Reservation Data"}, + {"reportcap", scsi_persistent_reserve_in_report_capabilities, "Report reservation Capabilities"}, + {"registerkey", scsi_persistent_reserve_out_register_and_ignore_existing_key, "Register and ignore existing key"}, + {"unregisterkey", scsi_persistent_reserve_out_unregister_key, "Unregister a key"}, + {"clear", scsi_persistent_reserve_out_clear, "Clear all reservations and registrations"}, + {"reserve", scsi_persistent_reserve_out_reserve, "Reserve"}, + {"preempt", scsi_persistent_reserve_out_preempt, "Preempt (remove someone elses registration)"}, +}; + +void usage(void) +{ + int i; + printf("Usage: scsi_io --command <command> --device <device>\n"); + printf("Commands:\n"); + for (i=0;i<sizeof(cmds)/sizeof(cmds[0]);i++){ + printf(" %s %s\n", cmds[i].cmd, cmds[i].comment); + } +} + + +int main(int argc, const char *argv[]) +{ + int i, fd; + int opt; + scsi_func_t func=NULL; + struct poptOption popt_options[] = { + POPT_AUTOHELP + { "scope", 's', POPT_ARG_INT, &scope, 0, "scope", "integer" }, + { "type", 't', POPT_ARG_INT, &type, 0, "type", "integer" }, + { "key", 'k', POPT_ARG_STRING, &key, 0, "key", "key" }, + { "rmkey", 'r', POPT_ARG_STRING, &rmkey, 0, "rmkey", "rmkey" }, + { "command", 'c', POPT_ARG_STRING, &command, 0, "command", "command" }, + { "device", 'd', POPT_ARG_STRING, &device, 0, "device", "device" }, +// { "machinereadable", 'Y', POPT_ARG_NONE, &options.machinereadable, 0, "enable machinereadable output", NULL }, + POPT_TABLEEND + }; + poptContext pc; + + pc = poptGetContext(argv[0], argc, argv, popt_options, POPT_CONTEXT_KEEP_FIRST); + + while ((opt = poptGetNextOpt(pc)) != -1) { + switch (opt) { + default: + fprintf(stderr, "Invalid option %s: %s\n", + poptBadOption(pc, 0), poptStrerror(opt)); + _exit(1); + } + } + + if (!command) { + printf("Must specify the command\n"); + usage(); + _exit(10); + } + + if (!device) { + printf("Must specify the device\n"); + usage(); + _exit(10); + } + + fd=open_scsi_device(device); + if(fd<0){ + printf("Could not open SCSI device %s\n",device); + usage(); + _exit(10); + } + + for (i=0;i<sizeof(cmds)/sizeof(cmds[0]);i++){ + if(!strcmp(cmds[i].cmd, command)) { + func = cmds[i].func; + break; + } + } + if (!func) { + printf("Unrecognized command : %s\n", command); + usage(); + _exit(10); + } + + func(fd); + +#if 0 + scsi_persistent_reserve_in_read_full_status(fd); + scsi_persistent_reserve_out_register_and_ignore_existing_key(fd); + scsi_persistent_reserve_in_read_keys(fd); + + scsi_persistent_reserve_out_reserve(fd); + scsi_persistent_reserve_in_read_reservation(fd); + + scsi_persistent_reserve_out_clear(fd); + scsi_persistent_reserve_in_read_reservation(fd); + + scsi_persistent_reserve_out_unregister_key(fd); + scsi_persistent_reserve_in_read_keys(fd); +#endif + return 0; +} diff --git a/ctdb/utils/smnotify/smnotify.c b/ctdb/utils/smnotify/smnotify.c new file mode 100644 index 00000000000..d7fd54626e2 --- /dev/null +++ b/ctdb/utils/smnotify/smnotify.c @@ -0,0 +1,150 @@ +/* + simple smnotify tool + + Copyright (C) Ronnie Sahlberg 2007 + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program; if not, see <http://www.gnu.org/licenses/>. +*/ +#include <stdio.h> +#include <unistd.h> +#include <string.h> +#include <sys/types.h> +#include <sys/socket.h> +#include <netinet/in.h> +#include <arpa/inet.h> +#include "smnotify.h" +#include "popt.h" + +static char *client = NULL; +static const char *ip = NULL; +static char *server = NULL; +static int stateval = 0; +static int clientport = 0; +static int sendport = 0; + +static void useage(void) +{ + exit(0); +} + +static int create_socket(const char *addr, int port) +{ + int s; + struct sockaddr_in sock_in; + + s = socket(PF_INET, SOCK_DGRAM, IPPROTO_UDP); + if (s == -1) { + printf("Failed to open local socket\n"); + exit(10); + } + + bzero(&sock_in, sizeof(sock_in)); + sock_in.sin_family = PF_INET; + sock_in.sin_port = htons(port); + inet_aton(addr, &sock_in.sin_addr); + if (bind(s, (struct sockaddr *)&sock_in, sizeof(sock_in)) == -1) { + printf("Failed to bind to local socket\n"); + exit(10); + } + + return s; +} + +int main(int argc, const char *argv[]) +{ + struct poptOption popt_options[] = { + POPT_AUTOHELP + { "client", 'c', POPT_ARG_STRING, &client, 0, "remote client to send the notify to", "hostname/ip" }, + { "clientport", 0, POPT_ARG_INT, &clientport, 0, "clientport", "integer" }, + { "ip", 'i', POPT_ARG_STRING, &ip, 0, "local ip address to send the notification from", "ip" }, + { "sendport", 0, POPT_ARG_INT, &sendport, 0, "port to send the notify from", "integer" }, + { "server", 's', POPT_ARG_STRING, &server, 0, "servername to use in the notification", "hostname/ip" }, + { "stateval", 0, POPT_ARG_INT, &stateval, 0, "stateval", "integer" }, + POPT_TABLEEND + }; + int opt; + poptContext pc; + CLIENT *clnt; + int s; + struct sockaddr_in sock_cl; + struct timeval w; + struct status st; + + pc = poptGetContext(argv[0], argc, argv, popt_options, POPT_CONTEXT_KEEP_FIRST); + + while ((opt = poptGetNextOpt(pc)) != -1) { + switch (opt) { + default: + fprintf(stderr, "Invalid option %s: %s\n", + poptBadOption(pc, 0), poptStrerror(opt)); + exit(1); + } + } + + if (client == NULL) { + printf("ERROR: client not specified\n"); + useage(); + } + + if (ip == NULL) { + printf("ERROR: ip not specified\n"); + useage(); + } + + if (server == NULL) { + printf("ERROR: server not specified\n"); + useage(); + } + + if (stateval == 0) { + printf("ERROR: stateval not specified\n"); + useage(); + } + + + /* Since we want to control from which address these packets are + sent we must create the socket ourself and use low-level rpc + calls. + */ + s = create_socket(ip, sendport); + + /* only wait for at most 3 seconds before giving up */ + alarm(3); + + /* Setup a sockaddr_in for the client we want to notify */ + bzero(&sock_cl, sizeof(sock_cl)); + sock_cl.sin_family = PF_INET; + sock_cl.sin_port = htons(clientport); + inet_aton(client, &sock_cl.sin_addr); + + w.tv_sec = 1; + w.tv_usec= 0; + + clnt = clntudp_create(&sock_cl, 100024, 1, w, &s); + if (clnt == NULL) { + printf("ERROR: failed to connect to client\n"); + exit(10); + } + + /* we dont want to wait for any reply */ + w.tv_sec = 0; + w.tv_usec = 0; + clnt_control(clnt, CLSET_TIMEOUT, (char *)&w); + + st.mon_name=server; + st.state=stateval; + sm_notify_1(&st, clnt); + + return 0; +} diff --git a/ctdb/utils/smnotify/smnotify.x b/ctdb/utils/smnotify/smnotify.x new file mode 100644 index 00000000000..94239f8baf2 --- /dev/null +++ b/ctdb/utils/smnotify/smnotify.x @@ -0,0 +1,21 @@ +#ifdef RPC_HDR +%#ifdef _AIX +%#include <rpc/rpc.h> +%#endif /* _AIX */ +#endif /* RPC_HDR */ + +const SM_MAXSTRLEN = 1024; + +struct status { + string mon_name<SM_MAXSTRLEN>; + int state; +}; + + +program SMNOTIFY { + version SMVERSION { + void SM_NOTIFY(struct status) = 6; + } = 1; +} = 100024; + + |