Today I ended up working out the details of what we want to monitor on our BladeCenter. The most interesting details (for us, that is) are these:

  • Fan speeds for Chassis Cooling/Power Module Cooling Bay(s)
  • Temperature
  • Power Domain utilization

It wasn’t *that* hard to implement. The only troubles I ran into were: (1) IBM did a real shitty job with the MIBs. If you look closely at mmblade.mib, you’ll notice that not a single OID is specified for the events. (2) As the MIBs weren’t documented anywhere, I had to look the OIDs up via snmpwalk (which I had never used before). So as a reminder (to myself), here’s how it is done:

snmpwalk -v1 -c public -O n 10.0.0.35 .1.3.6.1.4.1.2.3.51.2.2

This will get you a long list of output (5154 lines, to be exact). Luckily for me, the management module's web interface (and its SSH interface) is rather verbose, so all you need to do is compare the values shown there with the snmpwalk output to find the OIDs you are looking for.

So for myself (and anyone interested), read on for the list of checks we are currently running on the management module.

# Generic SNMP check against the host's address using community "public".
# Arguments supplied by the service's check_command:
#   $ARG1$  OID to query (-o)
#   $ARG2$  warning range (-w)
#   $ARG3$  critical range (-c)
#   $ARG4$  units string (-u)
#   $ARG5$  label prefixed to the plugin output (-l)
# $ARG4$ and $ARG5$ are quoted because services pass values containing
# spaces (e.g. "Fans present", "Input temperature"); unquoted, the shell
# would split them into separate arguments.
# The command_line is kept on one physical line: a directive value must not
# be wrapped across lines.
define command {
  command_name      check_snmpv1
  command_line      /usr/lib/nagios/plugins/check_snmp -C public -H $HOSTADDRESS$ -o $ARG1$ -w $ARG2$ -c $ARG3$ -l '$ARG5$' -u '$ARG4$'
}

# Host object for bc-mgmt1 (10.0.0.35); inherits from the generic-network
# template and is reached through parent host uni-greif-05.
define host {
  host_name    bc-mgmt1
  alias        bc-mgmt1.home.barfoo.org
  address      10.0.0.35
  parents      uni-greif-05
  use          generic-network
}

# Temperature reading on bc-mgmt1 via check_snmpv1.
# Arguments: OID ! warning 33 ! critical 38 ! units "C" ! label "Input temperature".
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Temperature
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.1.5.1.0!33!38!C!Input temperature
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Chassis cooling bay 1 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID ! warning ranges ! critical ranges ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Chassis Cooling - Bay 1
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.3.20.0!1600:1200,2100:2600!1200:0,2600:3000!RPM!Chassis Cooling - Bay 1
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Chassis cooling bay 2 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID ! warning ranges ! critical ranges ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Chassis Cooling - Bay 2
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.3.21.0!1600:1200,2100:2600!1200:0,2600:3000!RPM!Chassis Cooling - Bay 2
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power module cooling bay 1 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning ranges !
# critical ranges ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 1
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.6.1!6200:5400,6700:7000!5300:0,7000:7500!RPM!Power Module Cooling - Bay 1
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Fan-count reading for power module cooling bay 1 on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning range 2:1 !
# critical range 1:0 ! units "Fans present" ! label.
# The units string contains a space, so the check_snmpv1 command must quote
# its -u argument.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 1 Fans
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.4.1!2:1!1:0!Fans present!Power Module Cooling - Bay 1
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power module cooling bay 2 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning ranges !
# critical ranges ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 2
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.6.2!6200:5400,6700:7000!5300:0,7000:7500!RPM!Power Module Cooling - Bay 2
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Fan-count reading for power module cooling bay 2 on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning range 2:1 !
# critical range 1:0 ! units "Fans present" ! label.
# The units string contains a space, so the check_snmpv1 command must quote
# its -u argument.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 2 Fans
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.4.2!2:1!1:0!Fans present!Power Module Cooling - Bay 2
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power module cooling bay 3 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning ranges !
# critical ranges ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 3
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.6.3!6200:5400,6700:7000!5300:0,7000:7500!RPM!Power Module Cooling - Bay 3
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Fan-count reading for power module cooling bay 3 on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning range 2:1 !
# critical range 1:0 ! units "Fans present" ! label.
# The units string contains a space, so the check_snmpv1 command must quote
# its -u argument.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 3 Fans
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.4.3!2:1!1:0!Fans present!Power Module Cooling - Bay 3
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power module cooling bay 4 reading (units RPM) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning ranges !
# critical ranges ! units ! label.
# The OID index is .4 here: the previous value (.2) was a copy of the Bay 2
# definition, so this service was silently monitoring bay 2 instead of bay 4.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 4
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.6.4!6200:5400,6700:7000!5300:0,7000:7500!RPM!Power Module Cooling - Bay 4
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Fan-count reading for power module cooling bay 4 on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = bay number) ! warning range 2:1 !
# critical range 1:0 ! units "Fans present" ! label.
# The OID index is .4 here: the previous value (.2) was a copy of the Bay 2
# definition, so this service was silently monitoring bay 2 instead of bay 4.
# The units string contains a space, so the check_snmpv1 command must quote
# its -u argument.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Module Cooling - Bay 4 Fans
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.6.1.1.4.4!2:1!1:0!Fans present!Power Module Cooling - Bay 4
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power domain 1 utilization reading (units W) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = domain number) ! warning range
# 2600:2400 ! critical range 2880:2600 ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Domain 1: Utilization
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.10.1.1.1.10.1!2600:2400!2880:2600!W!Power Domain 1: Utilization
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}

# Power domain 2 utilization reading (units W) on bc-mgmt1 via check_snmpv1.
# Arguments: OID (last sub-identifier = domain number) ! warning range
# 2600:2400 ! critical range 2880:2600 ! units ! label.
# check_command is kept on a single line so no line break or indentation
# ends up inside the '!'-separated arguments.
define service {
  use                   generic-service
  host_name             bc-mgmt1
  service_description   Power Domain 2: Utilization
  check_command         check_snmpv1!.1.3.6.1.4.1.2.3.51.2.2.10.1.1.1.10.2!2600:2400!2880:2600!W!Power Domain 2: Utilization
  action_url            /pnp/index.php?host=$HOSTNAME$&srv=$SERVICEDESC$
  notes                 View PNP RRD graph
}