rochaporto / collectd-ceph

collectd plugins and dashboards for ceph
GNU General Public License v2.0
60 stars 65 forks source link

cluster status (ceph perf dump) #9

Closed rochaporto closed 10 years ago

rochaporto commented 10 years ago

Collect cluster status metrics from something similar to:

ceph --admin-daemon /var/run/ceph/ceph-mon.ceph.asok perf dump
{ "cluster": { "num_mon": 1,
      "num_mon_quorum": 1,
      "num_osd": 2,
      "num_osd_up": 2,
      "num_osd_in": 2,
      "osd_epoch": 29,
      "osd_kb": 6815452,
      "osd_kb_used": 2220596,
      "osd_kb_avail": 4594856,
      "num_pool": 15,
      "num_pg": 960,
      "num_pg_active_clean": 960,
      "num_pg_active": 960,
      "num_pg_peering": 0,
      "num_object": 13,
      "num_object_degraded": 0,
      "num_object_unfound": 0,
      "num_bytes": 22908977,
      "num_mds_up": 0,
      "num_mds_in": 0,
      "num_mds_failed": 0,
      "mds_epoch": 1},
  "leveldb": { "leveldb_get": 35461,
      "leveldb_transaction": 2166,
      "leveldb_compact": 0,
      "leveldb_compact_range": 2,
      "leveldb_compact_queue_merge": 0,
      "leveldb_compact_queue_len": 0},
  "mon": {},
  "throttle-mon_client_bytes": { "val": 0,
      "max": 104857600,
      "get": 2573538,
      "get_sum": 187405680,
      "get_or_fail_fail": 0,
      "get_or_fail_success": 0,
      "take": 0,
      "take_sum": 0,
      "put": 2573538,
      "put_sum": 187405680,
      "wait": { "avgcount": 0,
          "sum": 0.000000000}},
  "throttle-mon_daemon_bytes": { "val": 0,
      "max": 419430400,
      "get": 11354,
      "get_sum": 4799934,
      "get_or_fail_fail": 0,
      "get_or_fail_success": 0,
      "take": 0,
      "take_sum": 0,
      "put": 11354,
      "put_sum": 4799934,
      "wait": { "avgcount": 0,
          "sum": 0.000000000}},
  "throttle-msgr_dispatch_throttler-mon": { "val": 0,
      "max": 104857600,
      "get": 2584892,
      "get_sum": 192205614,
      "get_or_fail_fail": 0,
      "get_or_fail_success": 0,
      "take": 0,
      "take_sum": 0,
      "put": 2584892,
      "put_sum": 192205614,
      "wait": { "avgcount": 0,
          "sum": 0.000000000}}}

Even if some of these metrics are already available from other sources, collecting them here is still worthwhile.

rochaporto commented 10 years ago

OSD state values are already provided by #1

Total cluster usage is already provided by #4

So we probably don't need this one.