fix(ceph): PromRule CephPGImbalance adjusted to group by node
Balancing is done per hostname, not per OSD. !1
This commit is contained in:
		| @ -257,10 +257,25 @@ spec: | |||||||
|           description: "OSD {{ `{{` }} $labels.ceph_daemon }} on {{ `{{` }} $labels.hostname }} deviates by more than 30% from average PG count." |           description: "OSD {{ `{{` }} $labels.ceph_daemon }} on {{ `{{` }} $labels.hostname }} deviates by more than 30% from average PG count." | ||||||
|           summary: "PGs are not balanced across OSDs" |           summary: "PGs are not balanced across OSDs" | ||||||
|         expr: | |         expr: | | ||||||
|           abs( |           # abs( | ||||||
|             ((ceph_osd_numpg > 0) - on (job) group_left avg(ceph_osd_numpg > 0) by (job)) / |           #   ((ceph_osd_numpg > 0) - on (job) group_left avg(ceph_osd_numpg > 0) by (job)) / | ||||||
|             on (job) group_left avg(ceph_osd_numpg > 0) by (job) |           #   on (job) group_left avg(ceph_osd_numpg > 0) by (hostname) | ||||||
|           ) * on (ceph_daemon) group_left(hostname) ceph_osd_metadata > 0.30 |           # ) * on (ceph_daemon) group_left(hostname) ceph_osd_metadata > 0.30 | ||||||
|  |           (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata))  | ||||||
|  |             <  | ||||||
|  |           scalar( | ||||||
|  |             (avg by (job) (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata)) | ||||||
|  |               -  | ||||||
|  |             (avg by (job) (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata)) * 0.3 )) | ||||||
|  |           ) | ||||||
|  |             or | ||||||
|  |           (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata)) | ||||||
|  |           > | ||||||
|  |           scalar( | ||||||
|  |             (avg by (job) (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata)) | ||||||
|  |               + | ||||||
|  |             (avg by (job) (sum by(hostname) ((ceph_osd_numpg > 0) * on(ceph_daemon) group_left(hostname) ceph_osd_metadata)) * 0.3 )) | ||||||
|  |           ) | ||||||
|         for: "5m" |         for: "5m" | ||||||
|         labels: |         labels: | ||||||
|           oid: "1.3.6.1.4.1.50495.1.2.1.4.5" |           oid: "1.3.6.1.4.1.50495.1.2.1.4.5" | ||||||
|  | |||||||
		Reference in New Issue
	
	Block a user