This is an automated email from the ASF dual-hosted git repository.

sodonnell pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/ozone.git


The following commit(s) were added to refs/heads/master by this push:
     new 1cf29b571e HDDS-6155. Adding ReplicationManagerMetrics to 
ReplicaManagerInsight (#5345)
1cf29b571e is described below

commit 1cf29b571ef28fe362e9608b9471319f9be94a0a
Author: VarshaRavi <[email protected]>
AuthorDate: Tue Sep 26 20:26:01 2023 +0530

    HDDS-6155. Adding ReplicationManagerMetrics to ReplicaManagerInsight (#5345)
---
 .../ozone/insight/scm/ReplicaManagerInsight.java   | 128 ++++++++++++++++++++-
 1 file changed, 127 insertions(+), 1 deletion(-)

diff --git 
a/hadoop-ozone/insight/src/main/java/org/apache/hadoop/ozone/insight/scm/ReplicaManagerInsight.java
 
b/hadoop-ozone/insight/src/main/java/org/apache/hadoop/ozone/insight/scm/ReplicaManagerInsight.java
index e42f7fc855..d7769a8cc3 100644
--- 
a/hadoop-ozone/insight/src/main/java/org/apache/hadoop/ozone/insight/scm/ReplicaManagerInsight.java
+++ 
b/hadoop-ozone/insight/src/main/java/org/apache/hadoop/ozone/insight/scm/ReplicaManagerInsight.java
@@ -25,10 +25,11 @@ import 
org.apache.hadoop.hdds.scm.container.replication.ReplicationManager;
 import org.apache.hadoop.ozone.insight.BaseInsightPoint;
 import org.apache.hadoop.ozone.insight.Component.Type;
 import org.apache.hadoop.ozone.insight.LoggerSource;
+import org.apache.hadoop.ozone.insight.MetricDisplay;
 import org.apache.hadoop.ozone.insight.MetricGroupDisplay;
 
 /**
- * Insight definition to chech the replication manager internal state.
+ * Insight definition to check the replication manager internal state.
  */
 public class ReplicaManagerInsight extends BaseInsightPoint {
 
@@ -44,6 +45,131 @@ public class ReplicaManagerInsight extends BaseInsightPoint 
{
   @Override
   public List<MetricGroupDisplay> getMetrics(Map<String, String> filters) {
     List<MetricGroupDisplay> display = new ArrayList<>();
+
+    MetricGroupDisplay containerMetrics = new MetricGroupDisplay(Type.SCM,
+        "ReplicationManager Container Metrics");
+    containerMetrics.addMetrics(new MetricDisplay("Open Containers",
+        "replication_manager_metrics_open_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Closing Containers",
+        "replication_manager_metrics_closing_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Quasi-closed Containers",
+        "replication_manager_metrics_quasi_closed_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Closed Containers",
+        "replication_manager_metrics_closed_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Deleting Containers",
+        "replication_manager_metrics_deleting_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Deleted Containers",
+        "replication_manager_metrics_deleted_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Recovering Containers",
+        "replication_manager_metrics_recovering_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("UnderReplicated Containers",
+        "replication_manager_metrics_under_replicated_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("MisReplicated Containers",
+        "replication_manager_metrics_mis_replicated_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("OverReplicated Containers",
+        "replication_manager_metrics_over_replicated_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Missing Containers",
+        "replication_manager_metrics_missing_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Unhealthy Containers",
+        "replication_manager_metrics_unhealthy_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Empty Containers",
+        "replication_manager_metrics_empty_containers"));
+    containerMetrics.addMetrics(new MetricDisplay("Open Unhealthy Containers",
+        "replication_manager_metrics_open_unhealthy_containers"));
+    containerMetrics.addMetrics(new MetricDisplay(
+        "Stuck QuasiClosed Containers",
+        "replication_manager_metrics_stuck_quasi_closed_containers"));
+    display.add(containerMetrics);
+
+    MetricGroupDisplay ecMetrics = new MetricGroupDisplay(Type.SCM,
+        "ReplicationManager EC Metrics");
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicationCmdsSentTotal",
+        "replication_manager_metrics_ec_replication_cmds_sent_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcDeletionCmdsSentTotal",
+        "replication_manager_metrics_ec_deletion_cmds_sent_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicasCreatedTotal",
+        "replication_manager_metrics_ec_replicas_created_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicasDeletedTotal",
+        "replication_manager_metrics_ec_replicas_deleted_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReconstructionCmdsSentTotal",
+        "replication_manager_metrics_ec_reconstruction_cmds_sent_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicaCreateTimeoutTotal",
+        "replication_manager_metrics_ec_replica_create_timeout_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicasDeletedTotal",
+        "replication_manager_metrics_ec_replicas_deleted_total"));
+    ecMetrics.addMetrics(new MetricDisplay("EcReplicaDeleteTimeoutTotal",
+        "replication_manager_metrics_ec_replica_delete_timeout_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcReconstructionCmdsDeferredTotal",
+        "replication_manager_metrics_ec_reconstruction_cmds_deferred_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcPartialReconstructionSkippedTotal",
+        
"replication_manager_metrics_ec_partial_reconstruction_skipped_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcPartialReconstructionCriticalTotal",
+        "replication_manager_metrics_ec_partial_reconstruction_" +
+            "critical_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcPartialReconstructionNoneOverloadedTotal",
+        "replication_manager_metrics_ec_partial_reconstruction_none_" +
+            "overloaded_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcPartialReplicationForOutOfServiceReplicasTotal",
+        "replication_manager_metrics_ec_partial_replication_for_" +
+            "out_of_service_replicas_total"));
+    ecMetrics.addMetrics(new MetricDisplay(
+        "EcPartialReplicationForMisReplicationTotal",
+        "replication_manager_metrics_ec_partial_replication_for_" +
+            "mis_replication_total"));
+    display.add(ecMetrics);
+
+    MetricGroupDisplay replicaMetrics = new MetricGroupDisplay(Type.SCM,
+        "ReplicationManager Metrics");
+    replicaMetrics.addMetrics(new MetricDisplay("InflightReplication",
+        "replication_manager_metrics_inflight_replication"));
+    replicaMetrics.addMetrics(new MetricDisplay("InflightDeletion",
+        "replication_manager_metrics_inflight_deletion"));
+    replicaMetrics.addMetrics(new MetricDisplay("InflightEcReplication",
+        "replication_manager_metrics_inflight_ec_replication"));
+    replicaMetrics.addMetrics(new MetricDisplay("InflightEcDeletion",
+        "replication_manager_metrics_inflight_ec_deletion"));
+    replicaMetrics.addMetrics(new MetricDisplay("UnderReplicatedQueueSize",
+        "replication_manager_metrics_under_replicated_queue_size"));
+    replicaMetrics.addMetrics(new MetricDisplay("OverReplicatedQueueSize",
+        "replication_manager_metrics_over_replicated_queue_size"));
+    replicaMetrics.addMetrics(new MetricDisplay("ReplicationCmdsSentTotal",
+        "replication_manager_metrics_replication_cmds_sent_total"));
+    replicaMetrics.addMetrics(new MetricDisplay("ReplicasCreatedTotal",
+        "replication_manager_metrics_replicas_created_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "ReplicaCreateTimeoutTotal",
+        "replication_manager_metrics_replica_create_timeout_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "DeletionCmdsSentTotal",
+        "replication_manager_metrics_deletion_cmds_sent_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "ReplicasDeletedTotal",
+        "replication_manager_metrics_replicas_deleted_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "ReplicaDeleteTimeoutTotal",
+        "replication_manager_metrics_replica_delete_timeout_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "DeleteContainerCmdsDeferredTotal",
+        "replication_manager_metrics_delete_container_cmds_deferred_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "ReplicateContainerCmdsDeferredTotal",
+        
"replication_manager_metrics_replicate_container_cmds_deferred_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "PendingReplicationLimitReachedTotal",
+        
"replication_manager_metrics_pending_replication_limit_reached_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "PartialReplicationTotal",
+        "replication_manager_metrics_partial_replication_total"));
+    replicaMetrics.addMetrics(new MetricDisplay(
+        "PartialReplicationForMisReplicationTotal",
+        "replication_manager_metrics_partial_replication_for_" +
+            "mis_replication_total"));
+    display.add(replicaMetrics);
     return display;
   }
 


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to