csd: remove from repo It never really made sense for the CSD to exist in Kudu's repo, as it is tightly coupled to Cloudera Manager. After ensuring that it'll live on in a separate Cloudera repository, this commit removes it.
I searched for CSD-related references using 'git grep -i csd'. Change-Id: I8cffc1e536e92adc45a12354c9aacb8046739fb7 Reviewed-on: http://gerrit.cloudera.org:8080/5973 Tested-by: Kudu Jenkins Reviewed-by: Todd Lipcon <[email protected]> Reviewed-by: Jean-Daniel Cryans <[email protected]> Project: http://git-wip-us.apache.org/repos/asf/kudu/repo Commit: http://git-wip-us.apache.org/repos/asf/kudu/commit/f7d5c73d Tree: http://git-wip-us.apache.org/repos/asf/kudu/tree/f7d5c73d Diff: http://git-wip-us.apache.org/repos/asf/kudu/diff/f7d5c73d Branch: refs/heads/master Commit: f7d5c73dd06f0388bd4cb46ef3c24c94886baa09 Parents: 49c4817 Author: Adar Dembo <[email protected]> Authored: Fri Feb 10 20:33:29 2017 -0800 Committer: Adar Dembo <[email protected]> Committed: Mon Feb 13 23:39:33 2017 +0000 ---------------------------------------------------------------------- RELEASING.adoc | 4 - build-support/jenkins/build-and-test.sh | 2 +- build-support/release/rat_exclude_files.txt | 1 - java/README.md | 16 - java/kudu-csd/check_csd_compatibility.py | 92 -- java/kudu-csd/generate_mdl.py | 261 ---- .../old-version-metrics/0.10.0-master.json | 1236 ------------------ .../old-version-metrics/0.10.0-tserver.json | 1124 ---------------- .../old-version-metrics/0.9.1-master.json | 1196 ----------------- .../old-version-metrics/0.9.1-tserver.json | 1116 ---------------- .../old-version-metrics/1.0.0-master.json | 1236 ------------------ .../old-version-metrics/1.0.0-tserver.json | 1124 ---------------- .../old-version-metrics/1.0.1-master.json | 1236 ------------------ .../old-version-metrics/1.0.1-tserver.json | 1124 ---------------- java/kudu-csd/pom.xml | 116 -- java/kudu-csd/src/descriptor/service.sdl | 319 ----- java/kudu-csd/src/images/icon.png | Bin 693 -> 0 bytes java/kudu-csd/src/scripts/kudu.sh | 131 -- java/pom.xml | 10 - 19 files changed, 1 insertion(+), 10343 deletions(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/RELEASING.adoc ---------------------------------------------------------------------- diff --git a/RELEASING.adoc b/RELEASING.adoc index 60cb802..161e4ac 100644 --- a/RELEASING.adoc +++ b/RELEASING.adoc @@ -77,10 +77,6 @@ branch with the same name and the previously-noted SHA1. mvn versions:set -DnewVersion=0.X.0-SNAPSHOT ---- -. Check to make sure the version number in `java/kudu-csd/pom.xml` under - "com.cloudera.csd" matches. Itâs listed in two places and some versions of - maven apparently do not update both. - . If the python API has changed since the previous release, bump the Python version in `python/setup.py` in master. (the Python API uses separate versioning). http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/build-support/jenkins/build-and-test.sh ---------------------------------------------------------------------- diff --git a/build-support/jenkins/build-and-test.sh b/build-support/jenkins/build-and-test.sh index cb86b00..98b0d1c 100755 --- a/build-support/jenkins/build-and-test.sh +++ b/build-support/jenkins/build-and-test.sh @@ -353,7 +353,7 @@ if [ "$BUILD_JAVA" == "1" ]; then pushd $SOURCE_ROOT/java export TSAN_OPTIONS="$TSAN_OPTIONS suppressions=$SOURCE_ROOT/build-support/tsan-suppressions.txt history_size=7" set -x - if ! mvn $MVN_FLAGS -PbuildCSD \ + if ! mvn $MVN_FLAGS \ -Dsurefire.rerunFailingTestsCount=3 \ -Dfailsafe.rerunFailingTestsCount=3 \ clean verify ; then http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/build-support/release/rat_exclude_files.txt ---------------------------------------------------------------------- diff --git a/build-support/release/rat_exclude_files.txt b/build-support/release/rat_exclude_files.txt index 566ba19..6dbcb4f 100644 --- a/build-support/release/rat_exclude_files.txt +++ b/build-support/release/rat_exclude_files.txt @@ -10,7 +10,6 @@ pax_global_header version.txt build-support/release/rat_exclude_files.txt docs/support/doxygen/client_api.footer.in -java/kudu-csd/old-version-metrics/*.json java/kudu-flume-sink/src/test/avro/testAvroKuduOperationsProducer.avsc java/kudu-client/src/main/java/com/google/protobuf/ZeroCopyLiteralByteString.java java/kudu-client/src/main/java/org/apache/kudu/client/AsyncKuduClient.java http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/java/README.md ---------------------------------------------------------------------- diff --git a/java/README.md b/java/README.md index ac45186..0ce538e 100644 --- a/java/README.md +++ b/java/README.md @@ -136,19 +136,3 @@ likely a bug in maven-protoc-plugin. There's a simple workaround: delete the errant folder within Eclipse and refresh the kudu-client project. - - -Building the Kudu Custom Service Descriptor (CSD) ------------------------------------------------------------- - -By default, the Kudu CSD will not be built with the client -and isn't needed by any API. - -It requires access to the Kudu binaries which have to be built -prior to building this module. - -Here's how to build the kudu-csd module: - -$ mvn package -DskipTests -PbuildCSD - -This will both build the Kudu CSD and validate it for correctness. http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/java/kudu-csd/check_csd_compatibility.py ---------------------------------------------------------------------- diff --git a/java/kudu-csd/check_csd_compatibility.py b/java/kudu-csd/check_csd_compatibility.py deleted file mode 100755 index 2c875c0..0000000 --- a/java/kudu-csd/check_csd_compatibility.py +++ /dev/null @@ -1,92 +0,0 @@ -#!/usr/bin/env python -# -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. - -# This tool checks for compatibility between two CSD jars. -# Namely, it ensures that no metrics have been removed. - -import argparse -import json -import sys -import zipfile - -# The path within a CSD that contains the MDL file. -MDL_PATH = "descriptor/service.mdl" - - -def metrics_from_mdl(mdl): - """ - Return a set() representing the metrics in the given MDL JSON object. - - Each entry is a tuple of either: - ('entity', entity_name, metric_name) - or - ('role', role_name, metric_name) - """ - metrics = set() - for entity_def in mdl['metricEntityTypeDefinitions']: - for metric_def in entity_def['metricDefinitions']: - metrics.add(('entity', entity_def['name'], metric_def['name'])) - for role_def in mdl['roles']: - for metric_def in role_def['metricDefinitions']: - metrics.add(('role', role_def['name'], metric_def['name'])) - return metrics - - -def check_mdl_compat(old_zip, new_zip, args): - old_mdl = json.load(old_zip.open(MDL_PATH)) - new_mdl = json.load(new_zip.open(MDL_PATH)) - - old_metrics = metrics_from_mdl(old_mdl) - new_metrics = metrics_from_mdl(new_mdl) - - added_metrics = new_metrics.difference(old_metrics) - removed_metrics = old_metrics.difference(new_metrics) - - print "Added %d metric(s):" % len(added_metrics) - for m_type, m_entity, m_name in added_metrics: - print " %s metric %s" % (m_entity, m_name) - if removed_metrics: - print "Removed %d metric(s):" % len(removed_metrics) - for m_type, m_entity, m_name in removed_metrics: - print " %s metric %s" % (m_entity, m_name) - print "Compatibility check FAILED" - sys.exit(1) - print "No metrics were removed." - print "Compatibility check PASSED" - - -def main(): - p = argparse.ArgumentParser( - description=("Checks for compatibility between CSD JARs. " + - "May also generate a file containing JSON for " + - "metrics that were removed between the old version " - "of the CSD and the specified new one.")) - p.add_argument("old_jar", metavar="KUDU-old.jar", type=str, - help="The old CSD JAR to compare") - p.add_argument("new_jar", metavar="KUDU-new.jar", type=str, - help="The new CSD JAR to compare") - args = p.parse_args() - - old_zip = zipfile.ZipFile(args.old_jar) - new_zip = zipfile.ZipFile(args.new_jar) - check_mdl_compat(old_zip, new_zip, args) - - -if __name__ == "__main__": - main() http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/java/kudu-csd/generate_mdl.py ---------------------------------------------------------------------- diff --git a/java/kudu-csd/generate_mdl.py b/java/kudu-csd/generate_mdl.py deleted file mode 100755 index 0fe054f..0000000 --- a/java/kudu-csd/generate_mdl.py +++ /dev/null @@ -1,261 +0,0 @@ -#!/usr/bin/env python -# -# Licensed to the Apache Software Foundation (ASF) under one -# or more contributor license agreements. See the NOTICE file -# distributed with this work for additional information -# regarding copyright ownership. The ASF licenses this file -# to you under the Apache License, Version 2.0 (the -# "License"); you may not use this file except in compliance -# with the License. You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, -# software distributed under the License is distributed on an -# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY -# KIND, either express or implied. See the License for the -# specific language governing permissions and limitations -# under the License. -# -# Script to generate a CM-compatible MDL file from the metrics -# metadata dumped by our daemon processes. -# -# Requires that the daemon processes have already been built and available -# in the build/latest/bin directory. -# -# Outputs the MDL file on stdout by default or to a file specified in the first -# argument. - -import collections -from distutils.version import LooseVersion -try: - import simplejson as json -except: - import json -import os -import subprocess -import sys - -BINARIES=["kudu-master", "kudu-tserver"] - -BASE_DIR = os.path.dirname(os.path.abspath(__file__)) -RELATIVE_BUILD_DIR="../../build/latest/bin" - -DEPRECATION_MESSAGE = " This metric is no longer produced in " + \ - "current versions of Kudu." - -def find_binary(bin_name): - build_dir = os.path.join(BASE_DIR, RELATIVE_BUILD_DIR) - path = os.path.join(build_dir, bin_name) - if os.path.exists(path): - return path - raise Exception("Cannot find %s in build dir %s" % (bin_name, build_dir)) - -def load_current_metrics(): - """ - For each binary, dump and parse its metrics schema by running it with - the --dump_metrics_json flag. - """ - all_metrics = [] - for binary in BINARIES: - binary = find_binary(binary) - p = subprocess.Popen([binary, "--dump_metrics_json"], - stdout=subprocess.PIPE, - stderr=subprocess.PIPE) - stdout, stderr = p.communicate() - rc = p.returncode - - if rc != 0: - print >>sys.stderr, "error: %s exited with return code %d:\n" % (binary, rc) - print >>sys.stderr, stderr - sys.exit(1) - - metrics_dump = json.loads(stdout) - all_metrics.extend(metrics_dump['metrics']) - return all_metrics - - -def load_historical_metrics(): - """ - Load the metrics dump output from older versions of Kudu. These are checked - into the source repository in the "old-version-metrics" directory. - - If any of these metrics has been removed in the current version of Kudu, - it will be included, but marked as deprecated and no longer produced. - """ - - old_metrics = {} - old_dir = os.path.join(BASE_DIR, "old-version-metrics") - - # Load the metrics dumps from previous versions in ascending - # version order. This way, we retain the latest description/name - # of the metric in the remaining (deprecated) metric. - for path in sorted(os.listdir(old_dir), key=LooseVersion): - if not path.endswith(".json") or path.startswith("."): - continue - j = json.load(file(os.path.join(old_dir, path))) - old_metrics.update((m['name'], m) for m in j['metrics']) - return old_metrics.values() - - -def append_sentence(a, b): - if not a.endswith("."): - a += "." - return a + " " + b - -def metric_to_mdl_entries(m): - if m['type'] == 'histogram': - return [ - dict( - context=(m['name'] + "::total_count"), - name=('kudu_' + m['name'].lower()) + '_count', - counter=True, - numeratorUnit='samples', - description=append_sentence(m['description'], - "This is the total number of recorded samples."), - label=m['label'] + ": Samples"), - dict( - context=(m['name'] + "::total_sum"), - name=('kudu_' + m['name'].lower()) + '_sum', - counter=True, - numeratorUnit=m['unit'], - description=append_sentence(m['description'], - "This is the total sum of recorded samples."), - label=m['label'] + ": Total") - ] - - return [dict( - context=(m['name'] + "::value"), - name=('kudu_' + m['name'].lower()), - counter=(m['type'] == 'counter'), - numeratorUnit=m['unit'], - description=m['description'], - label=m['label'])] - - -def deprecate_entries(mdl_entries): - """ For each entry in 'mdl_entries', mark it as deprecated. """ - for m in mdl_entries: - m['label'] = "DEPRECATED: %s" % m['label'] - m['description'] += DEPRECATION_MESSAGE - - -def metrics_to_mdl(metrics, historical_metrics): - """ - For each metric returned by the daemon, convert it to the MDL-compatible dictionary. - Metrics which are in 'historical_metrics' but not in 'metrics' are added, but marked - as deprecated. - - Returns a map of entity_type_name -> [metric dicts]. - """ - seen = set() - - by_entity = collections.defaultdict(lambda: []) - def add_metrics(metrics, deprecated=False): - for m in metrics: - # Don't process any metric more than once. Some metrics show up - # in both daemons. - key = (m['entity_type'], m['name']) - if key in seen: - continue - seen.add(key) - # Convert to the format that CM expects. - mdl_entries = metric_to_mdl_entries(m) - if deprecated: - deprecate_entries(mdl_entries) - by_entity[m['entity_type']].extend(mdl_entries) - - # First add all the current metrics. - add_metrics(metrics) - # Then add any metrics from old versions that were not already - # added by the current version. These are marked as DEPRECATED. - add_metrics(historical_metrics, deprecated=True) - return by_entity - - -def main(): - current_metrics = load_current_metrics() - historical_metrics = load_historical_metrics() - metrics_by_entity = metrics_to_mdl(current_metrics, historical_metrics) - server_metrics = metrics_by_entity['server'] - tablet_metrics = metrics_by_entity['tablet'] - - output = dict( - name="KUDU", - version="0.6.0", - metricDefinitions=[], - nameForCrossEntityAggregateMetrics="kudus", - roles=[ - dict(name="KUDU_TSERVER", - nameForCrossEntityAggregateMetrics="kudu_tservers", - metricDefinitions=server_metrics), - dict(name="KUDU_MASTER", - nameForCrossEntityAggregateMetrics="kudu_masters", - metricDefinitions=server_metrics) - ], - metricEntityAttributeDefinitions=[ - dict(name="kuduTableId", - label="Table ID", - description="UUID for Kudu Table.", - valueCaseSensitive=False), - dict(name="kuduTableName", - label="Table Name", - description="Name for Kudu Table.", - valueCaseSensitive=True), - dict(name="kuduTableState", - label="Table State", - description="State for Kudu Table.", - valueCaseSensitive=False), - dict(name="kuduTabletId", - label="Tablet ID", - description="UUID for Kudu Tablet.", - valueCaseSensitive=False), - dict(name="kuduTabletState", - label="Tablet State", - description="State for Kudu Tablet.", - valueCaseSensitive=False) - # TODO: add the role's persistent UUID after discussing with - # Chris on how to inject it into their CM entity. - ], - metricEntityTypeDefinitions=[ - dict(name="KUDU_TABLE", - nameForCrossEntityAggregateMetrics="kudu_tables", - immutableAttributeNames=["serviceName", "kuduTableId"], - mutableAttributeNames=["kuduTableName", "kuduTableState"], - entityNameFormat=["serviceName", "kuduTableId"], - description="A Kudu table.", - label="Kudu Table", - labelPlural="Kudu Tables", - entityLabelFormat="$kuduTableName ($serviceDisplayName)", - parentMetricEntityTypeNames=["KUDU"], - metricDefinitions=[]), - dict(name="KUDU_TABLET", - nameForCrossEntityAggregateMetrics="kudu_tablets", - immutableAttributeNames=["serviceName", "kuduTableId", "kuduTabletId"], - mutableAttributeNames=["kuduTabletState"], - entityNameFormat=["serviceName", "kuduTabletId"], - description="A Kudu tablet.", - label="Kudu Tablet", - labelPlural="Kudu Tablets", - entityLabelFormat="$kuduTabletId ($kuduTableName) ($serviceDisplayName)", - parentMetricEntityTypeNames=["KUDU_TABLE"], - metricDefinitions=[]), - dict(name="KUDU_REPLICA", - nameForCrossEntityAggregateMetrics="kudu_replicas", - immutableAttributeNames=["kuduTabletId", "serviceName", "roleName"], - entityNameFormat=["roleName","kuduTabletId"], - description="A Kudu replica.", - label="Kudu Replica", - labelPlural="Kudu Replicas", - entityLabelFormat="$kuduTabletId ($kuduTableName) ($hostname)", - parentMetricEntityTypeNames=["KUDU_TABLET","KUDU-KUDU_TSERVER"], - metricDefinitions=tablet_metrics), - ]) - - f = sys.stdout - if len(sys.argv) > 1: - f = open(sys.argv[1], 'w') - f.write(json.dumps(output, indent=4)) - -if __name__ == "__main__": - main() http://git-wip-us.apache.org/repos/asf/kudu/blob/f7d5c73d/java/kudu-csd/old-version-metrics/0.10.0-master.json ---------------------------------------------------------------------- diff --git a/java/kudu-csd/old-version-metrics/0.10.0-master.json b/java/kudu-csd/old-version-metrics/0.10.0-master.json deleted file mode 100644 index 5ade70f..0000000 --- a/java/kudu-csd/old-version-metrics/0.10.0-master.json +++ /dev/null @@ -1,1236 +0,0 @@ -{ - "metrics": [ - { - "name": "op_apply_queue_length", - "label": "Operation Apply Queue Length", - "type": "histogram", - "unit": "tasks", - "description": "Number of operations waiting to be applied to the tablet. High queue lengths indicate that the server is unable to process operations as fast as they are being written to the WAL.", - "entity_type": "server" - }, - { - "name": "op_apply_queue_time", - "label": "Operation Apply Queue Time", - "type": "histogram", - "unit": "microseconds", - "description": "Time that operations spent waiting in the apply queue before being processed. High queue times indicate that the server is unable to process operations as fast as they are being written to the WAL.", - "entity_type": "server" - }, - { - "name": "op_apply_run_time", - "label": "Operation Apply Run Time", - "type": "histogram", - "unit": "microseconds", - "description": "Time that operations spent being applied to the tablet. High values may indicate that the server is under-provisioned or that operations consist of very large batches.", - "entity_type": "server" - }, - { - "name": "active_scanners", - "label": "Active Scanners", - "type": "gauge", - "unit": "scanners", - "description": "Number of scanners that are currently active", - "entity_type": "server" - }, - { - "name": "scanners_expired", - "label": "Scanners Expired", - "type": "counter", - "unit": "scanners", - "description": "Number of scanners that have expired since service start", - "entity_type": "server" - }, - { - "name": "scanner_duration", - "label": "Scanner Duration", - "type": "histogram", - "unit": "microseconds", - "description": "Histogram of the duration of active scanners on this tablet.", - "entity_type": "server" - }, - { - "name": "memrowset_size", - "label": "MemRowSet Memory Usage", - "type": "gauge", - "unit": "bytes", - "description": "Size of this tablet's memrowset", - "entity_type": "tablet" - }, - { - "name": "on_disk_size", - "label": "Tablet Size On Disk", - "type": "gauge", - "unit": "bytes", - "description": "Size of this tablet on disk.", - "entity_type": "tablet" - }, - { - "name": "rows_inserted", - "label": "Rows Inserted", - "type": "counter", - "unit": "rows", - "description": "Number of rows inserted into this tablet since service start", - "entity_type": "tablet" - }, - { - "name": "rows_upserted", - "label": "Rows Upserted", - "type": "counter", - "unit": "rows", - "description": "Number of rows upserted into this tablet since service start", - "entity_type": "tablet" - }, - { - "name": "rows_updated", - "label": "Rows Updated", - "type": "counter", - "unit": "rows", - "description": "Number of row update operations performed on this tablet since service start", - "entity_type": "tablet" - }, - { - "name": "rows_deleted", - "label": "Rows Deleted", - "type": "counter", - "unit": "rows", - "description": "Number of row delete operations performed on this tablet since service start", - "entity_type": "tablet" - }, - { - "name": "scanner_rows_returned", - "label": "Scanner Rows Returned", - "type": "counter", - "unit": "rows", - "description": "Number of rows returned by scanners to clients. This count is measured after predicates are applied, and thus is not a reflection of the amount of work being done by scanners.", - "entity_type": "tablet" - }, - { - "name": "scanner_cells_returned", - "label": "Scanner Cells Returned", - "type": "counter", - "unit": "cells", - "description": "Number of table cells returned by scanners to clients. This count is measured after predicates are applied, and thus is not a reflection of the amount of work being done by scanners.", - "entity_type": "tablet" - }, - { - "name": "scanner_bytes_returned", - "label": "Scanner Bytes Returned", - "type": "counter", - "unit": "bytes", - "description": "Number of bytes returned by scanners to clients. This count is measured after predicates are applied and the data is decoded for consumption by clients, and thus is not a reflection of the amount of work being done by scanners.", - "entity_type": "tablet" - }, - { - "name": "scanner_rows_scanned", - "label": "Scanner Rows Scanned", - "type": "counter", - "unit": "rows", - "description": "Number of rows processed by scan requests. This is measured as a raw count prior to application of predicates, deleted data,or MVCC-based filtering. Thus, this is a better measure of actual table rows that have been processed by scan operations compared to the Scanner Rows Returned metric.", - "entity_type": "tablet" - }, - { - "name": "scanner_cells_scanned_from_disk", - "label": "Scanner Cells Scanned From Disk", - "type": "counter", - "unit": "cells", - "description": "Number of table cells processed by scan requests. This is measured as a raw count prior to application of predicates, deleted data,or MVCC-based filtering. Thus, this is a better measure of actual table cells that have been processed by scan operations compared to the Scanner Cells Returned metric.\nNote that this only counts data that has been flushed to disk, and does not include data read from in-memory stores. However, itincludes both cache misses and cache hits.", - "entity_type": "tablet" - }, - { - "name": "scanner_bytes_scanned_from_disk", - "label": "Scanner Bytes Scanned From Disk", - "type": "counter", - "unit": "bytes", - "description": "Number of bytes read by scan requests. This is measured as a raw count prior to application of predicates, deleted data,or MVCC-based filtering. Thus, this is a better measure of actual IO that has been caused by scan operations compared to the Scanner Bytes Returned metric.\nNote that this only counts data that has been flushed to disk, and does not include data read from in-memory stores. However, itincludes both cache misses and cache hits.", - "entity_type": "tablet" - }, - { - "name": "insertions_failed_dup_key", - "label": "Duplicate Key Inserts", - "type": "counter", - "unit": "rows", - "description": "Number of inserts which failed because the key already existed", - "entity_type": "tablet" - }, - { - "name": "scans_started", - "label": "Scans Started", - "type": "counter", - "unit": "scanners", - "description": "Number of scanners which have been started on this tablet", - "entity_type": "tablet" - }, - { - "name": "bloom_lookups", - "label": "Bloom Filter Lookups", - "type": "counter", - "unit": "probes", - "description": "Number of times a bloom filter was consulted", - "entity_type": "tablet" - }, - { - "name": "key_file_lookups", - "label": "Key File Lookups", - "type": "counter", - "unit": "probes", - "description": "Number of times a key cfile was consulted", - "entity_type": "tablet" - }, - { - "name": "delta_file_lookups", - "label": "Delta File Lookups", - "type": "counter", - "unit": "probes", - "description": "Number of times a delta file was consulted", - "entity_type": "tablet" - }, - { - "name": "mrs_lookups", - "label": "MemRowSet Lookups", - "type": "counter", - "unit": "probes", - "description": "Number of times a MemRowSet was consulted.", - "entity_type": "tablet" - }, - { - "name": "bytes_flushed", - "label": "Bytes Flushed", - "type": "counter", - "unit": "bytes", - "description": "Amount of data that has been flushed to disk by this tablet.", - "entity_type": "tablet" - }, - { - "name": "bloom_lookups_per_op", - "label": "Bloom Lookups per Operation", - "type": "histogram", - "unit": "probes", - "description": "Tracks the number of bloom filter lookups performed by each operation. A single operation may perform several bloom filter lookups if the tablet is not fully compacted. High frequency of high values may indicate that compaction is falling behind.", - "entity_type": "tablet" - }, - { - "name": "key_file_lookups_per_op", - "label": "Key Lookups per Operation", - "type": "histogram", - "unit": "probes", - "description": "Tracks the number of key file lookups performed by each operation. A single operation may perform several key file lookups if the tablet is not fully compacted and if bloom filters are not effectively culling lookups.", - "entity_type": "tablet" - }, - { - "name": "delta_file_lookups_per_op", - "label": "Delta File Lookups per Operation", - "type": "histogram", - "unit": "probes", - "description": "Tracks the number of delta file lookups performed by each operation. A single operation may perform several delta file lookups if the tablet is not fully compacted. High frequency of high values may indicate that compaction is falling behind.", - "entity_type": "tablet" - }, - { - "name": "write_op_duration_client_propagated_consistency", - "label": "Write Op Duration with Propagated Consistency", - "type": "histogram", - "unit": "microseconds", - "description": "Duration of writes to this tablet with external consistency set to CLIENT_PROPAGATED.", - "entity_type": "tablet" - }, - { - "name": "write_op_duration_commit_wait_consistency", - "label": "Write Op Duration with Commit-Wait Consistency", - "type": "histogram", - "unit": "microseconds", - "description": "Duration of writes to this tablet with external consistency set to COMMIT_WAIT.", - "entity_type": "tablet" - }, - { - "name": "commit_wait_duration", - "label": "Commit-Wait Duration", - "type": "histogram", - "unit": "microseconds", - "description": "Time spent waiting for COMMIT_WAIT external consistency writes for this tablet.", - "entity_type": "tablet" - }, - { - "name": "snapshot_read_inflight_wait_duration", - "label": "Time Waiting For Snapshot Reads", - "type": "histogram", - "unit": "microseconds", - "description": "Time spent waiting for in-flight writes to complete for READ_AT_SNAPSHOT scans.", - "entity_type": "tablet" - }, - { - "name": "flush_dms_running", - "label": "DeltaMemStore Flushes Running", - "type": "gauge", - "unit": "operations", - "description": "Number of delta memstore flushes currently running.", - "entity_type": "tablet" - }, - { - "name": "flush_mrs_running", - "label": "MemRowSet Flushes Running", - "type": "gauge", - "unit": "operations", - "description": "Number of MemRowSet flushes currently running.", - "entity_type": "tablet" - }, - { - "name": "compact_rs_running", - "label": "RowSet Compactions Running", - "type": "gauge", - "unit": "operations", - "description": "Number of RowSet compactions currently running.", - "entity_type": "tablet" - }, - { - "name": "delta_minor_compact_rs_running", - "label": "Minor Delta Compactions Running", - "type": "gauge", - "unit": "operations", - "description": "Number of delta minor compactions currently running.", - "entity_type": "tablet" - }, - { - "name": "delta_major_compact_rs_running", - "label": "Major Delta Compactions Running", - "type": "gauge", - "unit": "operations", - "description": "Number of delta major compactions currently running.", - "entity_type": "tablet" - }, - { - "name": "flush_dms_duration", - "label": "DeltaMemStore Flush Duration", - "type": "histogram", - "unit": "milliseconds", - "description": "Time spent flushing DeltaMemStores.", - "entity_type": "tablet" - }, - { - "name": "flush_mrs_duration", - "label": "MemRowSet Flush Duration", - "type": "histogram", - "unit": "milliseconds", - "description": "Time spent flushing MemRowSets.", - "entity_type": "tablet" - }, - { - "name": "compact_rs_duration", - "label": "RowSet Compaction Duration", - "type": "histogram", - "unit": "milliseconds", - "description": "Time spent compacting RowSets.", - "entity_type": "tablet" - }, - { - "name": "delta_minor_compact_rs_duration", - "label": "Minor Delta Compaction Duration", - "type": "histogram", - "unit": "milliseconds", - "description": "Time spent minor delta compacting.", - "entity_type": "tablet" - }, - { - "name": "delta_major_compact_rs_duration", - "label": "Major Delta Compaction Duration", - "type": "histogram", - "unit": "seconds", - "description": "Seconds spent major delta compacting.", - "entity_type": "tablet" - }, - { - "name": "leader_memory_pressure_rejections", - "label": "Leader Memory Pressure Rejections", - "type": "counter", - "unit": "requests", - "description": "Number of RPC requests rejected due to memory pressure while LEADER.", - "entity_type": "tablet" - }, - { - "name": "op_prepare_queue_length", - "label": "Operation Prepare Queue Length", - "type": "histogram", - "unit": "tasks", - "description": "Number of operations waiting to be prepared within this tablet. High queue lengths indicate that the server is unable to process operations as fast as they are being written to the WAL.", - "entity_type": "tablet" - }, - { - "name": "op_prepare_queue_time", - "label": "Operation Prepare Queue Time", - "type": "histogram", - "unit": "microseconds", - "description": "Time that operations spent waiting in the prepare queue before being processed. High queue times indicate that the server is unable to process operations as fast as they are being written to the WAL.", - "entity_type": "tablet" - }, - { - "name": "op_prepare_run_time", - "label": "Operation Prepare Run Time", - "type": "histogram", - "unit": "microseconds", - "description": "Time that operations spent being prepared in the tablet. High values may indicate that the server is under-provisioned or that operations are experiencing high contention with one another for locks.", - "entity_type": "tablet" - }, - { - "name": "all_transactions_inflight", - "label": "Transactions In Flight", - "type": "gauge", - "unit": "transactions", - "description": "Number of transactions currently in-flight, including any type.", - "entity_type": "tablet" - }, - { - "name": "write_transactions_inflight", - "label": "Write Transactions In Flight", - "type": "gauge", - "unit": "transactions", - "description": "Number of write transactions currently in-flight", - "entity_type": "tablet" - }, - { - "name": "alter_schema_transactions_inflight", - "label": "Alter Schema Transactions In Flight", - "type": "gauge", - "unit": "transactions", - "description": "Number of alter schema transactions currently in-flight", - "entity_type": "tablet" - }, - { - "name": "transaction_memory_pressure_rejections", - "label": "Transaction Memory Pressure Rejections", - "type": "counter", - "unit": "transactions", - "description": "Number of transactions rejected because the tablet's transaction memory limit was reached.", - "entity_type": "tablet" - }, - { - "name": "log_gc_running", - "label": "Log GCs Running", - "type": "gauge", - "unit": "operations", - "description": "Number of log GC operations currently running.", - "entity_type": "tablet" - }, - { - "name": "log_gc_duration", - "label": "Log GC Duration", - "type": "histogram", - "unit": "milliseconds", - "description": "Time spent garbage collecting the logs.", - "entity_type": "tablet" - }, - { - "name": "generic_current_allocated_bytes", - "label": "Heap Memory Usage", - "type": "gauge", - "unit": "bytes", - "description": "Number of bytes used by the application. This will not typically match the memory use reported by the OS, because it does not include TCMalloc overhead or memory fragmentation.", - "entity_type": "server" - }, - { - "name": "generic_heap_size", - "label": "Reserved Heap Memory", - "type": "gauge", - "unit": "bytes", - "description": "Bytes of system memory reserved by TCMalloc.", - "entity_type": "server" - }, - { - "name": "tcmalloc_pageheap_free_bytes", - "label": "Free Heap Memory", - "type": "gauge", - "unit": "bytes", - "description": "Number of bytes in free, mapped pages in page heap. These bytes can be used to fulfill allocation requests. They always count towards virtual memory usage, and unless the underlying memory is swapped out by the OS, they also count towards physical memory usage.", - "entity_type": "server" - }, - { - "name": "tcmalloc_pageheap_unmapped_bytes", - "label": "Unmapped Heap Memory", - "type": "gauge", - "unit": "bytes", - "description": "Number of bytes in free, unmapped pages in page heap. These are bytes that have been released back to the OS, possibly by one of the MallocExtension \"Release\" calls. They can be used to fulfill allocation requests, but typically incur a page fault. They always count towards virtual memory usage, and depending on the OS, typically do not count towards physical memory usage.", - "entity_type": "server" - }, - { - "name": "tcmalloc_max_total_thread_cache_bytes", - "label": "Thread Cache Memory Limit", - "type": "gauge", - "unit": "bytes", - "description": "A limit to how much memory TCMalloc dedicates for small objects. Higher numbers trade off more memory use for -- in some situations -- improved efficiency.", - "entity_type": "server" - }, - { - "name": "tcmalloc_current_total_thread_cache_bytes", - "label": "Thread Cache Memory Usage", - "type": "gauge", - "unit": "bytes", - "description": "A measure of some of the memory TCMalloc is using (for small objects).", - "entity_type": "server" - }, - { - "name": "glog_info_messages", - "label": "INFO-level Log Messages", - "type": "counter", - "unit": "messages", - "description": "Number of INFO-level log messages emitted by the application.", - "entity_type": "server" - }, - { - "name": "glog_warning_messages", - "label": "WARNING-level Log Messages", - "type": "counter", - "unit": "messages", - "description": "Number of WARNING-level log messages emitted by the application.", - "entity_type": "server" - }, - { - "name": "glog_error_messages", - "label": "ERROR-level Log Messages", - "type": "counter", - "unit": "messages", - "description": "Number of ERROR-level log messages emitted by the application.", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_server_GenericService_SetFlag", - "label": "kudu.server.GenericService.SetFlag RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.server.GenericService.SetFlag() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_server_GenericService_FlushCoverage", - "label": "kudu.server.GenericService.FlushCoverage RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.server.GenericService.FlushCoverage() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_server_GenericService_ServerClock", - "label": "kudu.server.GenericService.ServerClock RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.server.GenericService.ServerClock() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_server_GenericService_SetServerWallClockForTests", - "label": "kudu.server.GenericService.SetServerWallClockForTests RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.server.GenericService.SetServerWallClockForTests() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_server_GenericService_GetStatus", - "label": "kudu.server.GenericService.GetStatus RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.server.GenericService.GetStatus() RPC requests", - "entity_type": "server" - }, - { - "name": "majority_done_ops", - "label": "Leader Operations Acked by Majority", - "type": "gauge", - "unit": "operations", - "description": "Number of operations in the leader queue ack'd by a majority but not all peers.", - "entity_type": "tablet" - }, - { - "name": "in_progress_ops", - "label": "Leader Operations in Progress", - "type": "gauge", - "unit": "operations", - "description": "Number of operations in the leader queue ack'd by a minority of peers.", - "entity_type": "tablet" - }, - { - "name": "log_cache_num_ops", - "label": "Log Cache Operation Count", - "type": "gauge", - "unit": "operations", - "description": "Number of operations in the log cache.", - "entity_type": "tablet" - }, - { - "name": "log_cache_size", - "label": "Log Cache Memory Usage", - "type": "gauge", - "unit": "bytes", - "description": "Amount of memory in use for caching the local log.", - "entity_type": "tablet" - }, - { - "name": "follower_memory_pressure_rejections", - "label": "Follower Memory Pressure Rejections", - "type": "counter", - "unit": "requests", - "description": "Number of RPC requests rejected due to memory pressure while FOLLOWER.", - "entity_type": "tablet" - }, - { - "name": "raft_term", - "label": "Current Raft Consensus Term", - "type": "gauge", - "unit": "units", - "description": "Current Term of the Raft Consensus algorithm. This number increments each time a leader election is started.", - "entity_type": "tablet" - }, - { - "name": "log_reader_bytes_read", - "label": "Bytes Read From Log", - "type": "counter", - "unit": "bytes", - "description": "Data read from the WAL since tablet start", - "entity_type": "tablet" - }, - { - "name": "log_reader_entries_read", - "label": "Entries Read From Log", - "type": "counter", - "unit": "entries", - "description": "Number of entries read from the WAL since tablet start", - "entity_type": "tablet" - }, - { - "name": "log_reader_read_batch_latency", - "label": "Log Read Latency", - "type": "histogram", - "unit": "bytes", - "description": "Microseconds spent reading log entry batches", - "entity_type": "tablet" - }, - { - "name": "log_bytes_logged", - "label": "Bytes Written to WAL", - "type": "counter", - "unit": "bytes", - "description": "Number of bytes logged since service start", - "entity_type": "tablet" - }, - { - "name": "log_sync_latency", - "label": "Log Sync Latency", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent on synchronizing the log segment file", - "entity_type": "tablet" - }, - { - "name": "log_append_latency", - "label": "Log Append Latency", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent on appending to the log segment file", - "entity_type": "tablet" - }, - { - "name": "log_group_commit_latency", - "label": "Log Group Commit Latency", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent on committing an entire group", - "entity_type": "tablet" - }, - { - "name": "log_roll_latency", - "label": "Log Roll Latency", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent on rolling over to a new log segment file", - "entity_type": "tablet" - }, - { - "name": "log_entry_batches_per_group", - "label": "Log Group Commit Batch Size", - "type": "histogram", - "unit": "requests", - "description": "Number of log entry batches in a group commit group", - "entity_type": "tablet" - }, - { - "name": "hybrid_clock_timestamp", - "label": "Hybrid Clock Timestamp", - "type": "gauge", - "unit": "microseconds", - "description": "Hybrid clock timestamp.", - "entity_type": "server" - }, - { - "name": "hybrid_clock_error", - "label": "Hybrid Clock Error", - "type": "gauge", - "unit": "microseconds", - "description": "Server clock maximum error.", - "entity_type": "server" - }, - { - "name": "logical_clock_timestamp", - "label": "Logical Clock Timestamp", - "type": "gauge", - "unit": "units", - "description": "Logical clock timestamp.", - "entity_type": "server" - }, - { - "name": "code_cache_hits", - "label": "Codegen Cache Hits", - "type": "counter", - "unit": "hits", - "description": "Number of codegen cache hits since start", - "entity_type": "server" - }, - { - "name": "code_cache_queries", - "label": "Codegen Cache Queries", - "type": "counter", - "unit": "queries", - "description": "Number of codegen cache queries (hits + misses) since start", - "entity_type": "server" - }, - { - "name": "log_block_manager_bytes_under_management", - "label": "Bytes Under Management", - "type": "gauge", - "unit": "bytes", - "description": "Number of bytes of data blocks currently under management", - "entity_type": "server" - }, - { - "name": "log_block_manager_blocks_under_management", - "label": "Blocks Under Management", - "type": "gauge", - "unit": "blocks", - "description": "Number of data blocks currently under management", - "entity_type": "server" - }, - { - "name": "log_block_manager_containers", - "label": "Number of Block Containers", - "type": "counter", - "unit": "log block containers", - "description": "Number of log block containers", - "entity_type": "server" - }, - { - "name": "log_block_manager_full_containers", - "label": "Number of Full Block Counters", - "type": "counter", - "unit": "log block containers", - "description": "Number of full log block containers", - "entity_type": "server" - }, - { - "name": "log_block_manager_unavailable_containers", - "label": "Number of Unavailable Log Block Containers", - "type": "counter", - "unit": "log block containers", - "description": "Number of non-full log block containers that are under root paths whose disks are full", - "entity_type": "server" - }, - { - "name": "block_manager_blocks_open_reading", - "label": "Data Blocks Open For Read", - "type": "gauge", - "unit": "blocks", - "description": "Number of data blocks currently open for reading", - "entity_type": "server" - }, - { - "name": "block_manager_blocks_open_writing", - "label": "Data Blocks Open For Write", - "type": "gauge", - "unit": "blocks", - "description": "Number of data blocks currently open for writing", - "entity_type": "server" - }, - { - "name": "block_manager_total_writable_blocks", - "label": "Data Blocks Opened For Write", - "type": "counter", - "unit": "blocks", - "description": "Number of data blocks opened for writing since service start", - "entity_type": "server" - }, - { - "name": "block_manager_total_readable_blocks", - "label": "Data Blocks Opened For Read", - "type": "counter", - "unit": "blocks", - "description": "Number of data blocks opened for reading since service start", - "entity_type": "server" - }, - { - "name": "block_manager_total_bytes_written", - "label": "Block Data Bytes Written", - "type": "counter", - "unit": "bytes", - "description": "Number of bytes of block data written since service start", - "entity_type": "server" - }, - { - "name": "block_manager_total_bytes_read", - "label": "Block Data Bytes Read", - "type": "counter", - "unit": "bytes", - "description": "Number of bytes of block data read since service start", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_Ping", - "label": "kudu.tserver.TabletServerService.Ping RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.Ping() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_Write", - "label": "kudu.tserver.TabletServerService.Write RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.Write() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_Scan", - "label": "kudu.tserver.TabletServerService.Scan RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.Scan() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_ScannerKeepAlive", - "label": "kudu.tserver.TabletServerService.ScannerKeepAlive RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.ScannerKeepAlive() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_ListTablets", - "label": "kudu.tserver.TabletServerService.ListTablets RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.ListTablets() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerService_Checksum", - "label": "kudu.tserver.TabletServerService.Checksum RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerService.Checksum() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletCopyService_BeginTabletCopySession", - "label": "kudu.tserver.TabletCopyService.BeginTabletCopySession RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletCopyService.BeginTabletCopySession() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletCopyService_CheckSessionActive", - "label": "kudu.tserver.TabletCopyService.CheckSessionActive RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletCopyService.CheckSessionActive() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletCopyService_FetchData", - "label": "kudu.tserver.TabletCopyService.FetchData RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletCopyService.FetchData() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletCopyService_EndTabletCopySession", - "label": "kudu.tserver.TabletCopyService.EndTabletCopySession RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletCopyService.EndTabletCopySession() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_UpdateConsensus", - "label": "kudu.consensus.ConsensusService.UpdateConsensus RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.UpdateConsensus() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_RequestConsensusVote", - "label": "kudu.consensus.ConsensusService.RequestConsensusVote RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.RequestConsensusVote() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_ChangeConfig", - "label": "kudu.consensus.ConsensusService.ChangeConfig RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.ChangeConfig() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_GetNodeInstance", - "label": "kudu.consensus.ConsensusService.GetNodeInstance RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.GetNodeInstance() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_RunLeaderElection", - "label": "kudu.consensus.ConsensusService.RunLeaderElection RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.RunLeaderElection() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_LeaderStepDown", - "label": "kudu.consensus.ConsensusService.LeaderStepDown RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.LeaderStepDown() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_GetLastOpId", - "label": "kudu.consensus.ConsensusService.GetLastOpId RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.GetLastOpId() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_GetConsensusState", - "label": "kudu.consensus.ConsensusService.GetConsensusState RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.GetConsensusState() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_consensus_ConsensusService_StartTabletCopy", - "label": "kudu.consensus.ConsensusService.StartTabletCopy RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.consensus.ConsensusService.StartTabletCopy() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerAdminService_CreateTablet", - "label": "kudu.tserver.TabletServerAdminService.CreateTablet RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerAdminService.CreateTablet() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerAdminService_DeleteTablet", - "label": "kudu.tserver.TabletServerAdminService.DeleteTablet RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerAdminService.DeleteTablet() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_tserver_TabletServerAdminService_AlterSchema", - "label": "kudu.tserver.TabletServerAdminService.AlterSchema RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.tserver.TabletServerAdminService.AlterSchema() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_Ping", - "label": "kudu.master.MasterService.Ping RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.Ping() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_TSHeartbeat", - "label": "kudu.master.MasterService.TSHeartbeat RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.TSHeartbeat() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_GetTabletLocations", - "label": "kudu.master.MasterService.GetTabletLocations RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.GetTabletLocations() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_CreateTable", - "label": "kudu.master.MasterService.CreateTable RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.CreateTable() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_IsCreateTableDone", - "label": "kudu.master.MasterService.IsCreateTableDone RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.IsCreateTableDone() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_DeleteTable", - "label": "kudu.master.MasterService.DeleteTable RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.DeleteTable() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_AlterTable", - "label": "kudu.master.MasterService.AlterTable RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.AlterTable() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_IsAlterTableDone", - "label": "kudu.master.MasterService.IsAlterTableDone RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.IsAlterTableDone() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_ListTables", - "label": "kudu.master.MasterService.ListTables RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.ListTables() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_GetTableLocations", - "label": "kudu.master.MasterService.GetTableLocations RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.GetTableLocations() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_GetTableSchema", - "label": "kudu.master.MasterService.GetTableSchema RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.GetTableSchema() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_ListTabletServers", - "label": "kudu.master.MasterService.ListTabletServers RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.ListTabletServers() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_ListMasters", - "label": "kudu.master.MasterService.ListMasters RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.ListMasters() RPC requests", - "entity_type": "server" - }, - { - "name": "handler_latency_kudu_master_MasterService_GetMasterRegistration", - "label": "kudu.master.MasterService.GetMasterRegistration RPC Time", - "type": "histogram", - "unit": "microseconds", - "description": "Microseconds spent handling kudu.master.MasterService.GetMasterRegistration() RPC requests", - "entity_type": "server" - }, - { - "name": "rpc_connections_accepted", - "label": "RPC Connections Accepted", - "type": "counter", - "unit": "connections", - "description": "Number of incoming TCP connections made to the RPC server", - "entity_type": "server" - }, - { - "name": "rpc_incoming_queue_time", - "label": "RPC Queue Time", - "type": "histogram", - "unit": "microseconds", - "description": "Number of microseconds incoming RPC requests spend in the worker queue", - "entity_type": "server" - }, - { - "name": "rpcs_timed_out_in_queue", - "label": "RPC Queue Timeouts", - "type": "counter", - "unit": "requests", - "description": "Number of RPCs whose timeout elapsed while waiting in the service queue, and thus were not processed.", - "entity_type": "server" - }, - { - "name": "rpcs_queue_overflow", - "label": "RPC Queue Overflows", - "type": "counter", - "unit": "requests", - "description": "Number of RPCs dropped because the service queue was full.", - "entity_type": "server" - }, - { - "name": "block_cache_inserts", - "label": "Block Cache Inserts", - "type": "counter", - "unit": "blocks", - "description": "Number of blocks inserted in the cache", - "entity_type": "server" - }, - { - "name": "block_cache_lookups", - "label": "Block Cache Lookups", - "type": "counter", - "unit": "blocks", - "description": "Number of blocks looked up from the cache", - "entity_type": "server" - }, - { - "name": "block_cache_evictions", - "label": "Block Cache Evictions", - "type": "counter", - "unit": "blocks", - "description": "Number of blocks evicted from the cache", - "entity_type": "server" - }, - { - "name": "block_cache_misses", - "label": "Block Cache Misses", - "type": "counter", - "unit": "blocks", - "description": "Number of lookups that didn't yield a block", - "entity_type": "server" - }, - { - "name": "block_cache_misses_caching", - "label": "Block Cache Misses (Caching)", - "type": "counter", - "unit": "blocks", - "description": "Number of lookups that were expecting a block that didn't yield one.Use this number instead of cache_misses when trying to determine how efficient the cache is", - "entity_type": "server" - }, - { - "name": "block_cache_hits", - "label": "Block Cache Hits", - "type": "counter", - "unit": "blocks", - "description": "Number of lookups that found a block", - "entity_type": "server" - }, - { - "name": "block_cache_hits_caching", - "label": "Block Cache Hits (Caching)", - "type": "counter", - "unit": "blocks", - "description": "Number of lookups that were expecting a block that found one.Use this number instead of cache_hits when trying to determine how efficient the cache is", - "entity_type": "server" - }, - { - "name": "block_cache_usage", - "label": "Block Cache Memory Usage", - "type": "gauge", - "unit": "bytes", - "description": "Memory consumed by the block cache", - "entity_type": "server" - }, - { - "name": "spinlock_contention_time", - "label": "Spinlock Contention Time", - "type": "counter", - "unit": "microseconds", - "description": "Amount of time consumed by contention on internal spinlocks since the server started. If this increases rapidly, it may indicate a performance issue in Kudu internals triggered by a particular workload and warrant investigation.", - "entity_type": "server" - }, - { - "name": "tcmalloc_contention_time", - "label": "TCMalloc Contention Time", - "type": "counter", - "unit": "microseconds", - "description": "Amount of time consumed by contention on tcmalloc's locks since the server started. If this increases rapidly, it may indicate a performance issue in Kudu internals triggered by a particular workload and warrant investigation.", - "entity_type": "server" - }, - { - "name": "threads_started", - "label": "Threads Started", - "type": "counter", - "unit": "threads", - "description": "Total number of threads started on this server", - "entity_type": "server" - }, - { - "name": "threads_running", - "label": "Threads Running", - "type": "gauge", - "unit": "threads", - "description": "Current number of running threads", - "entity_type": "server" - }, - { - "name": "cpu_utime", - "label": "User CPU Time", - "type": "counter", - "unit": "milliseconds", - "description": "Total user CPU time of the process", - "entity_type": "server" - }, - { - "name": "cpu_stime", - "label": "System CPU Time", - "type": "counter", - "unit": "milliseconds", - "description": "Total system CPU time of the process", - "entity_type": "server" - }, - { - "name": "voluntary_context_switches", - "label": "Voluntary Context Switches", - "type": "counter", - "unit": "context switches", - "description": "Total voluntary context switches", - "entity_type": "server" - }, - { - "name": "involuntary_context_switches", - "label": "Involuntary Context Switches", - "type": "counter", - "unit": "context switches", - "description": "Total involuntary context switches", - "entity_type": "server" - } - ], - "entities": [ - { - "name": "tablet" - }, - { - "name": "server" - } - ] -}
