This page describes the mapping between the metrics provided by Prometheus and the Akamas metrics for each supported component type.
Component Type | Notes |
---|---|
Component metric | Prometheus query |
---|---|
The following metrics are configured to work for Kubernetes. When using the Docker optimization pack, override the required metrics in the telemetry instance configuration.
Component metric | Prometheus query |
---|---|
Component metric | Prometheus query |
---|---|
Component metric | Prometheus metric |
---|---|
Component metric | Prometheus query |
---|---|
Component metric | Prometheus query |
---|---|
Component metric | Prometheus query |
---|---|
Component metric | Prometheus query |
---|---|
Component metric | Dynatrace metric | Scale | Aggregate multiple Dynatrace entities | Multiple entities aggregation |
---|---|---|---|---|
Component metric | Dynatrace metric | Default Value | Scale |
---|---|---|---|
Component Metric | Dynatrace Metric | Scale | Aggregate multiple Dynatrace entities | Multiple entities aggregation |
---|---|---|---|---|
Component Metric | Dynatrace Metric | Default Value | Aggregate multiple Dynatrace entities | Multiple entities aggregation |
---|---|---|---|---|
Component Metric | Dynatrace Metric | Scale | Aggregate multiple Dynatrace entities | Multiple entities aggregation |
---|---|---|---|---|
The default metrics in this table are based on cAdvisor and kube-state-metrics.
The default metrics in this table are based on cAdvisor and kube-state-metrics.
The default metrics in this table are based on the CloudWatch Exporter, configured with the attached custom configuration file
The default metrics in this table are based on the OracleDB Exporter, extending the default queries with the attached custom configuration file
The default metrics in this table are based on the Prometheus Listener for JMeter.
cpu_load_avg
node_load1{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
cpu_num
count(node_cpu_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$", mode="system" %FILTERS%})
cpu_used
sum by (job) (sum by (cpu, job) (rate(node_cpu_seconds_total{instance=~"$INSTANCE$", mode=~"user|system|softirq|irq|nice", job=~"$JOB$" %FILTERS%}[$DURATION$])))
cpu_util
avg by (job) (sum by (cpu, job) (rate(node_cpu_seconds_total{instance=~"$INSTANCE$", mode=~"user|system|softirq|irq|nice", job=~"$JOB$" %FILTERS%}[$DURATION$])))
cpu_util_details
avg by (instance, cpu, mode, job) (sum by (instance, cpu, mode, job) (rate(node_cpu_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])))
disk_io_inflight_details
node_disk_io_now{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
disk_iops
sum by (instance, job) (rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) + sum by (instance, job) (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_iops_details
sum by (instance, device, job) (rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_iops_details
sum by (instance, device, job) (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_iops_details
sum by (instance, device, job) (rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) + sum by (instance, device, job) (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_iops_reads
sum by (instance, job) (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_iops_writes
sum by (instance, job) (rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_read_bytes
sum by (instance, device, job) (rate(node_disk_read_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_read_bytes_details
sum by (instance, device, job) (rate(node_disk_read_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_read_write_bytes
sum by (instance, device, job) (rate(node_disk_written_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_read_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_response_time
avg by (instance, job) ((rate(node_disk_read_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_write_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) / (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) > 0 ))
disk_response_time_details
avg by (instance, device, job) ((rate(node_disk_read_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_write_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) / ((rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) > 0))
disk_response_time_read
rate(node_disk_read_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])/ rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
disk_response_time_worst
max by (instance, job) ((rate(node_disk_read_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_write_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])) / (rate(node_disk_reads_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) + rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]) > 0 ))
disk_response_time_write
rate(node_disk_write_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])/ rate(node_disk_writes_completed_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
disk_swap_used
node_memory_SwapTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_SwapFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
disk_swap_util
((node_memory_SwapTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_SwapFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}) / (node_memory_SwapTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} > 0)) or ((node_memory_SwapTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_SwapFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}))
disk_util_details
rate(node_disk_io_time_seconds_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
disk_write_bytes
sum by (instance, device, job) (rate(node_disk_written_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
disk_write_bytes_details
sum by (instance, device, job) (rate(node_disk_written_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$]))
filesystem_size
node_filesystem_size_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
filesystem_used
node_filesystem_size_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_filesystem_free_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
filesystem_util
((node_filesystem_size_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_filesystem_free_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}) / node_filesystem_size_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_fault_major
rate(node_vmstat_pgmajfault{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
mem_fault_minor
rate(node_vmstat_pgfault{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
mem_swapins
rate(node_vmstat_pswpin{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
mem_swapouts
rate(node_vmstat_pswpout{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
mem_total
node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
mem_used
(node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_MemFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_util
(node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_MemFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}) / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
mem_util_details
(node_memory_Active_file_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_util_details
(node_memory_Active_anon_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_util_details
(node_memory_Inactive_file_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_util_details
(node_memory_Inactive_anon_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%})
mem_util_nocache
(node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_Buffers_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_Cached_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%} - node_memory_MemFree_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}) / node_memory_MemTotal_bytes{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
network_in_bytes_details
rate(node_network_receive_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
network_out_bytes_details
rate(node_network_transmit_bytes_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
network_tcp_retrans
rate(node_netstat_Tcp_RetransSegs{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
os_context_switch
rate(node_context_switches_total{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}[$DURATION$])
proc_blocked
node_procs_blocked{instance=~"$INSTANCE$", job=~"$JOB$" %FILTERS%}
jvm_heap_size
avg(jvm_memory_bytes_max{area="heap" %FILTERS%})
jvm_heap_committed
avg(jvm_memory_bytes_committed{area="heap" %FILTERS%})
jvm_heap_used
avg(jvm_memory_bytes_used{area="heap" %FILTERS%})
jvm_off_heap_used
avg(jvm_memory_bytes_used{area="nonheap" %FILTERS%})
jvm_heap_util
avg(jvm_memory_bytes_used{area="heap" %FILTERS%} / jvm_memory_bytes_max{area="heap" %FILTERS%})
jvm_memory_used
avg(sum by (instance) (jvm_memory_bytes_used))
jvm_heap_young_gen_size
avg(sum by (instance) (jvm_memory_pool_bytes_max{pool=~".*Eden Space|.*Survivor Space" %FILTERS%}))
jvm_heap_young_gen_used
avg(sum by (instance) (jvm_memory_pool_bytes_used{pool=~".*Eden Space|.*Survivor Space" %FILTERS%}))
jvm_heap_old_gen_size
avg(sum by (instance) (jvm_memory_pool_bytes_max{pool=~".*Tenured Gen|.*Old Gen" %FILTERS%}))
jvm_heap_old_gen_used
avg(sum by (instance) (jvm_memory_pool_bytes_used{pool=~".*Tenured Gen|.*Old Gen" %FILTERS%}))
jvm_memory_buffer_pool_used
avg(sum by (instance) (jvm_buffer_pool_used_bytes))
jvm_gc_time
avg(sum by (instance) (rate(jvm_gc_collection_seconds_sum[$DURATION$])))
jvm_gc_count
avg(sum by (instance) (rate(jvm_gc_collection_seconds_count[$DURATION$])))
jvm_gc_duration
(sum(rate(jvm_gc_collection_seconds_sum[$DURATION$])) / sum(rate(jvm_gc_collection_seconds_count[$DURATION$])) > 0 ) or sum(rate(jvm_gc_collection_seconds_count[$DURATION$]))
jvm_threads_current
avg(jvm_threads_current)
jvm_threads_deadlocked
avg(jvm_threads_deadlocked)
transactions_response_time
avg(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_max
max(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_min
min(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_p50
ResponseTime{quantile="0.5", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p85
ResponseTime{quantile="0.85", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p90
ResponseTime{quantile="0.9", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p99
ResponseTime{quantile="0.99", code="200", job=~"$JOB$" %FILTERS%}
transactions_throughput
sum(rate(Ratio_success{job=~"$JOB$" %FILTERS%}[$DURATION$]))
transactions_error_throughput
sum(rate(Ratio_failure{job=~"$JOB$" %FILTERS%}[$DURATION$]))
transactions_error_rate
(avg(rate(Ratio_failure{job=~"$JOB$" %FILTERS%}[$DURATION$]))/avg(rate(Ratio_total{job=~"$JOB$" %FILTERS%}[$DURATION$])))*100
users
sum(jmeter_threads{state="active", job=~"$JOB$" %FILTERS%})
k8s_workload_desired_pods
kube_deployment_spec_replicas{namespace=~"$NAMESPACE$", deployment=~"$DEPLOYMENT$" %FILTERS%}
k8s_workload_running_pods
kube_deployment_status_replicas_available{namespace=~"$NAMESPACE$", deployment=~"$DEPLOYMENT$" %FILTERS%}
k8s_workload_ready_pods
kube_deployment_status_replicas_ready{namespace=~"$NAMESPACE$", deployment=~"$DEPLOYMENT$" %FILTERS%}
k8s_workload_cpu_used
1e3 * sum(rate(container_cpu_usage_seconds_total{container="", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%}[$DURATION$]))
k8s_workload_memory_used
sum(last_over_time(container_memory_usage_bytes{container="", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%}[$DURATION$]))
k8s_workload_cpu_request
1e3 * sum(kube_pod_container_resource_requests{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%})
k8s_workload_cpu_limit
1e3 * sum(kube_pod_container_resource_limits{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%})
k8s_workload_memory_request
sum(kube_pod_container_resource_requests{resource="memory", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%})
k8s_workload_memory_limit
sum(kube_pod_container_resource_limits{resource="memory", namespace=~"$NAMESPACE$", pod=~"$DEPLOYMENT$.*" %FILTERS%})
k8s_pod_cpu_used
1e3 * avg(rate(container_cpu_usage_seconds_total{container="", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}[$DURATION$]))
k8s_pod_cpu_request
1e3 * avg(sum by (pod) (kube_pod_container_resource_requests{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}))
k8s_pod_cpu_limit
1e3 * avg(sum by (pod) (kube_pod_container_resource_limits{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}))
k8s_pod_memory_used
avg(last_over_time(container_memory_usage_bytes{container="", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}[$DURATION$]))
k8s_pod_memory_working_set
avg(container_memory_working_set_bytes{container="", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%})
k8s_pod_memory_request
avg(sum by (pod) (kube_pod_container_resource_requests{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}))
k8s_pod_memory_limit
avg(sum by (pod) (kube_pod_container_resource_limits{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}))
k8s_pod_restarts
avg(sum by (pod) (increase(kube_pod_container_status_restarts_total{namespace=~"$NAMESPACE$", pod=~"$POD$" %FILTERS%}[$DURATION$])))
container_cpu_used
1e3 * avg(rate(container_cpu_usage_seconds_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_cpu_used_max
1e3 * max(rate(container_cpu_usage_seconds_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_cpu_util
avg(rate(container_cpu_usage_seconds_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]) / on (pod) group_left kube_pod_container_resource_limits{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_cpu_util_max
max(rate(container_cpu_usage_seconds_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]) / on (pod) group_left kube_pod_container_resource_limits{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_cpu_throttled_millicores
1e3 * avg(rate(container_cpu_cfs_throttled_seconds_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_cpu_throttle_time
avg(last_over_time(container_cpu_cfs_throttled_periods_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]) / container_cpu_cfs_periods_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_memory_used
avg(last_over_time(container_memory_working_set_bytes{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_memory_used_max
max(last_over_time(container_memory_working_set_bytes{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_memory_util
avg(last_over_time(container_memory_working_set_bytes{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]) / on (pod) group_left kube_pod_container_resource_limits{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_memory_util_max
max(last_over_time(container_memory_working_set_bytes{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]) / on (pod) group_left kube_pod_container_resource_limits{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_memory_resident_set_used
avg(last_over_time(container_memory_rss{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_memory_cache
avg(last_over_time(container_memory_cache{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_cpu_request
1e3 * avg(kube_pod_container_resource_requests{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_cpu_limit
1e3 * avg(kube_pod_container_resource_limits{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_memory_request
avg(kube_pod_container_resource_requests{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_memory_limit
avg(kube_pod_container_resource_limits{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})
container_restarts
avg(increase(kube_pod_container_status_restarts_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
container_oom_kills_count
avg(increase(container_oom_events_total{namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%}[$DURATION$]))
cost
sum(kube_pod_container_resource_requests{resource="cpu", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})*29 + sum(kube_pod_container_resource_requests{resource="memory", namespace=~"$NAMESPACE$", pod=~"$POD$", container=~"$CONTAINER$" %FILTERS%})/1024/1024/1024*8
cpu_util
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() aws_ec2_cpuutilization_average{job='$JOB$'}/100
network_in_bytes_details
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_network_in_sum{job='$JOB$'} * count_over_time(aws_ec2_network_in_sum{job='$JOB$'}[300s]) / 300)
network_out_bytes_details
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_network_out_sum{job='$JOB$'} * count_over_time(aws_ec2_network_out_sum{job='$JOB$'}[300s]) / 300)
aws_ec2_credits_cpu_available
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() aws_ec2_cpucredit_balance_average{job='$JOB$'}
aws_ec2_credits_cpu_used
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() aws_ec2_cpucredit_usage_sum{job='$JOB$'}
disk_read_bytes
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_ebsread_bytes_sum{job='$JOB$'} * count_over_time(aws_ec2_ebsread_bytes_sum{job='$JOB$'}[300s]) / 300)
disk_write_bytes
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_ebswrite_bytes_sum{job='$JOB$'} * count_over_time(aws_ec2_ebswrite_bytes_sum{job='$JOB$'}[300s]) / 300)
aws_ec2_disk_iops
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() ((aws_ec2_ebsread_ops_sum{job='$JOB$'} + aws_ec2_ebswrite_ops_sum{job='$JOB$'}) * count_over_time(aws_ec2_ebsread_ops_sum{job='$JOB$'}[300s])/300)
aws_ec2_disk_iops_reads
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_ebsread_ops_sum{job='$JOB$'} * count_over_time(aws_ec2_ebsread_ops_sum{job='$JOB$'}[300s]) / 300)
aws_ec2_disk_iops_writes
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() (aws_ec2_ebswrite_ops_sum{job='$JOB$'} * count_over_time(aws_ec2_ebswrite_ops_sum{job='$JOB$'}[300s]) / 300)
aws_ec2_ebs_credits_io_util
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() aws_ec2_ebsiobalance__average{job='$JOB$'} / 100
aws_ec2_ebs_credits_bytes_util
aws_resource_info{instance='$INSTANCE$', job='$JOB$' %FILTERS%} * on(instance_id) group_left() aws_ec2_ebsbyte_balance__average{job='$JOB$'} / 100
oracle_sga_total_size
oracledb_memory_size{component='SGA Target', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sga_free_size
oracledb_memory_size{component='Free SGA Memory Available', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sga_max_size
oracledb_memory_size{component='Maximum SGA Size', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_pga_target_size
oracledb_memory_size{component='PGA Target', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_redo_buffers_size
oracledb_memory_size{component='Redo Buffers', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_buffer_cache_size
oracledb_memory_size{component='DEFAULT buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_2k_buffer_cache_size
oracledb_memory_size{component='DEFAULT 2K buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_4k_buffer_cache_size
oracledb_memory_size{component='DEFAULT 4K buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_8k_buffer_cache_size
oracledb_memory_size{component='DEFAULT 8K buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_16k_buffer_cache_size
oracledb_memory_size{component='DEFAULT 16K buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_default_32k_buffer_cache_size
oracledb_memory_size{component='DEFAULT 32K buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_keep_buffer_cache_size
oracledb_memory_size{component='KEEP buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_recycle_buffer_cache_size
oracledb_memory_size{component='RECYCLE buffer cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_asm_buffer_cache_size
oracledb_memory_size{component='ASM Buffer Cache', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_shared_io_pool_size
oracledb_memory_size{component='Shared IO Pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_java_pool_size
oracledb_memory_size{component='java pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_large_pool_size
oracledb_memory_size{component='large pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_shared_pool_size
oracledb_memory_size{component='shared pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_streams_pool_size
oracledb_memory_size{component='streams pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sessions_active_user
oracledb_sessions_value{type='USER', status='ACTIVE', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sessions_inactive_user
oracledb_sessions_value{type='USER', status='INACTIVE', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sessions_active_background
oracledb_sessions_value{type='BACKGROUND', status='ACTIVE', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_sessions_inactive_background
oracledb_sessions_value{type='BACKGROUND', status='INACTIVE', instance='$INSTANCE$', job='$JOB$' %FILTERS%}
oracle_buffer_cache_hit_ratio
https://docs.oracle.com/database/121/TGDBA/tune_buffer_cache.htm#TGDBA533
oracle_redo_log_space_requests
rate(oracledb_activity_redo_log_space_requests{instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])
oracle_wait_event_log_file_sync
rate(oracledb_system_event_time_waited{event='log file sync', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_log_file_parallel_write
rate(oracledb_system_event_time_waited{event='log file parallel write', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_log_file_sequential_read
rate(oracledb_system_event_time_waited{event='log file sequential read', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_enq_tx_contention
rate(oracledb_system_event_time_waited{event='enq: TX - contention', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_enq_tx_row_lock_contention
rate(oracledb_system_event_time_waited{event='enq: TX - row lock contention', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_latch_row_cache_objects
rate(oracledb_system_event_time_waited{event='latch: row cache objects', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_latch_shared_pool
rate(oracledb_system_event_time_waited{event='latch: shared pool', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_resmgr_cpu_quantum
rate(oracledb_system_event_time_waited{event='resmgr:cpu quantum', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_sql_net_message_from_client
rate(oracledb_system_event_time_waited{event='SQL*Net message from client', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_rdbms_ipc_message
rate(oracledb_system_event_time_waited{event='rdbms ipc message', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_db_file_sequential_read
rate(oracledb_system_event_time_waited{event='db file sequential read', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_log_file_switch_checkpoint_incomplete
rate(oracledb_system_event_time_waited{event='log file switch (checkpoint incomplete)', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_row_cache_lock
rate(oracledb_system_event_time_waited{event='row cache lock', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_buffer_busy_waits
rate(oracledb_system_event_time_waited{event='buffer busy waits', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_event_db_file_async_io_submit
rate(oracledb_system_event_time_waited{event='db file async I/O submit', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$])/100
oracle_wait_class_commit
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Commit', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_concurrency
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Concurrency', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_system_io
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='System I/O', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_user_io
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='User I/O', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_other
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Other', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_scheduler
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Scheduler', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_idle
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Idle', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_application
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Application', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_network
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Network', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
oracle_wait_class_configuration
sum without(event) (rate(oracledb_system_event_time_waited{wait_class='Configuration', instance='$INSTANCE$', job='$JOB$' %FILTERS%}[$DURATION$]))/100
transactions_response_time
avg(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_max
max(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_min
min(rate(ResponseTime_sum{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])/rate(ResponseTime_count{code="200", job=~"$JOB$" %FILTERS%}[$DURATION$])>0)
transactions_response_time_p50
ResponseTime{quantile="0.5", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p85
ResponseTime{quantile="0.85", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p90
ResponseTime{quantile="0.9", code="200", job=~"$JOB$" %FILTERS%}
transactions_response_time_p99
ResponseTime{quantile="0.99", code="200", job=~"$JOB$" %FILTERS%}
transactions_throughput
sum(rate(Ratio_success{job=~"$JOB$" %FILTERS%}[$DURATION$]))
transactions_error_throughput
sum(rate(Ratio_failure{job=~"$JOB$" %FILTERS%}[$DURATION$]))
transactions_error_rate
(avg(rate(Ratio_failure{job=~"$JOB$" %FILTERS%}[$DURATION$]))/avg(rate(Ratio_total{job=~"$JOB$" %FILTERS%}[$DURATION$])))*100
users
sum(jmeter_threads{state="active", job=~"$JOB$" %FILTERS%})
cpu_load_avg
builtin:host.cpu.load
cpu_num
N/A
cpu_util
builtin:host.cpu.usage
0.01
cpu_util_details
mode:
idle
user
system
iowait
builtin:host.cpu.idle (mode=idle)
builtin:host.cpu.system (mode=system)
builtin:host.cpu.user (mode=user)
builtin:host.cpu.iowait (mode=iowait)
0.01
mem_util
N/A
mem_util_nocache
builtin:host.mem.usage
0.01
mem_util_details
N/A
mem_used
N/A
mem_used_nocache
builtin:host.mem.used
mem_total
N/A
mem_fault
builtin:host.mem.avail.pfps
mem_fault_minor
N/A
mem_fault_major
N/A
mem_swapins
N/A
mem_swapouts
N/A
disk_swap_util
N/A
disk_swap_used
N/A
filesystem_util
Disk
builtin:host.disk.usedPct
filesystem_used
N/A
filesystem_size
N/A
disk_util_details
Disk
builtin:host.disk.free
0.01
disk_iops_writes
N/A
disk_iops_reads
N/A
disk_iops
N/A
disk_iops_details
N/A
disk_response_time_worst
N/A
disk_response_time
N/A
disk_io_inflight_details
N/A
0.01
disk_write_bytes
N/A
disk_read_bytes
N/A
disk_read_write_bytes
N/A
disk_write_bytes_details
Disk
builtin:host.disk.bytesWritten
disk_read_bytes_details
Disk
builtin:host.disk.bytesRead
disk_response_time_details
Disk
builtin:host.disk.readTime
0.001
proc_blocked
N/A
os_context_switch
N/A
network_tcp_retrans
N/A
network_in_bytes_details
Network interface
builtin:host.net.nic.bytesRx
network_out_bytes_details
Network interface
builtin:host.net.nic.bytesTx
jvm_gc_count
builtin:tech.jvm.memory.pool.collectionCount:merge(poolname,gcname):sum
1/60
Yes
avg
jvm_gc_time
builtin:tech.jvm.memory.gc.suspensionTime
0.01
Yes
avg
jvm_heap_size
builtin:tech.jvm.memory.runtime.max
Yes
avg
jvm_heap_committed
Yes
avg
jvm_heap_used
Yes
avg
jvm_off_heap_used
Yes
avg
jvm_heap_old_gen_size
Yes
avg
jvm_heap_old_gen_used
Yes
avg
jvm_heap_young_gen_size
Yes
avg
jvm_heap_young_gen_used
Yes
avg
jvm_threads_current
builtin:tech.jvm.threads.count
Yes
avg
requests_response_time
builtin:service.response.time
0
0.000001
requests_response_time_min
builtin:service.response.time:min
0
0.000001
requests_response_time_max
builtin:service.response.time:max
0
0.000001
requests_throughput
builtin:service.errors.total.successCount
0
1/60
requests_error_rate
builtin:service.errors.total.rate
0
0.01
requests_response_time_p50
builtin:service.response.time:percentile(50)
0
0.001
requests_response_time_p85
builtin:service.response.time:percentile(85)
0
0.001
requests_response_time_p90
builtin:service.response.time:percentile(90)
0
0.001
requests_response_time_p95
builtin:service.response.time:percentile(95)
0
0.001
requests_response_time_p99
builtin:service.response.time:percentile(99)
0
0.001
container_cpu_limit
builtin:containers.cpu.limit
Yes
avg
container_cpu_util
builtin:containers.cpu.usagePercent
0.01
Yes
avg
container_cpu_util_max
builtin:containers.cpu.usagePercent
0.01
Yes
max
container_cpu_throttled_millicores
builtin:containers.cpu.throttledMilliCores
Yes
avg
container_cpu_throttle_time
builtin:containers.cpu.throttledTime
1 / 10^9 / 60
Yes
avg
container_cpu_used
builtin:containers.cpu.usageMilliCores
Yes
avg
container_cpu_used_max
builtin:containers.cpu.usageMilliCores
Yes
max
container_memory_limit
builtin:containers.memory.limitBytes
Yes
avg
container_memory_used
builtin:containers.memory.residentSetBytes
Yes
avg
container_memory_used_max
builtin:containers.memory.residentSetBytes
Yes
max
container_memory_util
builtin:containers.memory.usagePercent
0.01
Yes
avg
container_memory_util_max
builtin:containers.memory.usagePercent
0.01
Yes
max
container_oom_kills_count
builtin:containers.memory.outOfMemoryKills
1/60
Yes
avg
k8s_pod_cpu_limit
builtin:cloud.kubernetes.pod.cpuLimits
Yes
avg
k8s_pod_cpu_request
builtin:cloud.kubernetes.pod.cpuRequests
Yes
avg
k8s_pod_memory_limit
builtin:cloud.kubernetes.pod.memoryLimits
Yes
avg
k8s_pod_memory_request
builtin:cloud.kubernetes.pod.memoryRequests
Yes
avg
k8s_pod_restarts
builtin:kubernetes.container.restarts:merge(k8s.container.name):sum
0
Yes
avg
k8s_workload_desired_pods
builtin:kubernetes.workload.pods_desired
No
k8s_workload_running_pods
builtin:kubernetes.pods:filter(eq(pod_phase,Running))
No
k8s_workload_cpu_limit
builtin:kubernetes.workload.limits_cpu
No
k8s_workload_cpu_request
builtin:kubernetes.workload.requests_cpu
No
k8s_workload_memory_limit
builtin:kubernetes.workload.limits_memory
No
k8s_workload_memory_request
builtin:kubernetes.workload.requests_memory
No
k8s_workload_cpu_used
builtin:containers.cpu.usageMilliCores
Yes
sum
k8s_workload_memory_used
builtin:containers.memory.residentSetBytes
Yes
sum
users
The average number of users active in a specific timeframe.
transactions_throughput
The average throughput of LoadRunner transaction (requests), per second
transactions_response_time_min
The min response time of LoadRunner transaction (requests)
transactions_response_time_max
The max response time of LoadRunner transaction (requests)
transactions_response_time
The response time of LoadRunner transaction (requests)
transactions_response_time_p50
The 50th percentile (weighted median) of the response time of LoadRunner transaction (requests)
transactions_response_time_p85
The 85th percentile of the response time of LoadRunner transaction (requests)
transactions_response_time_p95
The 95th percentile of the response time of LoadRunner transaction (requests)
transactions_response_time_p99
The 99th percentile of the response time of LoadRunner transaction (requests)
pages_throughput
The average throughput of LoadRunner pages (transactions breakdown, first level), per second
pages_response_time_min
The min response time of LoadRunner pages (transactions breakdown, first level)
pages_response_time_max
The max response time of LoadRunner pages (transactions breakdown, first level)
pages_response_time
The response time of LoadRunner pages (transactions breakdown, first level)
pages_response_time_p50
The 50th percentile (weighted median) of the response time of LoadRunner transaction breakdown, first level (pages)
pages_response_time_p85
The 85th percentile of the response time of LoadRunner transaction breakdown, first level (pages)
pages_response_time_p95
The 95th percentile of the response time of LoadRunner transaction breakdown, first level (pages)
pages_response_time_p99
The 99th percentile of the response time of LoadRunner transaction breakdown, first level (pages)
requests_throughput
The average throughput of LoadRunner requests, per second
requests_response_time_min
The min response time of LoadRunner requests
requests_response_time_max
The max response time of LoadRunner requests
requests_response_time
The response time of LoadRunner requests
requests_response_time_p50
The 50th percentile (weighted median) of the response time of LoadRunner requests
requests_response_time_p85
The 85th percentile of the response time of LoadRunner transaction breakdown, second level (requests)
requests_response_time_p95
The 95th percentile of the response time of LoadRunner transaction breakdown, second level (requests)
requests_response_time_p99
The 99th percentile of the response time of LoadRunner transaction breakdown, second level (requests)
requests_error_throughput
The number of requests (transactions breakdown, second level) flagged as error by LoadRunner, per second
transactions_response_time
transactions
AVG_DURATION
pages_response_time
pages
AVG_DURATION
requests_response_time
requests
AVG_DURATION
transactions_response_time_min
transactions
MIN_DURATION
pages_response_time_min
pages
MIN_DURATION
requests_response_time_min
requests
MIN_DURATION
transactions_response_time_max
transactions
MAX_DURATION
pages_response_time_max
pages
MAX_DURATION
requests_response_time_max
requests
MAX_DURATION
transactions_throughput
transactions
THROUGHPUT
pages_throughput
pages
THROUGHPUT
requests_throughput
requests
THROUGHPUT
transactions_error_rate
transactions
ERROR_RATE
pages_error_rate
pages
ERROR_RATE
requests_error_rate
requests
ERROR_RATE
transactions_error_throughput
transactions
ERRORS_PER_SECOND
pages_error_throughput
pages
ERRORS_PER_SECOND
requests_error_throughput
requests
ERRORS_PER_SECOND
users
Controller/User Load
AVG
This section documents the mapping between the metrics provided by Telemetry Providers and the Akamas metrics for each supported component type.
Telemetry Provider | Telemetry Provider metric mapping |
---|---|
No predefined mapping, as the CSV provider is extensible
spark_duration
job
/{appId}/1/jobs/{jobId}
.duration
spark_completed_tasks
job
/{appId}/1/jobs/{jobId}
.numCompletedTasks
spark_active_tasks
job
/{appId}/1/jobs/{jobId}
.numActiveTasks
spark_skipped_tasks
job
/{appId}/1/jobs/{jobId}
.numSkippedTasks
spark_failed_tasks
job
/{appId}/1/jobs/{jobId}
.numFailedTasks
spark_killed_tasks
job
/{appId}/1/jobs/{jobId}
.numKilledTasks
spark_completed_stages
job
/{appId}/1/jobs/{jobId}
.numCompletedStages
spark_failed_stages
job
/{appId}/1/jobs/{jobId}
.numFailedStages
spark_skipped_stages
job
/{appId}/1/jobs/{jobId}
.numSkippedStages
spark_active_stages
job
/{appId}/1/jobs/{jobId}
.numActiveStages
spark_duration
stage
/{appId}/1/stages/{stageId}
.getDuration
spark_task_stage_executor_run_time
stage
/{appId}/1/stages/{stageId}
.getExecutorRunTime
spark_task_stage_executor_cpu_time
stage
/{appId}/1/stages/{stageId}
.getExecutorCpuTime
spark_active_tasks
stage
/{appId}/1/stages/{stageId}
.getNumActiveTasks
spark_completed_tasks
stage
/{appId}/1/stages/{stageId}
.getNumCompleteTasks
spark_failed_tasks
stage
/{appId}/1/stages/{stageId}
.getNumFailedTasks
spark_killed_tasks
stage
/{appId}/1/stages/{stageId}
.getNumKilledTasks
spark_task_stage_input_bytes_read
stage
/{appId}/1/stages/{stageId}
.getInputBytes
spark_task_stage_input_records_read
stage
/{appId}/1/stages/{stageId}
.getInputRecords
spark_task_stage_output_bytes_written
stage
/{appId}/1/stages/{stageId}
.getOutputBytes
spark_task_stage_output_records_written
stage
/{appId}/1/stages/{stageId}
.getOutputRecords
spark_stage_shuffle_read_bytes
stage
/{appId}/1/stages/{stageId}
.getShuffleReadBytes
spark_task_stage_shuffle_read_records
stage
/{appId}/1/stages/{stageId}
.getShuffleReadRecords
spark_task_stage_shuffle_write_bytes
stage
/{appId}/1/stages/{stageId}
.getShuffleWriteBytes
spark_task_stage_shuffle_write_records
stage
/{appId}/1/stages/{stageId}
.getShuffleWriteRecords
spark_task_stage_memory_bytes_spilled
stage
/{appId}/1/stages/{stageId}
.getMemoryBytesSpilled
spark_task_stage_disk_bytes_spilled
stage
/{appId}/1/stages/{stageId}
.getDiskBytesSpilled
spark_duration
task
/{appId}/1/stages/{stageId}
.tasks[].duration
spark_task_executor_deserialize_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.executorDeserializeTime
spark_task_executor_deserialize_cpu_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.executorDeserializeCpuTime
spark_task_stage_executor_run_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.executorRunTime
spark_task_stage_executor_cpu_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.executorCpuTime
spark_task_result_size
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.resultSize
spark_task_jvm_gc_duration
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.jvmGcTime
spark_task_result_serialization_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.resultSerializationTime
spark_task_stage_memory_bytes_spilled
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.memoryBytesSpilled
spark_task_stage_disk_bytes_spilled
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.diskBytesSpilled
spark_task_peak_execution_memory
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.peakExecutionMemory
spark_task_stage_input_bytes_read
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.inputMetrics.bytesRead
spark_task_stage_input_records_read
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.inputMetrics.recordsRead
spark_task_stage_output_bytes_written
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.outputMetrics.bytesWritten
spark_task_stage_output_records_written
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.outputMetrics.recordsWritten
spark_task_shuffle_read_remote_blocks_fetched
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.remoteBlocksFetched
spark_task_shuffle_read_local_blocks_fetched
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.localBlocksFetched
spark_task_shuffle_read_fetch_wait_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.fetchWaitTime
spark_task_shuffle_read_remote_bytes
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.remoteBytesRead
spark_task_shuffle_read_remote_bytes_to_disk
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.remoteBytesReadToDisk
spark_task_shuffle_read_local_bytes
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.localBytesRead
spark_task_stage_shuffle_read_records
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleReadMetrics.recordsRead
spark_task_stage_shuffle_write_bytes
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleWriteMetrics.bytesWritten
spark_task_shuffle_write_time
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleWriteMetrics.writeTime
spark_task_stage_shuffle_write_records
task
/{appId}/1/stages/{stageId}
.tasks[].taskMetrics.shuffleWriteMetrics.recordsWritten
spark_executor_rdd_blocks
executor
/{appId}/1/allexecutors
select(.id!='driver') | .rddBlocks
spark_executor_mem_used
executor
/{appId}/1/allexecutors
select(.id!='driver') | .memoryUsed
spark_executor_disk_used
executor
/{appId}/1/allexecutors
select(.id!='driver') | .diskUsed
spark_executor_cores
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalCores
spark_active_tasks
executor
/{appId}/1/allexecutors
select(.id!='driver') | .activeTasks
spark_failed_tasks
executor
/{appId}/1/allexecutors
select(.id!='driver') | .failedTasks
spark_completed_tasks
executor
/{appId}/1/allexecutors
select(.id!='driver') | .completedTasks
spark_executor_total_tasks
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalTasks
spark_executor_total_duration
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalDuration
spark_executor_total_jvm_gc_duration
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalGCTime
spark_executor_total_input_bytes
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalInputBytes
spark_executor_total_shuffle_read
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalShuffleRead
spark_executor_total_shuffle_write
executor
/{appId}/1/allexecutors
select(.id!='driver') | .totalShuffleWrite
spark_executor_max_mem_used
executor
/{appId}/1/allexecutors
select(.id!='driver') | .maxMemory
spark_executor_used_on_heap_storage_memory
executor
/{appId}/1/allexecutors
select(.id!='driver') | .memoryMetrics.usedOnHeapStorageMemory
spark_executor_used_off_heap_storage_memory
executor
/{appId}/1/allexecutors
select(.id!='driver') | .memoryMetrics.usedOffHeapStorageMemory
spark_executor_total_on_heap_storage_memory
executor
/{appId}/1/allexecutors
select(.id!='driver') | .memoryMetrics.totalOnHeapStorageMemory
spark_executor_total_off_heap_storage_memory
executor
/{appId}/1/allexecutors
select(.id!='driver') | .memoryMetrics.totalOffHeapStorageMemory
spark_driver_rdd_blocks
driver
/{appId}/1/allexecutors
select(.id=='driver') | .rddBlocks
spark_driver_mem_used
driver
/{appId}/1/allexecutors
select(.id=='driver') | .memoryUsed
spark_driver_disk_used
driver
/{appId}/1/allexecutors
select(.id=='driver') | .diskUsed
spark_driver_cores
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalCores
spark_driver_total_duration
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalDuration
spark_driver_total_jvm_gc_duration
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalGCTime
spark_driver_total_input_bytes
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalInputBytes
spark_driver_total_shuffle_read
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalShuffleRead
spark_driver_total_shuffle_write
driver
/{appId}/1/allexecutors
select(.id=='driver') | .totalShuffleWrite
spark_driver_max_mem_used
driver
/{appId}/1/allexecutors
select(.id=='driver') | .maxMemory
spark_driver_used_on_heap_storage_memory
driver
/{appId}/1/allexecutors
select(.id=='driver') | .memoryMetrics.usedOnHeapStorageMemory
spark_driver_used_off_heap_storage_memory
driver
/{appId}/1/allexecutors
select(.id=='driver') | .memoryMetrics.usedOffHeapStorageMemory
spark_driver_total_on_heap_storage_memory
driver
/{appId}/1/allexecutors
select(.id=='driver') | .memoryMetrics.totalOnHeapStorageMemory
spark_driver_total_off_heap_storage_memory
driver
/{appId}/1/allexecutors
select(.id=='driver') | .memoryMetrics.totalOffHeapStorageMemory