# translator/tocwconfig/sampleConfig/kubernetes_on_prem_config.yaml (653 lines of code) (raw)
# Exporters. The single exporter defined here, awsemf/containerinsights, is the
# one referenced by service.pipelines.metrics/containerinsights.exporters.
exporters:
  awsemf/containerinsights:
    add_entity: true
    certificate_file_path: ""
    detailed_metrics: false
    dimension_rollup_option: NoDimensionRollup
    disable_metric_extraction: true
    eks_fargate_container_insights_enabled: false
    endpoint: https://fake_endpoint
    enhanced_container_insights: true
    imds_retries: 1
    local_mode: true
    # {ClusterName} and {NodeName} are left as literal placeholders in this
    # file; the stream name is quoted because it starts with `{`.
    log_group_name: /aws/containerinsights/{ClusterName}/performance
    log_retention: 0
    log_stream_name: '{NodeName}'
    max_retries: 2
    # Each declaration pairs `dimensions` (a list of dimension sets, i.e. a
    # list of lists) with the `metric_name_selectors` it applies to.
    metric_declarations:
      # Container-level metrics.
      - dimensions:
          - - ClusterName
          - - ClusterName
            - ContainerName
            - FullPodName
            - Namespace
            - PodName
          - - ClusterName
            - ContainerName
            - Namespace
            - PodName
        metric_name_selectors:
          - container_cpu_utilization
          - container_cpu_utilization_over_container_limit
          - container_cpu_limit
          - container_cpu_request
          - container_memory_utilization
          - container_memory_utilization_over_container_limit
          - container_memory_failures_total
          - container_memory_limit
          - container_memory_request
          - container_filesystem_usage
          - container_filesystem_available
          - container_filesystem_utilization
      # Pod utilization and network metrics.
      - dimensions:
          - - ClusterName
            - Namespace
            - PodName
          - - ClusterName
          - - ClusterName
            - Namespace
            - Service
          - - ClusterName
            - Namespace
          - - ClusterName
            - FullPodName
            - Namespace
            - PodName
        metric_name_selectors:
          - pod_cpu_utilization
          - pod_memory_utilization
          - pod_network_rx_bytes
          - pod_network_tx_bytes
          - pod_cpu_utilization_over_pod_limit
          - pod_memory_utilization_over_pod_limit
      # Pod network-interface drop counters.
      - dimensions:
          - - ClusterName
            - FullPodName
            - Namespace
            - PodName
          - - ClusterName
            - Namespace
            - PodName
          - - ClusterName
            - Namespace
          - - ClusterName
        metric_name_selectors:
          - pod_interface_network_rx_dropped
          - pod_interface_network_tx_dropped
      # Pod capacity, status and container-status metrics.
      - dimensions:
          - - ClusterName
            - Namespace
            - PodName
          - - ClusterName
          - - ClusterName
            - FullPodName
            - Namespace
            - PodName
          - - ClusterName
            - Namespace
            - Service
        metric_name_selectors:
          - pod_cpu_reserved_capacity
          - pod_memory_reserved_capacity
          - pod_number_of_container_restarts
          - pod_number_of_containers
          - pod_number_of_running_containers
          - pod_status_ready
          - pod_status_scheduled
          - pod_status_running
          - pod_status_pending
          - pod_status_failed
          - pod_status_unknown
          - pod_status_succeeded
          - pod_memory_request
          - pod_memory_limit
          - pod_cpu_limit
          - pod_cpu_request
          - pod_cpu_usage_total
          - pod_memory_working_set
          - pod_container_status_running
          - pod_container_status_terminated
          - pod_container_status_waiting
          - pod_container_status_waiting_reason_crash_loop_back_off
          - pod_container_status_waiting_reason_image_pull_error
          - pod_container_status_waiting_reason_start_error
          - pod_container_status_waiting_reason_create_container_error
          - pod_container_status_waiting_reason_create_container_config_error
          - pod_container_status_terminated_reason_oom_killed
      # Node utilization, capacity and status-condition metrics.
      - dimensions:
          - - ClusterName
            - InstanceId
            - NodeName
          - - ClusterName
        metric_name_selectors:
          - node_cpu_utilization
          - node_memory_utilization
          - node_network_total_bytes
          - node_cpu_reserved_capacity
          - node_memory_reserved_capacity
          - node_number_of_running_pods
          - node_number_of_running_containers
          - node_cpu_usage_total
          - node_cpu_limit
          - node_memory_working_set
          - node_memory_limit
          - node_status_condition_ready
          - node_status_condition_disk_pressure
          - node_status_condition_memory_pressure
          - node_status_condition_pid_pressure
          - node_status_condition_network_unavailable
          - node_status_condition_unknown
          - node_status_capacity_pods
          - node_status_allocatable_pods
      # Node interface/disk I/O counters and hyperpod node health status.
      - dimensions:
          - - ClusterName
            - InstanceId
            - NodeName
          - - ClusterName
        metric_name_selectors:
          - node_interface_network_rx_dropped
          - node_interface_network_tx_dropped
          - node_diskio_io_service_bytes_total
          - node_diskio_io_serviced_total
          - hyperpod_node_health_status_schedulable
          - hyperpod_node_health_status_unschedulable_pending_replacement
          - hyperpod_node_health_status_unschedulable_pending_reboot
          - hyperpod_node_health_status_unschedulable
      # Node filesystem metrics.
      - dimensions:
          - - ClusterName
            - InstanceId
            - NodeName
          - - ClusterName
        metric_name_selectors:
          - node_filesystem_utilization
          - node_filesystem_inodes
          - node_filesystem_inodes_free
      # Service-level metrics.
      - dimensions:
          - - ClusterName
            - Namespace
            - Service
          - - ClusterName
        metric_name_selectors:
          - service_number_of_running_pods
      # Replica counts.
      - dimensions:
          - - ClusterName
            - Namespace
            - PodName
          - - ClusterName
        metric_name_selectors:
          - replicas_desired
          - replicas_ready
          - status_replicas_available
          - status_replicas_unavailable
      # DaemonSet status.
      - dimensions:
          - - ClusterName
            - Namespace
            - PodName
          - - ClusterName
        metric_name_selectors:
          - daemonset_status_number_available
          - daemonset_status_number_unavailable
      # Namespace-level metrics.
      - dimensions:
          - - ClusterName
            - Namespace
          - - ClusterName
        metric_name_selectors:
          - namespace_number_of_running_pods
      # Cluster-level metrics.
      - dimensions:
          - - ClusterName
        metric_name_selectors:
          - cluster_node_count
          - cluster_failed_node_count
          - cluster_number_of_running_pods
      # API server / etcd / REST client metrics. The lowercase dimension
      # names below (endpoint, resource, verb, code, ...) are kept exactly
      # as written.
      - dimensions:
          - - ClusterName
            - endpoint
          - - ClusterName
        metric_name_selectors:
          - apiserver_storage_size_bytes
          - apiserver_storage_db_total_size_in_bytes
          - etcd_db_total_size_in_bytes
      - dimensions:
          - - ClusterName
            - resource
          - - ClusterName
        metric_name_selectors:
          - apiserver_storage_list_duration_seconds
          - apiserver_longrunning_requests
          - apiserver_storage_objects
      - dimensions:
          - - ClusterName
            - verb
          - - ClusterName
        metric_name_selectors:
          - apiserver_request_duration_seconds
          - rest_client_request_duration_seconds
      - dimensions:
          - - ClusterName
            - code
            - verb
          - - ClusterName
        metric_name_selectors:
          - apiserver_request_total
          - apiserver_request_total_5xx
      - dimensions:
          - - ClusterName
            - operation
          - - ClusterName
        metric_name_selectors:
          - apiserver_admission_controller_admission_duration_seconds
          - apiserver_admission_step_admission_duration_seconds
          - etcd_request_duration_seconds
      - dimensions:
          - - ClusterName
            - code
            - method
          - - ClusterName
        metric_name_selectors:
          - rest_client_requests_total
      - dimensions:
          - - ClusterName
            - request_kind
          - - ClusterName
        metric_name_selectors:
          - apiserver_current_inflight_requests
          - apiserver_current_inqueue_requests
      - dimensions:
          - - ClusterName
            - name
          - - ClusterName
        metric_name_selectors:
          - apiserver_admission_webhook_admission_duration_seconds
      - dimensions:
          - - ClusterName
            - group
          - - ClusterName
        metric_name_selectors:
          - apiserver_requested_deprecated_apis
      - dimensions:
          - - ClusterName
            - reason
          - - ClusterName
        metric_name_selectors:
          - apiserver_flowcontrol_rejected_requests_total
      - dimensions:
          - - ClusterName
            - priority_level
          - - ClusterName
        metric_name_selectors:
          - apiserver_flowcontrol_request_concurrency_limit
      # EBS disk I/O metrics; these names are the `new_name` targets of the
      # renames under processors.metricstransform/containerinsights.
      - dimensions:
          - - ClusterName
          - - ClusterName
            - InstanceId
            - NodeName
          - - ClusterName
            - InstanceId
            - NodeName
            - VolumeId
        metric_name_selectors:
          - node_diskio_ebs_total_read_ops
          - node_diskio_ebs_total_write_ops
          - node_diskio_ebs_total_read_bytes
          - node_diskio_ebs_total_write_bytes
          - node_diskio_ebs_total_read_time
          - node_diskio_ebs_total_write_time
          - node_diskio_ebs_volume_performance_exceeded_iops
          - node_diskio_ebs_volume_performance_exceeded_tp
          - node_diskio_ebs_ec2_instance_performance_exceeded_iops
          - node_diskio_ebs_ec2_instance_performance_exceeded_tp
          - node_diskio_ebs_volume_queue_length
    # Per-metric unit assignments; every entry sets `overwrite: true`.
    metric_descriptors:
      - metric_name: apiserver_admission_controller_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_admission_step_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_admission_webhook_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_current_inflight_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_current_inqueue_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_flowcontrol_rejected_requests_total
        overwrite: true
        unit: Count
      - metric_name: apiserver_flowcontrol_request_concurrency_limit
        overwrite: true
        unit: Count
      - metric_name: apiserver_longrunning_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_request_total
        overwrite: true
        unit: Count
      - metric_name: apiserver_request_total_5xx
        overwrite: true
        unit: Count
      - metric_name: apiserver_requested_deprecated_apis
        overwrite: true
        unit: Count
      - metric_name: apiserver_storage_objects
        overwrite: true
        unit: Count
      - metric_name: etcd_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_storage_list_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_storage_db_total_size_in_bytes
        overwrite: true
        unit: Bytes
      - metric_name: apiserver_storage_size_bytes
        overwrite: true
        unit: Bytes
      - metric_name: etcd_db_total_size_in_bytes
        overwrite: true
        unit: Bytes
      - metric_name: rest_client_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: rest_client_requests_total
        overwrite: true
        unit: Count
    # Names the agenthealth/logs extension defined under `extensions`.
    middleware: agenthealth/logs
    namespace: ContainerInsights
    no_verify_ssl: false
    num_workers: 8
    output_destination: cloudwatch
    parse_json_encoded_attr_values:
      - Sources
      - kubernetes
    profile: AmazonCloudWatchAgent
    proxy_address: ""
    region: us-east-1
    request_timeout_seconds: 30
    resource_arn: ""
    resource_to_telemetry_conversion:
      enabled: true
    retain_initial_value_of_delta_metric: false
    role_arn: ""
    # Placeholder path; note this key is a list here.
    shared_credentials_file:
      - fake-path
    # Quoted so the value stays the string "0" rather than an integer.
    version: "0"
# Extensions. All three are enabled in service.extensions.
extensions:
  # Referenced as `middleware` by the awsemf/containerinsights exporter.
  agenthealth/logs:
    is_usage_data_enabled: true
    stats:
      operations:
        - PutLogEvents
      usage_flags:
        mode: OP
        region_type: ACJ
  # Referenced as `middleware` by awscontainerinsightreceiver.
  agenthealth/statuscode:
    is_status_code_enabled: true
    is_usage_data_enabled: true
    stats:
      usage_flags:
        mode: OP
        region_type: ACJ
  entitystore:
    mode: onPremise
    profile: AmazonCloudWatchAgent
    region: us-east-1
    # Scalar, singular key name here; the exporter and receiver use the plural
    # `shared_credentials_file` with a list value.
    shared_credential_file: fake-path
# Processors. The order in which they run is set by
# service.pipelines.metrics/containerinsights.processors, not by their order here.
processors:
  awsentity/resource/containerinsights:
    entity_type: Resource
    platform: onPremise
  batch/containerinsights:
    metadata_cardinality_limit: 1000
    send_batch_max_size: 0
    send_batch_size: 8192
    timeout: 5s
  filter/containerinsights:
    error_mode: propagate
    logs: {}
    metrics:
      # Exact-name (strict) exclusion list of scrape bookkeeping metrics.
      exclude:
        match_type: strict
        metric_names:
          - up
          - scrape_duration_seconds
          - scrape_samples_scraped
          - scrape_series_added
          - scrape_samples_post_metric_relabeling
    spans: {}
    traces: {}
  metricstransform/containerinsights:
    transforms:
      # Produces apiserver_request_total_5xx from apiserver_request_total,
      # restricted to data points whose `code` label matches the regexp ^5.*
      - action: insert
        aggregation_type: ""
        experimental_match_labels:
          code: ^5.*
        include: apiserver_request_total
        match_type: regexp
        new_name: apiserver_request_total_5xx
        submatch_case: ""
      # The remaining transforms all follow one pattern: rename an
      # aws_ebs_csi_* metric to a node_diskio_ebs_* name and add the label
      # Type=NodeEBS. The new names match the EBS metric_name_selectors of
      # the awsemf/containerinsights exporter.
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_ops_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_ops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_ops_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_ops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_bytes_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_bytes
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_bytes_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_bytes
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_time
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_time
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_exceeded_iops_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_volume_performance_exceeded_iops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_exceeded_tp_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_volume_performance_exceeded_tp
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_ec2_exceeded_iops_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_ec2_instance_performance_exceeded_iops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_ec2_exceeded_tp_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_ec2_instance_performance_exceeded_tp
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_volume_queue_length
        match_type: ""
        new_name: node_diskio_ebs_volume_queue_length
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
# Receivers. awscontainerinsightreceiver is the only receiver and feeds the
# metrics/containerinsights pipeline declared under `service`.
receivers:
  awscontainerinsightreceiver:
    accelerated_compute_metrics: false
    add_container_name_metric_label: true
    add_full_pod_name_metric_label: true
    add_service_as_attribute: true
    certificate_file_path: ""
    cluster_name: TestCluster
    collection_interval: 30s
    # NOTE(review): the orchestrator is `eks` although the rest of this file
    # targets onPremise (entitystore.mode, awsentity platform) - confirm that
    # this is intended.
    container_orchestrator: eks
    enable_control_plane_metrics: true
    endpoint: ""
    host_ip: ""
    host_name: ""
    imds_retries: 1
    kube_config_path: ""
    leader_lock_name: cwagent-clusterleader
    leader_lock_using_config_map_only: true
    local_mode: true
    max_retries: 0
    # Names the agenthealth/statuscode extension defined under `extensions`.
    middleware: agenthealth/statuscode
    no_verify_ssl: false
    num_workers: 0
    prefer_full_pod_name: true
    profile: AmazonCloudWatchAgent
    proxy_address: ""
    region: us-east-1
    request_timeout_seconds: 0
    resource_arn: ""
    role_arn: ""
    # Placeholder path; list-valued, same as on the awsemf exporter.
    shared_credentials_file:
      - fake-path
# Service wiring: which extensions are enabled, how the single metrics
# pipeline is assembled, and the collector's own telemetry settings.
service:
  extensions:
    - agenthealth/logs
    - agenthealth/statuscode
    - entitystore
  pipelines:
    metrics/containerinsights:
      exporters:
        - awsemf/containerinsights
      # Listed order: batch, filter, awsentity, then metricstransform.
      processors:
        - batch/containerinsights
        - filter/containerinsights
        - awsentity/resource/containerinsights
        - metricstransform/containerinsights
      receivers:
        - awscontainerinsightreceiver
  telemetry:
    logs:
      development: false
      disable_caller: false
      disable_stacktrace: false
      encoding: console
      level: info
      sampling:
        enabled: true
        initial: 2
        thereafter: 500
        tick: 10s
    metrics:
      address: ""
      # `None` is a plain string here; YAML null would be spelled `null`.
      level: None
    traces:
      level: None