# translator/tocwconfig/sampleConfig/emf_and_kubernetes_config.yaml

# Pipeline configuration laid out in the OpenTelemetry Collector format
# (receivers / processors / exporters / extensions / service).
#
# Two pipelines are wired together under `service.pipelines`:
#   logs/emf_logs             tcplog + udplog -> batch -> awscloudwatchlogs
#   metrics/containerinsights awscontainerinsightreceiver -> batch, filter,
#                             awsentity, metricstransform -> awsemf
#
# Every component ID referenced by a pipeline is defined in the matching
# top-level section of this file.

# ---------------------------------------------------------------------------
# Exporters
# ---------------------------------------------------------------------------
exporters:
  # Used by the logs/emf_logs pipeline.
  awscloudwatchlogs/emf_logs:
    certificate_file_path: ""
    emf_only: true
    endpoint: https://fake_endpoint
    imds_retries: 2
    local_mode: true
    log_group_name: emf/logs/default
    log_retention: 0
    log_stream_name: host_name_from_env
    max_retries: 2
    middleware: agenthealth/logs
    no_verify_ssl: false
    num_workers: 8
    profile: default
    proxy_address: ""
    raw_log: true
    region: us-east-1
    request_timeout_seconds: 30
    resource_arn: ""
    retry_on_failure:
      enabled: true
      initial_interval: 5s
      max_elapsed_time: 5m0s
      max_interval: 30s
      multiplier: 1.5
      randomization_factor: 0.5
    role_arn: ""
    sending_queue:
      enabled: true
      num_consumers: 1
      queue_size: 1000
    shared_credentials_file:
      - /root/.aws/credentials

  # Used by the metrics/containerinsights pipeline.
  awsemf/containerinsights:
    add_entity: true
    certificate_file_path: ""
    detailed_metrics: false
    dimension_rollup_option: NoDimensionRollup
    disable_metric_extraction: true
    eks_fargate_container_insights_enabled: false
    endpoint: https://fake_endpoint
    enhanced_container_insights: true
    imds_retries: 2
    local_mode: true
    log_group_name: /aws/containerinsights/{ClusterName}/performance
    log_retention: 0
    log_stream_name: '{NodeName}'
    max_retries: 2
    # Each declaration pairs a list of dimension sets with the metric names
    # it applies to. Every inner list under `dimensions` is one dimension set.
    metric_declarations:
      # Container-level metrics.
      - dimensions:
          - [ClusterName]
          - [ClusterName, ContainerName, FullPodName, Namespace, PodName]
          - [ClusterName, ContainerName, Namespace, PodName]
        metric_name_selectors:
          - container_cpu_utilization
          - container_cpu_utilization_over_container_limit
          - container_cpu_limit
          - container_cpu_request
          - container_memory_utilization
          - container_memory_utilization_over_container_limit
          - container_memory_failures_total
          - container_memory_limit
          - container_memory_request
          - container_filesystem_usage
          - container_filesystem_available
          - container_filesystem_utilization
      # Pod-level metrics.
      - dimensions:
          - [ClusterName, Namespace, PodName]
          - [ClusterName]
          - [ClusterName, Namespace, Service]
          - [ClusterName, Namespace]
          - [ClusterName, FullPodName, Namespace, PodName]
        metric_name_selectors:
          - pod_cpu_utilization
          - pod_memory_utilization
          - pod_network_rx_bytes
          - pod_network_tx_bytes
          - pod_cpu_utilization_over_pod_limit
          - pod_memory_utilization_over_pod_limit
      - dimensions:
          - [ClusterName, FullPodName, Namespace, PodName]
          - [ClusterName, Namespace, PodName]
          - [ClusterName, Namespace]
          - [ClusterName]
        metric_name_selectors:
          - pod_interface_network_rx_dropped
          - pod_interface_network_tx_dropped
      - dimensions:
          - [ClusterName, Namespace, PodName]
          - [ClusterName]
          - [ClusterName, FullPodName, Namespace, PodName]
          - [ClusterName, Namespace, Service]
        metric_name_selectors:
          - pod_cpu_reserved_capacity
          - pod_memory_reserved_capacity
          - pod_number_of_container_restarts
          - pod_number_of_containers
          - pod_number_of_running_containers
          - pod_status_ready
          - pod_status_scheduled
          - pod_status_running
          - pod_status_pending
          - pod_status_failed
          - pod_status_unknown
          - pod_status_succeeded
          - pod_memory_request
          - pod_memory_limit
          - pod_cpu_limit
          - pod_cpu_request
          - pod_cpu_usage_total
          - pod_memory_working_set
          - pod_container_status_running
          - pod_container_status_terminated
          - pod_container_status_waiting
          - pod_container_status_waiting_reason_crash_loop_back_off
          - pod_container_status_waiting_reason_image_pull_error
          - pod_container_status_waiting_reason_start_error
          - pod_container_status_waiting_reason_create_container_error
          - pod_container_status_waiting_reason_create_container_config_error
          - pod_container_status_terminated_reason_oom_killed
      # Node-level metrics.
      - dimensions:
          - [ClusterName, InstanceId, NodeName]
          - [ClusterName]
        metric_name_selectors:
          - node_cpu_utilization
          - node_memory_utilization
          - node_network_total_bytes
          - node_cpu_reserved_capacity
          - node_memory_reserved_capacity
          - node_number_of_running_pods
          - node_number_of_running_containers
          - node_cpu_usage_total
          - node_cpu_limit
          - node_memory_working_set
          - node_memory_limit
          - node_status_condition_ready
          - node_status_condition_disk_pressure
          - node_status_condition_memory_pressure
          - node_status_condition_pid_pressure
          - node_status_condition_network_unavailable
          - node_status_condition_unknown
          - node_status_capacity_pods
          - node_status_allocatable_pods
      - dimensions:
          - [ClusterName, InstanceId, NodeName]
          - [ClusterName]
        metric_name_selectors:
          - node_interface_network_rx_dropped
          - node_interface_network_tx_dropped
          - node_diskio_io_service_bytes_total
          - node_diskio_io_serviced_total
          - hyperpod_node_health_status_schedulable
          - hyperpod_node_health_status_unschedulable_pending_replacement
          - hyperpod_node_health_status_unschedulable_pending_reboot
          - hyperpod_node_health_status_unschedulable
      - dimensions:
          - [ClusterName, InstanceId, NodeName]
          - [ClusterName]
        metric_name_selectors:
          - node_filesystem_utilization
          - node_filesystem_inodes
          - node_filesystem_inodes_free
      # Service, workload, namespace and cluster metrics.
      - dimensions:
          - [ClusterName, Namespace, Service]
          - [ClusterName]
        metric_name_selectors:
          - service_number_of_running_pods
      - dimensions:
          - [ClusterName, Namespace, PodName]
          - [ClusterName]
        metric_name_selectors:
          - replicas_desired
          - replicas_ready
          - status_replicas_available
          - status_replicas_unavailable
      - dimensions:
          - [ClusterName, Namespace, PodName]
          - [ClusterName]
        metric_name_selectors:
          - daemonset_status_number_available
          - daemonset_status_number_unavailable
      - dimensions:
          - [ClusterName, Namespace]
          - [ClusterName]
        metric_name_selectors:
          - namespace_number_of_running_pods
      - dimensions:
          - [ClusterName]
        metric_name_selectors:
          - cluster_node_count
          - cluster_failed_node_count
          - cluster_number_of_running_pods
      # API server / etcd / REST client metrics.
      - dimensions:
          - [ClusterName, endpoint]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_storage_size_bytes
          - apiserver_storage_db_total_size_in_bytes
          - etcd_db_total_size_in_bytes
      - dimensions:
          - [ClusterName, resource]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_storage_list_duration_seconds
          - apiserver_longrunning_requests
          - apiserver_storage_objects
      - dimensions:
          - [ClusterName, verb]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_request_duration_seconds
          - rest_client_request_duration_seconds
      - dimensions:
          - [ClusterName, code, verb]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_request_total
          - apiserver_request_total_5xx
      - dimensions:
          - [ClusterName, operation]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_admission_controller_admission_duration_seconds
          - apiserver_admission_step_admission_duration_seconds
          - etcd_request_duration_seconds
      - dimensions:
          - [ClusterName, code, method]
          - [ClusterName]
        metric_name_selectors:
          - rest_client_requests_total
      - dimensions:
          - [ClusterName, request_kind]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_current_inflight_requests
          - apiserver_current_inqueue_requests
      - dimensions:
          - [ClusterName, name]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_admission_webhook_admission_duration_seconds
      - dimensions:
          - [ClusterName, group]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_requested_deprecated_apis
      - dimensions:
          - [ClusterName, reason]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_flowcontrol_rejected_requests_total
      - dimensions:
          - [ClusterName, priority_level]
          - [ClusterName]
        metric_name_selectors:
          - apiserver_flowcontrol_request_concurrency_limit
      # EBS metrics; the names match the `new_name` values produced by
      # processors.metricstransform/containerinsights below.
      - dimensions:
          - [ClusterName]
          - [ClusterName, InstanceId, NodeName]
          - [ClusterName, InstanceId, NodeName, VolumeId]
        metric_name_selectors:
          - node_diskio_ebs_total_read_ops
          - node_diskio_ebs_total_write_ops
          - node_diskio_ebs_total_read_bytes
          - node_diskio_ebs_total_write_bytes
          - node_diskio_ebs_total_read_time
          - node_diskio_ebs_total_write_time
          - node_diskio_ebs_volume_performance_exceeded_iops
          - node_diskio_ebs_volume_performance_exceeded_tp
          - node_diskio_ebs_ec2_instance_performance_exceeded_iops
          - node_diskio_ebs_ec2_instance_performance_exceeded_tp
          - node_diskio_ebs_volume_queue_length
    # Unit assignments for the control-plane metrics declared above.
    metric_descriptors:
      - metric_name: apiserver_admission_controller_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_admission_step_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_admission_webhook_admission_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_current_inflight_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_current_inqueue_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_flowcontrol_rejected_requests_total
        overwrite: true
        unit: Count
      - metric_name: apiserver_flowcontrol_request_concurrency_limit
        overwrite: true
        unit: Count
      - metric_name: apiserver_longrunning_requests
        overwrite: true
        unit: Count
      - metric_name: apiserver_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_request_total
        overwrite: true
        unit: Count
      - metric_name: apiserver_request_total_5xx
        overwrite: true
        unit: Count
      - metric_name: apiserver_requested_deprecated_apis
        overwrite: true
        unit: Count
      - metric_name: apiserver_storage_objects
        overwrite: true
        unit: Count
      - metric_name: etcd_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_storage_list_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: apiserver_storage_db_total_size_in_bytes
        overwrite: true
        unit: Bytes
      - metric_name: apiserver_storage_size_bytes
        overwrite: true
        unit: Bytes
      - metric_name: etcd_db_total_size_in_bytes
        overwrite: true
        unit: Bytes
      - metric_name: rest_client_request_duration_seconds
        overwrite: true
        unit: Seconds
      - metric_name: rest_client_requests_total
        overwrite: true
        unit: Count
    middleware: agenthealth/logs
    namespace: ContainerInsights
    no_verify_ssl: false
    num_workers: 8
    output_destination: cloudwatch
    parse_json_encoded_attr_values:
      - Sources
      - kubernetes
    profile: default
    proxy_address: ""
    region: us-east-1
    request_timeout_seconds: 30
    resource_arn: ""
    resource_to_telemetry_conversion:
      enabled: true
    retain_initial_value_of_delta_metric: false
    role_arn: ""
    shared_credentials_file:
      - /root/.aws/credentials
    version: "0"

# ---------------------------------------------------------------------------
# Extensions (enabled in `service.extensions`; the agenthealth entries are
# also referenced through the `middleware` keys of exporters and receivers)
# ---------------------------------------------------------------------------
extensions:
  agenthealth/logs:
    is_usage_data_enabled: true
    stats:
      operations:
        - PutLogEvents
      usage_flags:
        mode: OP
        region_type: ACJ
  agenthealth/statuscode:
    is_status_code_enabled: true
    is_usage_data_enabled: true
    stats:
      usage_flags:
        mode: OP
        region_type: ACJ
  entitystore:
    mode: onPremise
    profile: default
    region: us-east-1
    shared_credential_file: /root/.aws/credentials

# ---------------------------------------------------------------------------
# Processors
# ---------------------------------------------------------------------------
processors:
  awsentity/resource/containerinsights:
    entity_type: Resource
    platform: onPremise
  batch/containerinsights:
    metadata_cardinality_limit: 1000
    send_batch_max_size: 0
    send_batch_size: 8192
    timeout: 5s
  batch/emf_logs:
    metadata_cardinality_limit: 1000
    send_batch_max_size: 0
    send_batch_size: 8192
    timeout: 5s
  # Excludes the listed metric names (strict name matching).
  filter/containerinsights:
    error_mode: propagate
    logs: {}
    metrics:
      exclude:
        match_type: strict
        metric_names:
          - up
          - scrape_duration_seconds
          - scrape_samples_scraped
          - scrape_series_added
          - scrape_samples_post_metric_relabeling
    spans: {}
    traces: {}
  metricstransform/containerinsights:
    transforms:
      # apiserver_request_total -> apiserver_request_total_5xx, restricted to
      # data whose `code` label matches ^5.*
      - action: insert
        aggregation_type: ""
        experimental_match_labels:
          code: ^5.*
        include: apiserver_request_total
        match_type: regexp
        new_name: apiserver_request_total_5xx
        submatch_case: ""
      # The remaining rules map aws_ebs_csi_* metrics to node_diskio_ebs_*
      # names and add the label Type=NodeEBS.
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_ops_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_ops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_ops_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_ops
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
        submatch_case: ""
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_bytes_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_bytes
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_bytes_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_bytes
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_read_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_total_read_time
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_write_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_total_write_time
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_exceeded_iops_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_volume_performance_exceeded_iops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_exceeded_tp_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_volume_performance_exceeded_tp
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_ec2_exceeded_iops_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_ec2_instance_performance_exceeded_iops
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_ec2_exceeded_tp_seconds_total
        match_type: ""
        new_name: node_diskio_ebs_ec2_instance_performance_exceeded_tp
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS
      - action: update
        aggregation_type: ""
        include: aws_ebs_csi_volume_queue_length
        match_type: ""
        new_name: node_diskio_ebs_volume_queue_length
        submatch_case: ""
        operations:
          - action: add_label
            aggregation_type: ""
            experimental_scale: 0
            label: ""
            label_value: ""
            new_label: Type
            new_value: NodeEBS

# ---------------------------------------------------------------------------
# Receivers
# ---------------------------------------------------------------------------
receivers:
  awscontainerinsightreceiver:
    accelerated_compute_metrics: false
    add_container_name_metric_label: true
    add_full_pod_name_metric_label: true
    add_service_as_attribute: true
    certificate_file_path: ""
    cluster_name: TestCluster
    collection_interval: 30s
    container_orchestrator: eks
    enable_control_plane_metrics: true
    endpoint: ""
    host_ip: ""
    host_name: ""
    imds_retries: 2
    kube_config_path: ""
    leader_lock_name: cwagent-clusterleader
    leader_lock_using_config_map_only: true
    local_mode: true
    max_retries: 0
    middleware: agenthealth/statuscode
    no_verify_ssl: false
    num_workers: 0
    prefer_full_pod_name: true
    profile: default
    proxy_address: ""
    region: us-east-1
    request_timeout_seconds: 0
    resource_arn: ""
    role_arn: ""
    shared_credentials_file:
      - /root/.aws/credentials
  # The TCP and UDP log receivers below both listen on 0.0.0.0:25888.
  tcplog/emf_logs:
    encoding: utf-8
    id: tcp_input
    listen_address: 0.0.0.0:25888
    operators: []
    retry_on_failure:
      enabled: false
      initial_interval: 0s
      max_elapsed_time: 0s
      max_interval: 0s
    type: tcp_input
  udplog/emf_logs:
    encoding: utf-8
    id: udp_input
    listen_address: 0.0.0.0:25888
    multiline:
      # NOTE(review): `.^` looks like a pattern that can never match -
      # confirm this is the intended way to disable line-end splitting.
      line_end_pattern: .^
      line_start_pattern: ""
      omit_pattern: false
    operators: []
    retry_on_failure:
      enabled: false
      initial_interval: 0s
      max_elapsed_time: 0s
      max_interval: 0s
    type: udp_input

# ---------------------------------------------------------------------------
# Service: enabled extensions, pipeline wiring, and telemetry settings
# ---------------------------------------------------------------------------
service:
  extensions:
    - agenthealth/logs
    - agenthealth/statuscode
    - entitystore
  pipelines:
    logs/emf_logs:
      exporters:
        - awscloudwatchlogs/emf_logs
      processors:
        - batch/emf_logs
      receivers:
        - tcplog/emf_logs
        - udplog/emf_logs
    metrics/containerinsights:
      exporters:
        - awsemf/containerinsights
      processors:
        - batch/containerinsights
        - filter/containerinsights
        - awsentity/resource/containerinsights
        - metricstransform/containerinsights
      receivers:
        - awscontainerinsightreceiver
  telemetry:
    logs:
      development: false
      disable_caller: false
      disable_stacktrace: false
      encoding: console
      level: info
      sampling:
        enabled: true
        initial: 2
        thereafter: 500
        tick: 10s
    metrics:
      address: ""
      level: None
    traces:
      level: None