# kubelet-servicemonitor.yaml
  1. apiVersion: monitoring.coreos.com/v1
  2. kind: ServiceMonitor
  3. metadata:
  4. labels:
  5. app.kubernetes.io/name: kubelet
  6. name: kubelet
  7. name: kubelet
  8. namespace: monitoring
  9. spec:
  10. endpoints:
  11. - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
  12. honorLabels: true
  13. interval: 30s
  14. metricRelabelings:
  15. - action: drop
  16. regex: kubelet_(pod_worker_latency_microseconds|pod_start_latency_microseconds|cgroup_manager_latency_microseconds|pod_worker_start_latency_microseconds|pleg_relist_latency_microseconds|pleg_relist_interval_microseconds|runtime_operations|runtime_operations_latency_microseconds|runtime_operations_errors|eviction_stats_age_microseconds|device_plugin_registration_count|device_plugin_alloc_latency_microseconds|network_plugin_operations_latency_microseconds)
  17. sourceLabels:
  18. - __name__
  19. - action: drop
  20. regex: scheduler_(e2e_scheduling_latency_microseconds|scheduling_algorithm_predicate_evaluation|scheduling_algorithm_priority_evaluation|scheduling_algorithm_preemption_evaluation|scheduling_algorithm_latency_microseconds|binding_latency_microseconds|scheduling_latency_seconds)
  21. sourceLabels:
  22. - __name__
  23. - action: drop
  24. regex: apiserver_(request_count|request_latencies|request_latencies_summary|dropped_requests|storage_data_key_generation_latencies_microseconds|storage_transformation_failures_total|storage_transformation_latencies_microseconds|proxy_tunnel_sync_latency_secs)
  25. sourceLabels:
  26. - __name__
  27. - action: drop
  28. regex: kubelet_docker_(operations|operations_latency_microseconds|operations_errors|operations_timeout)
  29. sourceLabels:
  30. - __name__
  31. - action: drop
  32. regex: reflector_(items_per_list|items_per_watch|list_duration_seconds|lists_total|short_watches_total|watch_duration_seconds|watches_total)
  33. sourceLabels:
  34. - __name__
  35. - action: drop
  36. regex: etcd_(helper_cache_hit_count|helper_cache_miss_count|helper_cache_entry_count|request_cache_get_latencies_summary|request_cache_add_latencies_summary|request_latencies_summary)
  37. sourceLabels:
  38. - __name__
  39. - action: drop
  40. regex: transformation_(transformation_latencies_microseconds|failures_total)
  41. sourceLabels:
  42. - __name__
  43. - action: drop
  44. regex: (admission_quota_controller_adds|crd_autoregistration_controller_work_duration|APIServiceOpenAPIAggregationControllerQueue1_adds|AvailableConditionController_retries|crd_openapi_controller_unfinished_work_seconds|APIServiceRegistrationController_retries|admission_quota_controller_longest_running_processor_microseconds|crdEstablishing_longest_running_processor_microseconds|crdEstablishing_unfinished_work_seconds|crd_openapi_controller_adds|crd_autoregistration_controller_retries|crd_finalizer_queue_latency|AvailableConditionController_work_duration|non_structural_schema_condition_controller_depth|crd_autoregistration_controller_unfinished_work_seconds|AvailableConditionController_adds|DiscoveryController_longest_running_processor_microseconds|autoregister_queue_latency|crd_autoregistration_controller_adds|non_structural_schema_condition_controller_work_duration|APIServiceRegistrationController_adds|crd_finalizer_work_duration|crd_naming_condition_controller_unfinished_work_seconds|crd_openapi_controller_longest_running_processor_microseconds|DiscoveryController_adds|crd_autoregistration_controller_longest_running_processor_microseconds|autoregister_unfinished_work_seconds|crd_naming_condition_controller_queue_latency|crd_naming_condition_controller_retries|non_structural_schema_condition_controller_queue_latency|crd_naming_condition_controller_depth|AvailableConditionController_longest_running_processor_microseconds|crdEstablishing_depth|crd_finalizer_longest_running_processor_microseconds|crd_naming_condition_controller_adds|APIServiceOpenAPIAggregationControllerQueue1_longest_running_processor_microseconds|DiscoveryController_queue_latency|DiscoveryController_unfinished_work_seconds|crd_openapi_controller_depth|APIServiceOpenAPIAggregationControllerQueue1_queue_latency|APIServiceOpenAPIAggregationControllerQueue1_unfinished_work_seconds|DiscoveryController_work_duration|autoregister_adds|crd_autoregistration_controller_queue_latency|crd_finalizer_retri
es|AvailableConditionController_unfinished_work_seconds|autoregister_longest_running_processor_microseconds|non_structural_schema_condition_controller_unfinished_work_seconds|APIServiceOpenAPIAggregationControllerQueue1_depth|AvailableConditionController_depth|DiscoveryController_retries|admission_quota_controller_depth|crdEstablishing_adds|APIServiceOpenAPIAggregationControllerQueue1_retries|crdEstablishing_queue_latency|non_structural_schema_condition_controller_longest_running_processor_microseconds|autoregister_work_duration|crd_openapi_controller_retries|APIServiceRegistrationController_work_duration|crdEstablishing_work_duration|crd_finalizer_adds|crd_finalizer_depth|crd_openapi_controller_queue_latency|APIServiceOpenAPIAggregationControllerQueue1_work_duration|APIServiceRegistrationController_queue_latency|crd_autoregistration_controller_depth|AvailableConditionController_queue_latency|admission_quota_controller_queue_latency|crd_naming_condition_controller_work_duration|crd_openapi_controller_work_duration|DiscoveryController_depth|crd_naming_condition_controller_longest_running_processor_microseconds|APIServiceRegistrationController_depth|APIServiceRegistrationController_longest_running_processor_microseconds|crd_finalizer_unfinished_work_seconds|crdEstablishing_retries|admission_quota_controller_unfinished_work_seconds|non_structural_schema_condition_controller_adds|APIServiceRegistrationController_unfinished_work_seconds|admission_quota_controller_work_duration|autoregister_depth|autoregister_retries|kubeproxy_sync_proxy_rules_latency_microseconds|rest_client_request_latency_seconds|non_structural_schema_condition_controller_retries)
  45. sourceLabels:
  46. - __name__
  47. port: https-metrics
  48. relabelings:
  49. - sourceLabels:
  50. - __metrics_path__
  51. targetLabel: metrics_path
  52. scheme: https
  53. tlsConfig:
  54. insecureSkipVerify: true
  55. - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
  56. honorLabels: true
  57. honorTimestamps: false
  58. interval: 30s
  59. metricRelabelings:
  60. - action: drop
  61. regex: container_(network_tcp_usage_total|network_udp_usage_total|tasks_state|cpu_load_average_10s)
  62. sourceLabels:
  63. - __name__
  64. path: /metrics/cadvisor
  65. port: https-metrics
  66. relabelings:
  67. - sourceLabels:
  68. - __metrics_path__
  69. targetLabel: metrics_path
  70. scheme: https
  71. tlsConfig:
  72. insecureSkipVerify: true
  73. - bearerTokenFile: /var/run/secrets/kubernetes.io/serviceaccount/token
  74. honorLabels: true
  75. interval: 30s
  76. path: /metrics/probes
  77. port: https-metrics
  78. relabelings:
  79. - sourceLabels:
  80. - __metrics_path__
  81. targetLabel: metrics_path
  82. scheme: https
  83. tlsConfig:
  84. insecureSkipVerify: true
  85. jobLabel: k8s-app
  86. namespaceSelector:
  87. matchNames:
  88. - kube-system
  89. selector:
  90. matchLabels:
  91. k8s-app: kubelet