metadata.yaml 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497
  1. type: k8s_cluster
  2. status:
  3. class: receiver
  4. stability:
  5. beta: [metrics]
  6. development: [logs]
  7. distributions: [contrib, splunk, observiq, sumo]
  8. codeowners:
  9. active: [dmitryax, TylerHelmuth, povilasv]
  10. sem_conv_version: 1.18.0
  11. resource_attributes:
  12. k8s.namespace.uid:
  13. description: The k8s namespace uid.
  14. type: string
  15. enabled: true
  16. k8s.namespace.name:
  17. description: The k8s namespace name.
  18. type: string
  19. enabled: true
  20. k8s.node.uid:
  21. description: The k8s node uid.
  22. type: string
  23. enabled: true
  24. k8s.node.name:
  25. description: The k8s node name.
  26. type: string
  27. enabled: true
  28. container.id:
  29. description: The container id.
  30. type: string
  31. enabled: true
  32. container.image.name:
  33. description: The container image name
  34. type: string
  35. enabled: true
  36. container.image.tag:
  37. description: The container image tag
  38. type: string
  39. enabled: true
  40. k8s.container.name:
  41. description: The k8s container name
  42. type: string
  43. enabled: true
  44. k8s.pod.name:
  45. description: The k8s pod name.
  46. type: string
  47. enabled: true
  48. k8s.pod.uid:
  49. description: The k8s pod uid.
  50. type: string
  51. enabled: true
  52. k8s.pod.qos_class:
  53. description: "The k8s pod qos class name. One of Guaranteed, Burstable, BestEffort."
  54. type: string
  55. enabled: false
  56. k8s.replicaset.name:
  57. description: The k8s replicaset name
  58. type: string
  59. enabled: true
  60. k8s.replicaset.uid:
  61. description: The k8s replicaset uid
  62. type: string
  63. enabled: true
  64. k8s.replicationcontroller.name:
  65. description: The k8s replicationcontroller name.
  66. type: string
  67. enabled: true
  68. k8s.replicationcontroller.uid:
  69. description: The k8s replicationcontroller uid.
  70. type: string
  71. enabled: true
  72. k8s.resourcequota.uid:
  73. description: The k8s resourcequota uid.
  74. type: string
  75. enabled: true
  76. k8s.resourcequota.name:
  77. description: The k8s resourcequota name.
  78. type: string
  79. enabled: true
  80. k8s.statefulset.uid:
  81. description: The k8s statefulset uid.
  82. type: string
  83. enabled: true
  84. k8s.statefulset.name:
  85. description: The k8s statefulset name.
  86. type: string
  87. enabled: true
  88. k8s.deployment.uid:
  89. description: The UID of the Deployment.
  90. type: string
  91. enabled: true
  92. k8s.deployment.name:
  93. description: The name of the Deployment.
  94. type: string
  95. enabled: true
  96. k8s.cronjob.uid:
  97. description: The k8s CronJob uid.
  98. type: string
  99. enabled: true
  100. k8s.cronjob.name:
  101. description: The k8s CronJob name
  102. type: string
  103. enabled: true
  104. k8s.daemonset.name:
  105. description: The k8s daemonset name.
  106. type: string
  107. enabled: true
  108. k8s.daemonset.uid:
  109. description: The k8s daemonset uid.
  110. type: string
  111. enabled: true
  112. k8s.hpa.uid:
  113. description: The k8s hpa uid.
  114. type: string
  115. enabled: true
  116. k8s.hpa.name:
  117. description: The k8s hpa name.
  118. type: string
  119. enabled: true
  120. k8s.job.name:
  121. description: The k8s job name.
  122. type: string
  123. enabled: true
  124. k8s.job.uid:
  125. description: The k8s job uid.
  126. type: string
  127. enabled: true
  128. k8s.kubelet.version:
  129. description: The version of Kubelet running on the node.
  130. type: string
  131. enabled: false
  132. k8s.kubeproxy.version:
  133. description: The version of Kube Proxy running on the node.
  134. type: string
  135. enabled: false
  136. openshift.clusterquota.uid:
  137. description: The OpenShift ClusterResourceQuota uid.
  138. type: string
  139. enabled: true
  140. openshift.clusterquota.name:
  141. description: The OpenShift ClusterResourceQuota name.
  142. type: string
  143. enabled: true
  144. attributes:
  145. k8s.namespace.name:
  146. description: The k8s namespace name.
  147. type: string
  148. enabled: true
  149. resource:
  150. description: the name of the resource on which the quota is applied
  151. type: string
  152. enabled: true
  153. condition:
  154. description: "The name of a Kubernetes Node condition. Example: Ready, MemoryPressure, PIDPressure, DiskPressure"
  155. type: string
  156. enabled: true
  157. metrics:
  158. k8s.container.cpu_request:
  159. enabled: true
  160. description: Resource requested for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  161. unit: "{cpu}"
  162. gauge:
  163. value_type: double
  164. k8s.container.cpu_limit:
  165. enabled: true
  166. description: Maximum resource limit set for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  167. unit: "{cpu}"
  168. gauge:
  169. value_type: double
  170. k8s.container.memory_request:
  171. enabled: true
  172. description: Resource requested for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  173. unit: "By"
  174. gauge:
  175. value_type: int
  176. k8s.container.memory_limit:
  177. enabled: true
  178. description: Maximum resource limit set for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  179. unit: "By"
  180. gauge:
  181. value_type: int
  182. k8s.container.storage_request:
  183. enabled: true
  184. description: Resource requested for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  185. unit: "By"
  186. gauge:
  187. value_type: int
  188. k8s.container.storage_limit:
  189. enabled: true
  190. description: Maximum resource limit set for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  191. unit: "By"
  192. gauge:
  193. value_type: int
  194. k8s.container.ephemeralstorage_request:
  195. enabled: true
  196. description: Resource requested for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  197. unit: "By"
  198. gauge:
  199. value_type: int
  200. k8s.container.ephemeralstorage_limit:
  201. enabled: true
  202. description: Maximum resource limit set for the container. See https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#resourcerequirements-v1-core for details
  203. unit: "By"
  204. gauge:
  205. value_type: int
  206. k8s.container.restarts:
  207. enabled: true
  208. description: How many times the container has restarted in the recent past. This value is pulled directly from the K8s API and the value can go indefinitely high and be reset to 0 at any time depending on how your kubelet is configured to prune dead containers. It is best to not depend too much on the exact value but rather look at it as either == 0, in which case you can conclude there were no restarts in the recent past, or > 0, in which case you can conclude there were restarts in the recent past, and not try and analyze the value beyond that.
  209. unit: "{restart}"
  210. gauge:
  211. value_type: int
  212. k8s.container.ready:
  213. enabled: true
  214. description: Whether a container has passed its readiness probe (0 for no, 1 for yes)
  215. unit: ""
  216. gauge:
  217. value_type: int
  218. k8s.pod.phase:
  219. enabled: true
  220. description: Current phase of the pod (1 - Pending, 2 - Running, 3 - Succeeded, 4 - Failed, 5 - Unknown)
  221. unit: ""
  222. gauge:
  223. value_type: int
  224. k8s.pod.status_reason:
  225. enabled: false
  226. description: Current status reason of the pod (1 - Evicted, 2 - NodeAffinity, 3 - NodeLost, 4 - Shutdown, 5 - UnexpectedAdmissionError, 6 - Unknown)
  227. unit: ""
  228. gauge:
  229. value_type: int
  230. k8s.deployment.desired:
  231. enabled: true
  232. description: Number of desired pods in this deployment
  233. unit: "{pod}"
  234. gauge:
  235. value_type: int
  236. k8s.deployment.available:
  237. enabled: true
  238. description: Total number of available pods (ready for at least minReadySeconds) targeted by this deployment
  239. unit: "{pod}"
  240. gauge:
  241. value_type: int
  242. k8s.cronjob.active_jobs:
  243. enabled: true
  244. description: The number of actively running jobs for a cronjob
  245. unit: "{job}"
  246. gauge:
  247. value_type: int
  248. k8s.daemonset.current_scheduled_nodes:
  249. enabled: true
  250. description: Number of nodes that are running at least 1 daemon pod and are supposed to run the daemon pod
  251. unit: "{node}"
  252. gauge:
  253. value_type: int
  254. k8s.daemonset.desired_scheduled_nodes:
  255. enabled: true
  256. description: Number of nodes that should be running the daemon pod (including nodes currently running the daemon pod)
  257. unit: "{node}"
  258. gauge:
  259. value_type: int
  260. k8s.daemonset.misscheduled_nodes:
  261. enabled: true
  262. description: Number of nodes that are running the daemon pod, but are not supposed to run the daemon pod
  263. unit: "{node}"
  264. gauge:
  265. value_type: int
  266. k8s.daemonset.ready_nodes:
  267. enabled: true
  268. description: Number of nodes that should be running the daemon pod and have one or more of the daemon pod running and ready
  269. unit: "{node}"
  270. gauge:
  271. value_type: int
  272. k8s.hpa.max_replicas:
  273. enabled: true
  274. description: Maximum number of replicas to which the autoscaler can scale up.
  275. unit: "{pod}"
  276. gauge:
  277. value_type: int
  278. k8s.hpa.min_replicas:
  279. enabled: true
  280. description: Minimum number of replicas to which the autoscaler can scale down.
  281. unit: "{pod}"
  282. gauge:
  283. value_type: int
  284. k8s.hpa.current_replicas:
  285. enabled: true
  286. description: Current number of pod replicas managed by this autoscaler.
  287. unit: "{pod}"
  288. gauge:
  289. value_type: int
  290. k8s.hpa.desired_replicas:
  291. enabled: true
  292. description: Desired number of pod replicas managed by this autoscaler.
  293. unit: "{pod}"
  294. gauge:
  295. value_type: int
  296. k8s.job.active_pods:
  297. enabled: true
  298. description: The number of actively running pods for a job
  299. unit: "{pod}"
  300. gauge:
  301. value_type: int
  302. k8s.job.desired_successful_pods:
  303. enabled: true
  304. description: The desired number of successfully finished pods the job should be run with
  305. unit: "{pod}"
  306. gauge:
  307. value_type: int
  308. k8s.job.failed_pods:
  309. enabled: true
  310. description: The number of pods which reached phase Failed for a job
  311. unit: "{pod}"
  312. gauge:
  313. value_type: int
  314. k8s.job.max_parallel_pods:
  315. enabled: true
  316. description: The max desired number of pods the job should run at any given time
  317. unit: "{pod}"
  318. gauge:
  319. value_type: int
  320. k8s.job.successful_pods:
  321. enabled: true
  322. description: The number of pods which reached phase Succeeded for a job
  323. unit: "{pod}"
  324. gauge:
  325. value_type: int
  326. k8s.namespace.phase:
  327. enabled: true
  328. description: The current phase of namespaces (1 for active and 0 for terminating)
  329. unit: ""
  330. gauge:
  331. value_type: int
  332. k8s.replicaset.desired:
  333. enabled: true
  334. description: Number of desired pods in this replicaset
  335. unit: "{pod}"
  336. gauge:
  337. value_type: int
  338. k8s.replicaset.available:
  339. enabled: true
  340. description: Total number of available pods (ready for at least minReadySeconds) targeted by this replicaset
  341. unit: "{pod}"
  342. gauge:
  343. value_type: int
  344. k8s.replication_controller.desired:
  345. enabled: true
  346. description: Number of desired pods in this replication_controller
  347. unit: "{pod}"
  348. gauge:
  349. value_type: int
  350. k8s.replication_controller.available:
  351. enabled: true
  352. description: Total number of available pods (ready for at least minReadySeconds) targeted by this replication_controller
  353. unit: "{pod}"
  354. gauge:
  355. value_type: int
  356. k8s.resource_quota.hard_limit:
  357. enabled: true
  358. description: The upper limit for a particular resource in a specific namespace. Will only be sent if a quota is specified. CPU requests/limits will be sent as millicores
  359. unit: "{resource}"
  360. gauge:
  361. value_type: int
  362. attributes:
  363. - resource
  364. k8s.resource_quota.used:
  365. enabled: true
  366. description: The usage for a particular resource in a specific namespace. Will only be sent if a quota is specified. CPU requests/limits will be sent as millicores
  367. unit: "{resource}"
  368. gauge:
  369. value_type: int
  370. attributes:
  371. - resource
  372. k8s.statefulset.desired_pods:
  373. enabled: true
  374. description: Number of desired pods in the stateful set (the `spec.replicas` field)
  375. unit: "{pod}"
  376. gauge:
  377. value_type: int
  378. k8s.statefulset.ready_pods:
  379. enabled: true
  380. description: Number of pods created by the stateful set that have the `Ready` condition
  381. unit: "{pod}"
  382. gauge:
  383. value_type: int
  384. k8s.statefulset.current_pods:
  385. enabled: true
  386. description: The number of pods created by the StatefulSet controller from the StatefulSet version indicated by currentRevision
  387. unit: "{pod}"
  388. gauge:
  389. value_type: int
  390. k8s.statefulset.updated_pods:
  391. enabled: true
  392. description: Number of pods created by the StatefulSet controller from the StatefulSet version indicated by updateRevision
  393. unit: "{pod}"
  394. gauge:
  395. value_type: int
  396. openshift.clusterquota.limit:
  397. enabled: true
  398. description: The configured upper limit for a particular resource.
  399. unit: "{resource}"
  400. gauge:
  401. value_type: int
  402. attributes:
  403. - resource
  404. openshift.clusterquota.used:
  405. enabled: true
  406. description: The usage for a particular resource with a configured limit.
  407. unit: "{resource}"
  408. gauge:
  409. value_type: int
  410. attributes:
  411. - resource
  412. openshift.appliedclusterquota.limit:
  413. enabled: true
  414. description: The upper limit for a particular resource in a specific namespace.
  415. unit: "{resource}"
  416. gauge:
  417. value_type: int
  418. attributes:
  419. - k8s.namespace.name
  420. - resource
  421. openshift.appliedclusterquota.used:
  422. enabled: true
  423. description: The usage for a particular resource in a specific namespace.
  424. unit: "{resource}"
  425. gauge:
  426. value_type: int
  427. attributes:
  428. - k8s.namespace.name
  429. - resource
  430. k8s.node.condition:
  431. enabled: false
  432. description: The condition of a particular Node.
  433. unit: "{condition}"
  434. gauge:
  435. value_type: int
  436. attributes:
  437. - condition
  438. # k8s.node.condition_* metrics (k8s.node.condition_ready, k8s.node.condition_memory_pressure, etc) are controlled
  439. # by node_conditions_to_report config option. By default, only k8s.node.condition_ready is enabled.
  440. # k8s.node.allocatable_* metrics (k8s.node.allocatable_cpu, k8s.node.allocatable_memory, etc) are controlled
  441. # by allocatable_types_to_report config option. By default, none of them are reported.