This shows you the differences between two versions of the page.
| Both sides previous revision Previous revision Next revision | Previous revision | ||
|
мониторинг_кластера_kubernetes [2025/03/25 13:08] val |
мониторинг_кластера_kubernetes [2025/04/02 11:42] (current) val [Мониторинг кластера Kubernetes] |
||
|---|---|---|---|
| Line 7: | Line 7: | ||
| * [[https://selectel.ru/blog/tutorials/monitoring-in-k8s-with-prometheus/|selectel Мониторинг в K8s с помощью Prometheus]] | * [[https://selectel.ru/blog/tutorials/monitoring-in-k8s-with-prometheus/|selectel Мониторинг в K8s с помощью Prometheus]] | ||
| * [[https://www.groundcover.com/blog/kubernetes-observability|Kubernetes Observability Guide: Best Practices & Tools]] | * [[https://www.groundcover.com/blog/kubernetes-observability|Kubernetes Observability Guide: Best Practices & Tools]] | ||
| + | * [[https://sysdig.com/blog/how-to-monitor-kubelet/|How to Monitor the Kubelet]] | ||
| + | * [[https://valyala.medium.com/how-to-use-relabeling-in-prometheus-and-victoriametrics-8b90fc22c4b2|How to use relabeling in Prometheus and VictoriaMetrics]] | ||
| | | ||
| Line 21: | Line 23: | ||
| ===== Запись вебинара ===== | ===== Запись вебинара ===== | ||
| - | * Тэги: | + | * Тэги: Kubernetes, Monitoring, Observability, Metrics Server, VictoriaMetrics, Prometheus, Grafana |
| + | * https://youtu.be/qYKvsOFcpf4 | ||
| + | * https://rutube.ru/video/private/5bfc09467bd36c30276600e7b17b3bfc/ | ||
| ===== Методическая подготовка ===== | ===== Методическая подготовка ===== | ||
| Line 46: | Line 50: | ||
| ===== Шаг 2. Metrics Server ===== | ===== Шаг 2. Metrics Server ===== | ||
| - | * [[https://kubernetes-sigs.github.io/metrics-server/|Kubernetes Metrics Server]] | + | * [[Система Kubernetes#Metrics Server]] |
| - | * [[https://medium.com/@cloudspinx/fix-error-metrics-api-not-available-in-kubernetes-aa10766e1c2f|Fix “error: Metrics API not available” in Kubernetes]] | + | |
| - | <code> | ||
| - | kube1:~/metrics-server# curl -L https://github.com/kubernetes-sigs/metrics-server/releases/download/v0.7.2/components.yaml | tee metrics-server-components.yaml | ||
| - | |||
| - | kube1:~/metrics-server# cat metrics-server-components.yaml | ||
| - | </code><code> | ||
| - | ... | ||
| - | containers: | ||
| - | - args: | ||
| - | - --cert-dir=/tmp | ||
| - | - --kubelet-insecure-tls # add this | ||
| - | ... | ||
| - | </code><code> | ||
| - | kube1:~/metrics-server# kubectl apply -f metrics-server-components.yaml | ||
| - | |||
| - | kube1# kubectl get pods -A | grep metrics-server | ||
| - | |||
| - | kube1# kubectl top pod #-n kube-system | ||
| - | |||
| - | kube1# kubectl top pod -A --sort-by=memory | ||
| - | |||
| - | kube1# kubectl top node | ||
| - | </code> | ||
| ===== Шаг 3. VictoriaMetrics ===== | ===== Шаг 3. VictoriaMetrics ===== | ||
| Line 77: | Line 58: | ||
| - | ===== История ===== | + | ===== Вопросы ===== |
| - | ==== loki-stack ==== | ||
| - | * [[https://github.com/grafana/helm-charts/tree/main/charts/loki-stack|Deploy Loki and Promtail to your cluster]] | ||
| - | |||
| - | <code> | ||
| - | http://loki.loki-stack.svc.cluster.local:3100 | ||
| - | http://loki-prometheus-server.loki-stack.svc.cluster.local:80 | ||
| - | |||
| - | |||
| - | kube1:~/loki-stack# helm pull grafana/loki-stack | ||
| - | |||
| - | kube1:~/loki-stack# less loki-stack/charts/loki/values.yaml | ||
| - | |||
| - | persistence: | ||
| - | enabled: false | ||
| - | accessModes: | ||
| - | - ReadWriteOnce | ||
| - | size: 10Gi | ||
| - | |||
| - | |||
| - | kube1:~/loki-stack# cat values.yaml | ||
| - | loki: | ||
| - | persistence: | ||
| - | enabled: true | ||
| - | |||
| - | prometheus: | ||
| - | enabled: true | ||
| - | alertmanager: | ||
| - | config: | ||
| - | global: | ||
| - | smtp_smarthost: 'server.corp13.un:25' | ||
| - | smtp_from: 'alertmanager@corp13.un' | ||
| - | smtp_require_tls: false | ||
| - | |||
| - | templates: | ||
| - | - '/etc/alertmanager/*.tmpl' | ||
| - | |||
| - | route: | ||
| - | group_wait: 30s | ||
| - | group_interval: 5m | ||
| - | repeat_interval: 3h | ||
| - | receiver: team-X-mails | ||
| - | |||
| - | receivers: | ||
| - | - name: 'team-X-mails' | ||
| - | email_configs: | ||
| - | - to: 'student@corp13.un' | ||
| - | send_resolved: true | ||
| - | |||
| - | serverFiles: | ||
| - | alerting_rules.yml: | ||
| - | groups: | ||
| - | |||
| - | |||
| - | kube1:~/loki-stack# helm upgrade --install loki --namespace=loki-stack grafana/loki-stack --create-namespace -f values.yaml | ||
| - | |||
| - | ### helm delete loki --namespace=loki-stack | ||
| - | </code> | ||