default manifest

This commit is contained in:
2025-12-10 12:56:47 +01:00
parent 00cf9c6530
commit 53bef561c4

View File

@@ -2,53 +2,303 @@ apiVersion: v1
kind: ConfigMap kind: ConfigMap
metadata: metadata:
name: argocd-metrics-server-configmap name: argocd-metrics-server-configmap
namespace: argocd
data: data:
# Define metrics for Deployments config.json: |
extension.metrics.deployments: | {
- name: "CPU Usage" "prometheus": {
description: "CPU usage for the deployment" "applications": [
type: "graph" {
graphType: "area" "name": "default",
yAxisLabel: "CPU Cores" "default": true,
query: 'sum(rate(container_cpu_usage_seconds_total{namespace="{{.metadata.namespace}}", pod=~"{{.metadata.name}}-.*"}[5m])) by (pod)' "dashboards": [
{
- name: "Memory Usage" "groupKind": "pod",
description: "Memory usage for the deployment" "tabs": ["Golden Signal"],
type: "graph" "rows": [
graphType: "area" {
yAxisLabel: "Memory (MB)" "name": "pod",
query: 'sum(container_memory_working_set_bytes{namespace="{{.metadata.namespace}}", pod=~"{{.metadata.name}}-.*"}) by (pod) / 1024 / 1024' "title": "Pods",
"tab": "Golden Signal",
- name: "Network Received" "graphs": [
description: "Network bytes received" {
type: "graph" "name": "pod_cpu_line",
graphType: "line" "title": "CPU",
yAxisLabel: "Bytes/sec" "description": "",
query: 'sum(rate(container_network_receive_bytes_total{namespace="{{.metadata.namespace}}", pod=~"{{.metadata.name}}-.*"}[5m])) by (pod)' "graphType": "line",
"metricName": "pod",
# Define metrics for Pods "queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
extension.metrics.pods: | },
- name: "CPU Usage" {
description: "CPU usage for the pod" "name": "pod_cpu_pie",
type: "graph" "title": "CPU Avg",
graphType: "area" "description": "",
yAxisLabel: "CPU Cores" "graphType": "pie",
query: 'sum(rate(container_cpu_usage_seconds_total{namespace="{{.metadata.namespace}}", pod="{{.metadata.name}}"}[5m])) by (container)' "metricName": "pod",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
- name: "Memory Usage" },
description: "Memory usage for the pod" {
type: "graph" "name": "pod_memory_line",
graphType: "area" "title": "Memory",
yAxisLabel: "Memory (MB)" "description": "",
query: 'sum(container_memory_working_set_bytes{namespace="{{.metadata.namespace}}", pod="{{.metadata.name}}"}) by (container) / 1024 / 1024' "graphType": "line",
"metricName": "pod",
- name: "Container Restarts" "queryExpression": "sum(rate(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
description: "Number of container restarts" },
type: "graph" {
graphType: "line" "name": "pod_memory_pie",
yAxisLabel: "Restarts" "title": "Mem Avg",
query: 'kube_pod_container_status_restarts_total{namespace="{{.metadata.namespace}}", pod="{{.metadata.name}}"}' "description": "",
"graphType": "pie",
# Prometheus connection settings "metricName": "pod",
prometheus.url: "http://prometheus-kube-prometheus-prometheus.monitoring.svc:9090" "queryExpression": "sum(rate(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
}
]
},
{
"name": "container",
"title": "Containers",
"tab": "Golden Signal",
"graphs": [
{
"name": "container_cpu_line",
"title": "CPU",
"description": "",
"graphType": "line",
"metricName": "container",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}[5m])) by (container)"
},
{
"name": "container_cpu_pie",
"title": "CPU Avg",
"description": "",
"graphType": "pie",
"metricName": "container",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", image!=\"\",container!=\"POD\", container!=\"\", container_name!=\"POD\"}[5m])) by (container)"
},
{
"name": "container_memory_line",
"title": "Memory",
"description": "",
"graphType": "line",
"metricName": "container",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}) by (container)"
},
{
"name": "container_memory_pie",
"title": "Mem Avg",
"description": "",
"graphType": "pie",
"metricName": "container",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}) by (container)"
}
]
}
]
},
{
"groupKind": "deployment",
"tabs": ["Golden Signal"],
"rows": [
{
"name": "httplatency",
"title": "HTTP Latency",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_200_latency",
"title": "Latency",
"description": "",
"graphType": "line",
"metricName": "pod_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_sum {namespace=\"{{.namespace}}\", status=\"200\"} [1m])) by (pod_template_hash)"
}
]
},
{
"name": "httperrortate",
"title": "HTTP Error Rate",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_error_rate_500",
"title": "HTTP Error 500",
"description": "",
"graphType": "line",
"metricName": "pod_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\", status=\"500\"} [1m])) by (pod_template_hash)"
},
{
"name": "http_error_rate_400",
"title": "HTTP Error 404",
"description": "",
"graphType": "line",
"metricName": "pod_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\", status=\"404\"} [1m])) by (pod_template_hash)"
}
]
},
{
"name": "httptraffic",
"title": "HTTP Traffic",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_traffic",
"title": "Traffic",
"description": "",
"graphType": "line",
"metricName": "pod_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\"} [1m])) by (pod_template_hash)"
}
]
},
{
"name": "pod",
"title": "Pods",
"tab": "Golden Signal",
"graphs": [
{
"name": "pod_cpu_line",
"title": "CPU",
"description": "",
"graphType": "line",
"metricName": "pod",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
},
{
"name": "pod_cpu_pie",
"title": "CPU Avg",
"description": "",
"graphType": "pie",
"metricName": "pod",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
},
{
"name": "pod_memory_line",
"title": "Memory",
"description": "",
"graphType": "line",
"metricName": "pod",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}) by (pod)"
},
{
"name": "pod_memory_pie",
"title": "Mem Avg",
"description": "",
"graphType": "pie",
"metricName": "pod",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}) by (pod)"
}
]
}
]
},
{
"groupKind": "rollout",
"tabs": ["Golden Signal"],
"rows": [
{
"name": "httplatency",
"title": "HTTP Latency",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_200_latency",
"title": "Latency",
"description": "",
"graphType": "line",
"metricName": "rollout_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_sum {namespace=\"{{.namespace}}\", status=\"200\"} [1m])) by (rollout_template_hash)"
}
]
},
{
"name": "httperrortate",
"title": "HTTP Error Rate",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_error_rate_500",
"title": "HTTP Error 500",
"description": "",
"graphType": "line",
"metricName": "rollout_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\", status=\"500\"} [1m])) by (rollout_template_hash)"
},
{
"name": "http_error_rate_400",
"title": "HTTP Error 404",
"description": "",
"graphType": "line",
"metricName": "rollout_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\", status=\"404\"} [1m])) by (rollout_template_hash)"
}
]
},
{
"name": "httptraffic",
"title": "HTTP Traffic",
"tab": "Golden Signal",
"graphs": [
{
"name": "http_traffic",
"title": "Traffic",
"description": "",
"graphType": "line",
"metricName": "rollout_template_hash",
"queryExpression": "sum(rate(http_server_requests_seconds_count {namespace=\"{{.namespace}}\"} [1m])) by (rollout_template_hash)"
}
]
},
{
"name": "pod",
"title": "Pods",
"tab": "Golden Signal",
"graphs": [
{
"name": "pod_cpu_line",
"title": "CPU",
"description": "",
"graphType": "line",
"metricName": "pod",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", image!=\"\", container!=\"POD\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
},
{
"name": "pod_cpu_pie",
"title": "CPU Avg",
"description": "",
"graphType": "pie",
"metricName": "pod",
"queryExpression": "sum(rate(container_cpu_usage_seconds_total{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}[5m])) by (pod)"
},
{
"name": "pod_memory_line",
"title": "Memory",
"description": "",
"graphType": "line",
"metricName": "pod",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}) by (pod)"
},
{
"name": "pod_memory_pie",
"title": "Mem Avg",
"description": "",
"graphType": "pie",
"metricName": "pod",
"queryExpression": "sum(container_memory_usage_bytes{pod=~\"{{.name}}\", container!=\"POD\", image!=\"\", container!=\"\", container_name!=\"POD\"}) by (pod)"
}
]
}
]
}
]
}
],
"provider":
{
"Name": "default",
"default": true,
"address": "http://prometheus-operated.monitoring.svc.cluster.local:9090"
}
}
}