From 77bbf200321df605600cbc3e6599b5edaa17b016 Mon Sep 17 00:00:00 2001
From: Seth Call
Date: Thu, 8 Jan 2026 04:39:03 -0600
Subject: [PATCH] prepare for production

---
# Reviewer notes (free text after the "---" separator; not part of the
# commit message and not part of any hunk).
#
# What this patch changes:
#   * k8s/monitoring/templates/node-alerts.yaml - the NodeHighCPU `expr`
#     goes from one comparison (`> 1` over every mode="idle" series) to two
#     comparisons joined with `or`: series with workload="media" use `> 65`,
#     series with workload!="media" use `> 80`. The alert description no
#     longer names a number ("above 1%" becomes "above threshold").
#   * k8s/webrtc-be/values-production.yaml - webrtc_tag 1.0.139 -> 1.0.157.
#   * terraform/lke.tf - the pool under the "# Coturn pool" comment in
#     linode_lke_cluster "prd-video-cluster" changes type from
#     g6-standard-2 to g6-standard-4; count (3) and the workload = "media"
#     label are untouched context.
#
# NOTE(review): the new expr filters node_cpu_seconds_total on a `workload`
# label. Nothing in this patch attaches that label to the metric - confirm
# that scrape/relabel config copies it from the node. If the label is
# missing, workload!="media" matches every series and only the `> 80`
# branch can ever fire.
# NOTE(review): leading whitespace inside the hunks below follows
# conventional 2-space nesting - confirm it matches the target files
# (or apply with --ignore-whitespace).

 k8s/monitoring/templates/node-alerts.yaml | 11 +++++++++--
 k8s/webrtc-be/values-production.yaml      |  2 +-
 terraform/lke.tf                          |  2 +-
 3 files changed, 11 insertions(+), 4 deletions(-)

diff --git a/k8s/monitoring/templates/node-alerts.yaml b/k8s/monitoring/templates/node-alerts.yaml
index 09ad5ea..43ad817 100644
--- a/k8s/monitoring/templates/node-alerts.yaml
+++ b/k8s/monitoring/templates/node-alerts.yaml
@@ -10,10 +10,17 @@ spec:
     - name: node.alerts
       rules:
         - alert: NodeHighCPU
-          expr: (1 - avg without (cpu, mode) (rate(node_cpu_seconds_total{mode="idle"}[1m]))) * 100 > 1
+          expr: |
+            (
+              (1 - avg without (cpu, mode) (rate(node_cpu_seconds_total{mode="idle", workload="media"}[1m]))) * 100 > 65
+            )
+            or
+            (
+              (1 - avg without (cpu, mode) (rate(node_cpu_seconds_total{mode="idle", workload!="media"}[1m]))) * 100 > 80
+            )
           for: 1m
           labels:
             severity: warning
           annotations:
             summary: "High CPU usage on node {{ "{{" }} $labels.instance {{ "}}" }}"
-            description: "Node {{ "{{" }} $labels.instance {{ "}}" }} has CPU usage above 1% (current value: {{ "{{" }} $value | printf \"%.2f\" {{ "}}" }}%)"
+            description: "Node {{ "{{" }} $labels.instance {{ "}}" }} has CPU usage above threshold (current value: {{ "{{" }} $value | printf \"%.2f\" {{ "}}" }}%)"
diff --git a/k8s/webrtc-be/values-production.yaml b/k8s/webrtc-be/values-production.yaml
index 71c322d..7fe8c24 100644
--- a/k8s/webrtc-be/values-production.yaml
+++ b/k8s/webrtc-be/values-production.yaml
@@ -6,7 +6,7 @@ grafana:
   backendUrl: "https://www.jamkazam.com"
   auth: true
 # Webrtc_be image version
-webrtc_tag: 1.0.139
+webrtc_tag: 1.0.157
 unused_tag: 1.0.0
 enableDieEndpoint: false
 mediasoup:
diff --git a/terraform/lke.tf b/terraform/lke.tf
index 75408ce..b0f12f3 100644
--- a/terraform/lke.tf
+++ b/terraform/lke.tf
@@ -71,7 +71,7 @@ resource "linode_lke_cluster" "prd-video-cluster" {
   }
   # Coturn pool
   pool {
-    type = "g6-standard-2"
+    type = "g6-standard-4"
     count = 3
     labels = {
       workload = "media"