about summary refs log tree commit diff
diff options
context:
space:
mode:
authorFlorian Klink <flokli@flokli.de>2024-11-19T15·17+0200
committerflokli <flokli@flokli.de>2024-11-23T09·40+0000
commit6f1d059c7daed0dbd53d2f17734262cd17d8a37d (patch)
treeebab16b86bd0d5f89342bf7f3defa85062b795a5
parent52a8e47ac1330fc65a976c2bb8156d4bc31aa265 (diff)
feat(users/flokli/nixos/nixos-tvix-cache): collect metrics r/8950
This enables routing of metrics to an instance of VictoriaMetrics, and
configures opentelemetry-collector to route metrics there.

Change-Id: If765191a4cc70ddcaad821d45132b96a10a12148
Reviewed-on: https://cl.tvl.fyi/c/depot/+/12812
Reviewed-by: flokli <flokli@flokli.de>
Tested-by: BuildkiteCI
Reviewed-by: Jonas Chevalier <zimbatm@zimbatm.com>
-rw-r--r--users/flokli/nixos/nixos-tvix-cache/monitoring.nix118
1 files changed, 61 insertions, 57 deletions
diff --git a/users/flokli/nixos/nixos-tvix-cache/monitoring.nix b/users/flokli/nixos/nixos-tvix-cache/monitoring.nix
index 699d74cefc06..32cb7ddc0e11 100644
--- a/users/flokli/nixos/nixos-tvix-cache/monitoring.nix
+++ b/users/flokli/nixos/nixos-tvix-cache/monitoring.nix
@@ -1,4 +1,4 @@
-{ config, ... }:
+{ config, pkgs, ... }:
 let
   domain = config.machine.domain;
 in
@@ -18,12 +18,13 @@ in
         grpc_server_max_send_msg_size = 67108864;
         log_level = "warn";
       };
-      distributor.receivers = {
-        otlp.protocols = {
-          grpc = { }; # *:4317
-          http = { }; # *:4318
-        };
+
+      # move the otlp listener to another port than 4317, and disable the 4318 one.
+      # opentelemetry-connector binds on both 4317 and 4318.
+      distributor.receivers.otlp.protocols = {
+        grpc.endpoint = "127.0.0.1:4319";
       };
+
       storage.trace = {
         backend = "local";
         wal.path = "/var/lib/tempo/wal";
@@ -33,55 +34,51 @@ in
     };
   };
 
-  # No need, tempo collects the traces directly.
-  #
-  # services.opentelemetry-collector = {
-  #   enable = true;
-
-  #   settings = {
-  #     receivers = {
-  #       otlp.protocols.grpc.endpoint = "127.0.0.1:4317";
-  #       otlp.protocols.http.endpoint = "127.0.0.1:4318";
-  #     };
-
-  #     processors = {
-  #       batch = { };
-  #     };
-
-  #     exporters = {
-  #       otlp = {
-  #         endpoint = "127.0.0.1:9080"; # Tempo
-  #       };
-  #     };
-
-  #     extensions = {
-  #       zpages = { };
-  #     };
-
-  #     service = {
-  #       extensions = [
-  #         "zpages"
-  #       ];
-  #       pipelines = {
-  #         traces = {
-  #           receivers = [ "otlp" ];
-  #           processors = [ "batch" ];
-  #           exporters = [ "otlp" ];
-  #         };
-  #         metrics = {
-  #           receivers = [ "otlp" ];
-  #           processors = [ "batch" ];
-  #           exporters = [ "otlp" ];
-  #         };
-  #         logs = {
-  #           receivers = [ "otlp" ];
-  #           processors = [ "batch" ];
-  #           exporters = [ "otlp" ];
-  #         };
-  #       };
-  #     };
-  #   };
-  # };
+  services.opentelemetry-collector = {
+    enable = true;
+    settings = {
+      receivers = {
+        otlp.protocols.grpc.endpoint = "127.0.0.1:4317";
+        otlp.protocols.http.endpoint = "127.0.0.1:4318";
+      };
+
+      processors = {
+        batch = { };
+      };
+
+      exporters = {
+        otlp = {
+          endpoint = "127.0.0.1:4319"; # Tempo otlp-grpc
+          tls.insecure = true;
+        };
+        "otlphttp/metrics" = {
+          compression = "gzip";
+          encoding = "proto";
+          endpoint = "http://localhost:8428/opentelemetry";
+          tls.insecure = true;
+
+        };
+      };
+
+      service = {
+        pipelines = {
+          traces = {
+            receivers = [ "otlp" ];
+            processors = [ "batch" ];
+            exporters = [ "otlp" ];
+          };
+          metrics = {
+            receivers = [ "otlp" ];
+            processors = [ "batch" ];
+            exporters = [ "otlphttp/metrics" ];
+          };
+        };
+      };
+    };
+  };
+
+  services.victoriametrics.enable = true;
+
 
   services.grafana = {
     enable = true;
@@ -122,19 +119,25 @@ in
           name = "Tempo";
           type = "tempo";
           uid = "traces";
-          url = "http://127.0.0.1:3200";
+          url = "http://127.0.0.1:9080";
           access = "proxy";
           timeout = "300";
 
           jsonData = {
             nodeGraph.enabled = true;
             # tracesToLogs.datasourceUid = "logs";
-            # tracesToMetrics.datasourceUid = "metrics";
+            tracesToMetrics.datasourceUid = "metrics";
             # serviceMap.datasourceUid = "metrics";
             # nodeGraph.enabled = true;
             # lokiSearch.datasourceUid = "logs";
           };
         }
+        {
+          name = "prometheus";
+          type = "prometheus";
+          uid = "metrics";
+          url = "http://localhost:8428/";
+        }
       ];
     };
   };
@@ -143,5 +146,6 @@ in
 
   services.nginx.virtualHosts."${domain}".locations."/grafana" = {
     proxyPass = "http://localhost:3000";
+    proxyWebsockets = true;
   };
 }