2023-06-03 01:33:51 +03:00
|
|
|
{ cluster, config, depot, lib, pkgs, tools, ... }:
|
|
|
|
let
|
|
|
|
inherit (tools.meta) domain;
|
|
|
|
|
|
|
|
inherit (cluster.config.links) loki-ingest prometheus-ingest;
|
|
|
|
|
|
|
|
inherit (cluster.config) hostLinks;
|
|
|
|
|
|
|
|
inherit (config.networking) hostName;
|
|
|
|
|
|
|
|
svc = cluster.config.services.monitoring;
|
|
|
|
|
|
|
|
iniList = lib.concatStringsSep " ";
|
|
|
|
|
|
|
|
login = x: "https://login.${domain}/auth/realms/master/protocol/openid-connect/${x}";
|
|
|
|
in
|
|
|
|
{
|
|
|
|
age.secrets = {
|
|
|
|
grafana-db-credentials = {
|
|
|
|
file = ./secrets/grafana-db-credentials.age;
|
|
|
|
owner = "grafana";
|
|
|
|
};
|
|
|
|
grafana-secrets.file = ./secrets/grafana-secrets.age;
|
|
|
|
};
|
|
|
|
|
|
|
|
services.grafana = {
|
|
|
|
enable = true;
|
|
|
|
package = depot.packages.grafana;
|
|
|
|
settings = {
|
|
|
|
server = {
|
|
|
|
root_url = "https://monitoring.${domain}/";
|
|
|
|
http_addr = hostLinks.${hostName}.grafana.ipv4;
|
|
|
|
http_port = hostLinks.${hostName}.grafana.port;
|
|
|
|
};
|
|
|
|
database = {
|
|
|
|
type = "postgres";
|
|
|
|
host = cluster.config.links.patroni-pg-access.tuple;
|
|
|
|
user = "grafana";
|
|
|
|
password = "$__file{${config.age.secrets.grafana-db-credentials.path}}";
|
|
|
|
};
|
|
|
|
analytics.reporting_enabled = false;
|
|
|
|
"auth.generic_oauth" = {
|
|
|
|
enabled = true;
|
|
|
|
allow_sign_up = true;
|
|
|
|
client_id = "net.privatevoid.monitoring1";
|
|
|
|
auth_url = login "auth";
|
|
|
|
token_url = login "token";
|
|
|
|
api_url = login "userinfo";
|
|
|
|
scopes = iniList [ "openid" "profile" "email" "roles" ];
|
|
|
|
role_attribute_strict = true;
|
|
|
|
role_attribute_path = "resource_access.monitoring.roles[0]";
|
|
|
|
};
|
|
|
|
security = {
|
|
|
|
cookie_secure = true;
|
|
|
|
disable_gravatar = true;
|
|
|
|
};
|
|
|
|
feature_toggles.enable = iniList [
|
|
|
|
"tempoSearch"
|
|
|
|
"tempoBackendSearch"
|
|
|
|
"tempoServiceGraph"
|
|
|
|
];
|
|
|
|
};
|
|
|
|
provision = {
|
|
|
|
enable = true;
|
|
|
|
datasources.settings.datasources = [
|
|
|
|
{
|
|
|
|
name = "Prometheus";
|
|
|
|
uid = "PBFA97CFB590B2093";
|
|
|
|
inherit (prometheus-ingest) url;
|
|
|
|
type = "prometheus";
|
|
|
|
isDefault = true;
|
|
|
|
}
|
|
|
|
{
|
|
|
|
name = "Loki";
|
|
|
|
uid = "P8E80F9AEF21F6940";
|
|
|
|
inherit (loki-ingest) url;
|
|
|
|
type = "loki";
|
|
|
|
}
|
|
|
|
];
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
systemd.services = {
|
|
|
|
grafana = {
|
|
|
|
enable = false;
|
|
|
|
serviceConfig.EnvironmentFile = config.age.secrets.grafana-secrets.path;
|
|
|
|
};
|
|
|
|
grafana-ha = let
|
|
|
|
base = config.systemd.services.grafana;
|
|
|
|
inherit (config.services) consul;
|
|
|
|
svc = config.consul.services.grafana;
|
|
|
|
run = pkgs.writeShellScript "grafana-ha-start" ''
|
|
|
|
trap '${svc.commands.deregister}' EXIT
|
|
|
|
${svc.commands.register}
|
|
|
|
${base.serviceConfig.ExecStart}
|
|
|
|
'';
|
|
|
|
in {
|
|
|
|
inherit (base) wantedBy;
|
|
|
|
description = "Grafana | High Availability";
|
|
|
|
aliases = [ "grafana.service" ];
|
|
|
|
|
|
|
|
after = base.after ++ [ "consul.service" ];
|
|
|
|
requires = [ "consul.service" ];
|
|
|
|
|
|
|
|
serviceConfig = base.serviceConfig // {
|
|
|
|
ExecStart = "${consul.package}/bin/consul lock --shell=false services/grafana ${run}";
|
2023-08-21 20:03:56 +03:00
|
|
|
ExecStopPost = "${svc.commands.deregister}";
|
2023-06-03 01:33:51 +03:00
|
|
|
# consul uses AF_NETLINK to determine interface addresses, even when just registering a service
|
|
|
|
RestrictAddressFamilies = base.serviceConfig.RestrictAddressFamilies ++ [ "AF_NETLINK" ];
|
2023-06-09 19:14:33 +03:00
|
|
|
Restart = "on-failure";
|
2023-08-21 20:03:56 +03:00
|
|
|
RestartSec = "10s";
|
2023-06-03 01:33:51 +03:00
|
|
|
};
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
services.nginx = {
|
|
|
|
upstreams.grafana-ha.servers = lib.mapAttrs' (_: links: lib.nameValuePair links.grafana.tuple {}) (lib.getAttrs (svc.nodes.grafana) hostLinks);
|
|
|
|
|
|
|
|
virtualHosts."monitoring.${domain}" = lib.recursiveUpdate (tools.nginx.vhosts.proxy "http://grafana-ha") {
|
|
|
|
locations."/".proxyWebsockets = true;
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
|
|
|
security.acme.certs."monitoring.${domain}" = {
|
|
|
|
dnsProvider = "pdns";
|
|
|
|
webroot = lib.mkForce null;
|
|
|
|
};
|
|
|
|
|
|
|
|
consul.services.grafana = {
|
|
|
|
mode = "manual";
|
|
|
|
unit = "grafana-ha";
|
|
|
|
definition = rec {
|
|
|
|
name = "grafana";
|
|
|
|
address = depot.reflection.interfaces.primary.addrPublic;
|
|
|
|
port = 443;
|
|
|
|
checks = [
|
2023-06-05 21:26:22 +03:00
|
|
|
rec {
|
2023-06-03 01:33:51 +03:00
|
|
|
name = "Frontend";
|
|
|
|
id = "service:grafana:frontend";
|
|
|
|
interval = "30s";
|
2023-06-05 21:26:22 +03:00
|
|
|
http = "https://${address}/healthz";
|
2023-06-03 01:33:51 +03:00
|
|
|
tls_server_name = "monitoring.${domain}";
|
2023-06-05 21:26:22 +03:00
|
|
|
header.Host = lib.singleton tls_server_name;
|
2023-06-03 01:33:51 +03:00
|
|
|
}
|
|
|
|
{
|
|
|
|
name = "Backend";
|
|
|
|
id = "service:grafana:backend";
|
|
|
|
interval = "5s";
|
|
|
|
http = "${hostLinks.${hostName}.grafana.url}/healthz";
|
|
|
|
}
|
|
|
|
];
|
|
|
|
};
|
|
|
|
};
|
|
|
|
}
|