2023-11-26 09:56:08 -08:00
|
|
|
# NixOS module function; the attribute set that follows declares
# `options.shb.monitoring` and the matching `config`.
{ config, options, pkgs, lib, ... }:

let
  # Shorthand for the values the user set under `shb.monitoring`.
  cfg = config.shb.monitoring;

  # Host name "<subdomain>.<domain>" used for Grafana's own URL and for the
  # nginx virtual host.
  fqdn = cfg.subdomain + "." + cfg.domain;
in
|
|
|
|
{
|
|
|
|
options.shb.monitoring = {
|
|
|
|
# Master switch: the whole `config` section of this module is wrapped in
# `lib.mkIf cfg.enable`.
enable =
  lib.mkEnableOption "selfhostblocks.monitoring";
|
|
|
|
|
2023-07-15 15:09:54 -07:00
|
|
|
# Left-hand part of the host name; joined with `domain` to build the fqdn of
# the nginx virtual host that proxies to Grafana.
subdomain = lib.mkOption {
  type = lib.types.str;
  description = "Subdomain under which Grafana will be served.";
  example = "grafana";
};
|
|
|
|
|
|
|
|
# Right-hand part of the host name; also used to locate the certificate under
# /var/lib/acme/<domain>/ when `shb.ssl` is enabled.
domain = lib.mkOption {
  type = lib.types.str;
  description = "Domain under which Grafana will be served.";
  example = "mydomain.com";
};
|
2023-08-25 09:41:36 -07:00
|
|
|
|
2023-11-26 09:56:08 -08:00
|
|
|
# Forwarded to `services.grafana.settings.server.http_port`.
grafanaPort = lib.mkOption {
  description = "Port where Grafana listens to HTTP requests.";
  type = lib.types.port;
  default = 3000;
};
|
|
|
|
|
|
|
|
# Forwarded to `services.prometheus.port`.
prometheusPort = lib.mkOption {
  description = "Port where Prometheus listens to HTTP requests.";
  type = lib.types.port;
  default = 3001;
};
|
|
|
|
|
|
|
|
# Forwarded to `services.loki.configuration.server.http_listen_port`.
lokiPort = lib.mkOption {
  description = "Port where Loki listens to HTTP requests.";
  type = lib.types.port;
  default = 3002;
};
|
|
|
|
|
2023-08-25 09:41:36 -07:00
|
|
|
# Forwarded to Grafana's `server.router_logging` setting.
debugLog = lib.mkOption {
  description = "Set to true to enable debug logging of the infrastructure serving Grafana.";
  type = lib.types.bool;
  example = true;
  default = false;
};
|
2023-11-26 09:56:08 -08:00
|
|
|
|
|
|
|
# Inherited by every provisioned datasource, contact point, policy and rule
# group in this module.
orgId = lib.mkOption {
  description = "Org ID where all self host blocks related config will be stored.";
  type = lib.types.int;
  default = 1;
};
|
|
|
|
|
|
|
|
# Guards `services.grafana.provision.dashboards.settings` through `lib.mkIf`.
provisionDashboards = lib.mkOption {
  description = "Provision Self Host Blocks dashboards under 'Self Host Blocks' folder.";
  type = lib.types.bool;
  default = true;
};
|
|
|
|
|
|
|
|
# Joined with ";" into the address list of the provisioned email receiver.
# Must be non-empty when `smtp` is set (enforced by an assertion).
contactPoints = lib.mkOption {
  description = "List of email addresses to send alerts to";
  type = lib.types.listOf lib.types.str;
  default = [];
};
|
|
|
|
|
|
|
|
# No default: must be set by the user. Handed to Grafana through its
# `$__file{...}` indirection, so only the path ends up in the settings.
adminPasswordFile = lib.mkOption {
  description = "File containing the initial admin password.";
  type = lib.types.path;
};
|
|
|
|
|
|
|
|
# No default: must be set by the user. Handed to Grafana through its
# `$__file{...}` indirection, so only the path ends up in the settings.
secretKeyFile = lib.mkOption {
  description = "File containing the secret key used for signing.";
  type = lib.types.path;
};
|
|
|
|
|
|
|
|
# Optional outgoing-mail settings for Grafana. With the default `null`, the
# `smtp` section of the Grafana settings is left undefined.
smtp = lib.mkOption {
  description = "SMTP options.";
  default = null;
  type = lib.types.nullOr (lib.types.submodule {
    options = {
      from_address = lib.mkOption {
        type = lib.types.str;
        description = "SMTP address from which the emails originate.";
        example = "grafana@mydomain.com";
      };

      # These mails are sent by Grafana, so the display name defaults to
      # "Grafana" (the previous "Vaultwarden" default was a copy-paste
      # leftover from another module).
      from_name = lib.mkOption {
        type = lib.types.str;
        description = "SMTP name from which the emails originate.";
        default = "Grafana";
      };

      host = lib.mkOption {
        type = lib.types.str;
        description = "SMTP host to send the emails to.";
      };

      # Combined with `host` as "<host>:<port>" in the Grafana settings.
      port = lib.mkOption {
        type = lib.types.port;
        description = "SMTP port to send the emails to.";
        default = 25;
      };

      username = lib.mkOption {
        type = lib.types.str;
        description = "Username to connect to the SMTP host.";
      };

      # Referenced through Grafana's `$__file{...}` indirection.
      passwordFile = lib.mkOption {
        type = lib.types.str;
        description = "File containing the password to connect to the SMTP host.";
      };
    };
  });
};
|
2023-07-01 10:12:36 -07:00
|
|
|
};
|
|
|
|
|
|
|
|
config = lib.mkIf cfg.enable {
|
2023-11-26 09:56:08 -08:00
|
|
|
assertions = [
  {
    # Only checked when SMTP is configured: in that case at least one
    # recipient address has to be listed in `contactPoints`.
    assertion = (cfg.smtp != null) -> (builtins.length cfg.contactPoints > 0);
    message = "Must have at least one contact point for alerting";
  }
];
|
|
|
|
|
2023-11-23 01:03:33 -08:00
|
|
|
# Registers a "grafana" user/database pair with `shb.postgresql.ensures`.
# That option is defined outside this file; presumably it provisions them --
# verify against the postgresql block.
shb.postgresql.ensures = [
  { database = "grafana"; username = "grafana"; }
];
|
2023-07-01 10:12:36 -07:00
|
|
|
|
|
|
|
services.grafana = {
  enable = true;

  settings.database = {
    type = "postgres";
    host = "/run/postgresql";
    name = "grafana";
    user = "grafana";
    # Uses peer auth for local users, so we don't need a password.
    # Here's the syntax anyway for future reference:
    # password = "$__file{/run/secrets/homeassistant/dbpass}";
  };

  settings.security = {
    secret_key = "$__file{${cfg.secretKeyFile}}";
    # Enable when LDAP support is configured.
    disable_initial_admin_creation = false;
    # Remove when LDAP support is configured.
    admin_password = "$__file{${cfg.adminPasswordFile}}";
  };

  settings.server = {
    # Only listen on loopback; nginx proxies the public host name to it.
    http_addr = "127.0.0.1";
    http_port = cfg.grafanaPort;
    domain = fqdn;
    root_url = "https://${fqdn}";
    router_logging = cfg.debugLog;
  };

  # Defined only when the user supplied `shb.monitoring.smtp`.
  settings.smtp = lib.mkIf (cfg.smtp != null) {
    enabled = true;
    from_address = cfg.smtp.from_address;
    from_name = cfg.smtp.from_name;
    host = "${cfg.smtp.host}:${toString cfg.smtp.port}";
    user = cfg.smtp.username;
    password = "$__file{${cfg.smtp.passwordFile}}";
  };
};
|
|
|
|
|
|
|
|
services.grafana.provision = {
|
|
|
|
# Dashboard provider reading from ./monitoring/dashboards; defined only when
# `provisionDashboards` is true.
dashboards.settings = lib.mkIf cfg.provisionDashboards {
  apiVersion = 1;
  providers = [
    {
      folder = "Self Host Blocks";
      options = { path = ./monitoring/dashboards; };
      allowUiUpdates = true;
      disableDeletion = true;
    }
  ];
};
|
|
|
|
# Provisions the local Prometheus (default) and Loki instances as datasources.
datasources.settings = {
  apiVersion = 1;

  # Both names are also listed for deletion under the same org.
  deleteDatasources = map (name: { inherit (cfg) orgId; inherit name; }) [
    "Prometheus"
    "Loki"
  ];

  datasources = [
    {
      name = "Prometheus";
      type = "prometheus";
      orgId = cfg.orgId;
      uid = "df80f9f5-97d7-4112-91d8-72f523a02b09";
      url = "http://127.0.0.1:${toString config.services.prometheus.port}";
      isDefault = true;
      version = 1;
    }
    {
      name = "Loki";
      type = "loki";
      orgId = cfg.orgId;
      uid = "cd6cc53e-840c-484d-85f7-96fede324006";
      url = "http://127.0.0.1:${toString config.services.loki.configuration.server.http_listen_port}";
      version = 1;
    }
  ];
};
|
|
|
|
# Single contact point named "grafana-default-email"; the alerting policy
# routes to it by that name.
alerting.contactPoints.settings = {
  apiVersion = 1;
  contactPoints = [
    {
      orgId = cfg.orgId;
      name = "grafana-default-email";
      # No receiver at all when the address list is empty.
      receivers = lib.optionals (cfg.contactPoints != []) [
        {
          uid = "sysadmin";
          type = "email";
          settings = { addresses = lib.concatStringsSep ";" cfg.contactPoints; };
        }
      ];
    }
  ];
};
|
2023-11-26 09:56:08 -08:00
|
|
|
# Root notification policy: everything goes to the "grafana-default-email"
# contact point, grouped by folder and alert name.
alerting.policies.settings = {
  apiVersion = 1;
  policies = [
    {
      orgId = cfg.orgId;
      receiver = "grafana-default-email";
      group_by = [ "grafana_folder" "alertname" ];
      group_wait = "30s";
      group_interval = "5m";
      repeat_interval = "4h";
    }
  ];
  # resetPolicies seems to happen after setting the above policies,
  # effectively rolling back any updates.
};
|
|
|
|
# Alert rules are kept in ./monitoring/rules.json and loaded at evaluation
# time into a single "SysAdmin" rule group.
alerting.rules.settings =
  let
    rules = builtins.fromJSON (builtins.readFile ./monitoring/rules.json);
  in
  {
    apiVersion = 1;
    groups = [{
      inherit (cfg) orgId;
      name = "SysAdmin";
      folder = "Self Host Blocks";
      interval = "10m";
      inherit rules;
    }];
    # deleteRules seems to happen after creating the above rules, effectively
    # rolling back any updates.
  };
|
2023-07-01 10:12:36 -07:00
|
|
|
};
|
|
|
|
|
2023-07-15 15:09:54 -07:00
|
|
|
# Prometheus server on the user-selected port.
services.prometheus = {
  port = cfg.prometheusPort;
  enable = true;
};
|
|
|
|
|
2023-10-20 20:31:07 -07:00
|
|
|
# Single-node Loki: in-memory ring, replication factor 1, boltdb index and
# filesystem chunk store.
services.loki = {
  enable = true;
  dataDir = "/var/lib/loki";

  configuration = {
    auth_enabled = false;

    server = { http_listen_port = cfg.lokiPort; };

    ingester.lifecycler = {
      address = "127.0.0.1";
      ring.kvstore.store = "inmemory";
      ring.replication_factor = 1;
      final_sleep = "0s";
    };
    ingester.chunk_idle_period = "5m";
    ingester.chunk_retain_period = "30s";

    schema_config.configs = [
      {
        from = "2018-04-15";
        store = "boltdb";
        object_store = "filesystem";
        schema = "v9";
        index = {
          prefix = "index_";
          period = "168h";
        };
      }
    ];

    # NOTE(review): index and chunks live under /tmp while dataDir is
    # /var/lib/loki -- confirm that losing them when /tmp is cleared is
    # intended.
    storage_config = {
      boltdb = { directory = "/tmp/loki/index"; };
      filesystem = { directory = "/tmp/loki/chunks"; };
    };

    limits_config = {
      enforce_metric_name = false;
      reject_old_samples = true;
      reject_old_samples_max_age = "168h";
    };

    chunk_store_config.max_look_back_period = 0;

    table_manager =
      let
        # Same all-zero throughput settings for chunk and index tables.
        zeroThroughput = {
          inactive_read_throughput = 0;
          inactive_write_throughput = 0;
          provisioned_read_throughput = 0;
          provisioned_write_throughput = 0;
        };
      in
      {
        chunk_tables_provisioning = zeroThroughput;
        index_tables_provisioning = zeroThroughput;
        retention_deletes_enabled = false;
        retention_period = 0;
      };
  };
};
|
|
|
|
|
|
|
|
# promtail reads the systemd journal and pushes entries to the local Loki.
services.promtail = {
  enable = true;

  configuration = {
    server.http_listen_port = 9080;
    server.grpc_listen_port = 0;

    # NOTE(review): the positions file lives under /tmp -- confirm that
    # losing the read offsets when /tmp is cleared is acceptable.
    positions = { filename = "/tmp/positions.yaml"; };

    client = {
      url = "http://localhost:${toString config.services.loki.configuration.server.http_listen_port}/api/prom/push";
    };

    scrape_configs = [
      {
        job_name = "systemd";

        journal = {
          path = "/var/log/journal";
          max_age = "12h";
          json = false;
          # matches = "_TRANSPORT=kernel";
          labels.job = "systemd-journal";
        };

        # Copy the journal's systemd unit field into a "unit" label.
        relabel_configs = [
          {
            source_labels = [ "__journal__systemd_unit" ];
            target_label = "unit";
          }
        ];
      }
    ];
  };
};
|
|
|
|
|
2023-07-15 15:09:54 -07:00
|
|
|
# Reverse proxy: the monitoring host name is forwarded to the Grafana HTTP
# listener; TLS settings are only defined when `shb.ssl` is enabled.
services.nginx = {
  enable = true;

  virtualHosts."${fqdn}" = {
    forceSSL = lib.mkIf config.shb.ssl.enable true;
    sslCertificate = lib.mkIf config.shb.ssl.enable "/var/lib/acme/${cfg.domain}/cert.pem";
    sslCertificateKey = lib.mkIf config.shb.ssl.enable "/var/lib/acme/${cfg.domain}/key.pem";

    locations."/" =
      let
        grafanaServer = config.services.grafana.settings.server;
      in
      {
        proxyWebsockets = true;
        proxyPass = "http://${toString grafanaServer.http_addr}:${toString grafanaServer.http_port}";
      };
  };
};
|
|
|
|
|
2023-07-29 22:14:38 -07:00
|
|
|
# Scrape jobs. Every job has exactly one static target on 127.0.0.1; the
# nginx and dnsmasq jobs are only added when the matching service is enabled.
services.prometheus.scrapeConfigs =
  let
    exporters = config.services.prometheus.exporters;

    # One scrape job with a single loopback target on `port`.
    localJob = job_name: port: {
      inherit job_name;
      static_configs = [
        { targets = [ "127.0.0.1:${toString port}" ]; }
      ];
    };
  in
  [
    (localJob "node" exporters.node.port)
    (localJob "smartctl" exporters.smartctl.port)
    (localJob "prometheus_internal" config.services.prometheus.port)
  ]
  ++ lib.optional config.services.nginx.enable (localJob "nginx" exporters.nginx.port)
  # Disabled jobs, kept for reference:
  # ++ lib.optional (builtins.length (lib.attrNames config.services.redis.servers) > 0) (localJob "redis" exporters.redis.port)
  # ++ lib.optional (builtins.length (lib.attrNames config.services.openvpn.servers) > 0) (localJob "openvpn" exporters.openvpn.port)
  ++ lib.optional config.services.dnsmasq.enable (localJob "dnsmasq" exporters.dnsmasq.port);
|
2023-07-15 15:09:54 -07:00
|
|
|
# nginx exporter, only when nginx itself is enabled; it scrapes the local
# nginx status page.
services.prometheus.exporters.nginx = lib.mkIf config.services.nginx.enable {
  enable = true;
  listenAddress = "127.0.0.1";
  port = 9113;
  scrapeUri = "http://localhost:80/nginx_status";
};
|
2023-07-29 22:14:38 -07:00
|
|
|
# Node exporter bound to loopback.
services.prometheus.exporters.node = {
  enable = true;
  listenAddress = "127.0.0.1";
  port = 9115;
  # https://github.com/prometheus/node_exporter#collectors
  enabledCollectors = [ "systemd" "processes" "ethtool" ];
};
|
2023-09-25 22:55:41 -07:00
|
|
|
# smartctl exporter bound to loopback.
services.prometheus.exporters.smartctl = {
  enable = true;
  listenAddress = "127.0.0.1";
  port = 9117;
};
|
|
|
|
# services.prometheus.exporters.redis = lib.mkIf (builtins.length (lib.attrNames config.services.redis.servers) > 0) {
|
|
|
|
# enable = true;
|
|
|
|
# port = 9119;
|
|
|
|
# listenAddress = "127.0.0.1";
|
|
|
|
# };
|
|
|
|
# services.prometheus.exporters.openvpn = lib.mkIf (builtins.length (lib.attrNames config.services.openvpn.servers) > 0) {
|
|
|
|
# enable = true;
|
|
|
|
# port = 9121;
|
|
|
|
# listenAddress = "127.0.0.1";
|
|
|
|
# statusPaths = lib.mapAttrsToList (name: _config: "/tmp/openvpn/${name}.status") config.services.openvpn.servers;
|
|
|
|
# };
|
|
|
|
# dnsmasq exporter, only when dnsmasq itself is enabled.
services.prometheus.exporters.dnsmasq = lib.mkIf config.services.dnsmasq.enable {
  enable = true;
  listenAddress = "127.0.0.1";
  port = 9123;
};
|
2023-07-15 15:09:54 -07:00
|
|
|
# Turn on the nginx status page by default whenever nginx is enabled
# (`mkDefault`, so users can still override it).
services.nginx.statusPage =
  lib.mkDefault config.services.nginx.enable;
|
2023-07-01 10:12:36 -07:00
|
|
|
};
|
|
|
|
}
|