remove uptimekuma, replace with textonly script
This commit is contained in:
parent
0acd4f2d72
commit
48ec633a59
6 changed files with 217 additions and 29 deletions
|
|
@ -9,13 +9,24 @@
|
||||||
../../modules/site.nix
|
../../modules/site.nix
|
||||||
./sites.nix
|
./sites.nix
|
||||||
./fail2ban.nix
|
./fail2ban.nix
|
||||||
./uptime-kuma.nix
|
|
||||||
./tinyauth.nix
|
./tinyauth.nix
|
||||||
./shlink.nix
|
./shlink.nix
|
||||||
./guestbook.nix
|
./guestbook.nix
|
||||||
./telegram-alerts.nix
|
./telegram-alerts.nix
|
||||||
|
../../modules/uptime
|
||||||
];
|
];
|
||||||
|
|
||||||
|
services.uptime = {
|
||||||
|
enable = true;
|
||||||
|
services = {
|
||||||
|
website = "https://ily.rs";
|
||||||
|
forgejo = "https://git.ily.rs";
|
||||||
|
foundry = "https://foundry.ily.rs";
|
||||||
|
wiki = "https://wiki.ily.rs";
|
||||||
|
penfield = "https://penfield.ily.rs";
|
||||||
|
};
|
||||||
|
};
|
||||||
|
|
||||||
networking.hostName = "lab";
|
networking.hostName = "lab";
|
||||||
|
|
||||||
services.openssh = {
|
services.openssh = {
|
||||||
|
|
|
||||||
|
|
@ -62,6 +62,13 @@ in
|
||||||
reverse_proxy localhost:8123
|
reverse_proxy localhost:8123
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@status path /status
|
||||||
|
handle @status {
|
||||||
|
root * /var/lib/uptime
|
||||||
|
rewrite * /status.txt
|
||||||
|
file_server
|
||||||
|
}
|
||||||
|
|
||||||
@site_file file {
|
@site_file file {
|
||||||
try_files {path} {path}/index.html
|
try_files {path} {path}/index.html
|
||||||
}
|
}
|
||||||
|
|
|
||||||
|
|
@ -29,7 +29,6 @@ let
|
||||||
"podman-dokuwiki"
|
"podman-dokuwiki"
|
||||||
"podman-shlink"
|
"podman-shlink"
|
||||||
"podman-shlink-web-client"
|
"podman-shlink-web-client"
|
||||||
"podman-uptime-kuma"
|
|
||||||
"podman-tinyauth"
|
"podman-tinyauth"
|
||||||
"site-webhook"
|
"site-webhook"
|
||||||
];
|
];
|
||||||
|
|
|
||||||
|
|
@ -1,27 +0,0 @@
|
||||||
{ ... }:
|
|
||||||
{
|
|
||||||
services.caddy.virtualHosts."status.ily.rs" = {
|
|
||||||
extraConfig = ''
|
|
||||||
reverse_proxy localhost:3001
|
|
||||||
encode zstd gzip
|
|
||||||
'';
|
|
||||||
};
|
|
||||||
|
|
||||||
services.caddy.virtualHosts."status.wynne.rs" = {
|
|
||||||
extraConfig = ''
|
|
||||||
redir https://status.ily.rs{uri} permanent
|
|
||||||
'';
|
|
||||||
};
|
|
||||||
|
|
||||||
virtualisation.oci-containers.containers.uptime-kuma = {
|
|
||||||
image = "louislam/uptime-kuma:2.2.1";
|
|
||||||
podman.user = "podman";
|
|
||||||
volumes = [
|
|
||||||
"/srv/uptime-kuma/data:/app/data"
|
|
||||||
];
|
|
||||||
ports = [ "127.0.0.1:3001:3001" ];
|
|
||||||
};
|
|
||||||
|
|
||||||
# Workaround for NixOS/nixpkgs#410857 until backport of #475089 lands
|
|
||||||
systemd.services.podman-uptime-kuma.serviceConfig.Delegate = true;
|
|
||||||
}
|
|
||||||
98
modules/uptime/default.nix
Normal file
98
modules/uptime/default.nix
Normal file
|
|
@ -0,0 +1,98 @@
|
||||||
|
{ config, lib, pkgs, ... }:
|
||||||
|
let
|
||||||
|
cfg = config.services.uptime;
|
||||||
|
|
||||||
|
servicesEnv = lib.concatStringsSep "\n"
|
||||||
|
(lib.mapAttrsToList (name: url: "${name} ${url}") cfg.services);
|
||||||
|
|
||||||
|
runScript = pkgs.writeShellApplication {
|
||||||
|
name = "uptime-run";
|
||||||
|
runtimeInputs = with pkgs; [ curl gawk coreutils ];
|
||||||
|
text = builtins.readFile ./run.sh;
|
||||||
|
};
|
||||||
|
in
|
||||||
|
{
|
||||||
|
options.services.uptime = {
|
||||||
|
enable = lib.mkEnableOption "minimal text-only uptime status page";
|
||||||
|
|
||||||
|
interval = lib.mkOption {
|
||||||
|
type = lib.types.str;
|
||||||
|
default = "5min";
|
||||||
|
description = "Probe interval, passed to the timer's OnUnitActiveSec.";
|
||||||
|
};
|
||||||
|
|
||||||
|
outputPath = lib.mkOption {
|
||||||
|
type = lib.types.str;
|
||||||
|
default = "/var/lib/uptime/status.txt";
|
||||||
|
description = ''
|
||||||
|
Path where the rendered status page is written.
|
||||||
|
Must be writable by the uptime user. The default lives inside the
|
||||||
|
unit's StateDirectory, which is created and owned automatically.
|
||||||
|
'';
|
||||||
|
};
|
||||||
|
|
||||||
|
services = lib.mkOption {
|
||||||
|
type = lib.types.attrsOf lib.types.str;
|
||||||
|
default = {};
|
||||||
|
example = { forgejo = "https://git.ily.rs"; };
|
||||||
|
description = "Map of service name to URL to probe.";
|
||||||
|
};
|
||||||
|
|
||||||
|
retentionDays = lib.mkOption {
|
||||||
|
type = lib.types.int;
|
||||||
|
default = 90;
|
||||||
|
description = "How many days of log entries to keep on disk.";
|
||||||
|
};
|
||||||
|
|
||||||
|
displayDays = lib.mkOption {
|
||||||
|
type = lib.types.int;
|
||||||
|
default = 30;
|
||||||
|
description = "How many days of history to render in the bar.";
|
||||||
|
};
|
||||||
|
};
|
||||||
|
|
||||||
|
config = lib.mkIf cfg.enable {
|
||||||
|
assertions = [{
|
||||||
|
assertion = cfg.displayDays <= cfg.retentionDays;
|
||||||
|
message = "services.uptime.displayDays (${toString cfg.displayDays}) must be <= retentionDays (${toString cfg.retentionDays}).";
|
||||||
|
}];
|
||||||
|
|
||||||
|
users.users.uptime = {
|
||||||
|
isSystemUser = true;
|
||||||
|
group = "uptime";
|
||||||
|
home = "/var/lib/uptime";
|
||||||
|
};
|
||||||
|
users.groups.uptime = {};
|
||||||
|
|
||||||
|
systemd.services.uptime = {
|
||||||
|
description = "Probe configured services and render the status page";
|
||||||
|
after = [ "network-online.target" ];
|
||||||
|
wants = [ "network-online.target" ];
|
||||||
|
environment = {
|
||||||
|
SERVICES = servicesEnv;
|
||||||
|
OUTPUT_PATH = cfg.outputPath;
|
||||||
|
RETENTION_DAYS = toString cfg.retentionDays;
|
||||||
|
DISPLAY_DAYS = toString cfg.displayDays;
|
||||||
|
};
|
||||||
|
serviceConfig = {
|
||||||
|
Type = "oneshot";
|
||||||
|
ExecStart = lib.getExe runScript;
|
||||||
|
User = "uptime";
|
||||||
|
Group = "uptime";
|
||||||
|
StateDirectory = "uptime";
|
||||||
|
StateDirectoryMode = "0755";
|
||||||
|
UMask = "0022";
|
||||||
|
};
|
||||||
|
};
|
||||||
|
|
||||||
|
systemd.timers.uptime = {
|
||||||
|
description = "Periodic uptime probe";
|
||||||
|
wantedBy = [ "timers.target" ];
|
||||||
|
timerConfig = {
|
||||||
|
OnBootSec = "1min";
|
||||||
|
OnUnitActiveSec = cfg.interval;
|
||||||
|
Unit = "uptime.service";
|
||||||
|
};
|
||||||
|
};
|
||||||
|
};
|
||||||
|
}
|
||||||
100
modules/uptime/run.sh
Normal file
100
modules/uptime/run.sh
Normal file
|
|
@ -0,0 +1,100 @@
|
||||||
|
: "${SERVICES:?must be set}"
|
||||||
|
: "${OUTPUT_PATH:?must be set}"
|
||||||
|
: "${RETENTION_DAYS:?must be set}"
|
||||||
|
: "${DISPLAY_DAYS:?must be set}"
|
||||||
|
|
||||||
|
state_dir=$(dirname "$OUTPUT_PATH")
|
||||||
|
mkdir -p "$state_dir"
|
||||||
|
|
||||||
|
now=$(date -u +%s)
|
||||||
|
retention_cutoff=$(( now - RETENTION_DAYS * 86400 ))
|
||||||
|
|
||||||
|
# Probe each service and rotate its log.
|
||||||
|
while IFS= read -r line; do
|
||||||
|
[ -z "$line" ] && continue
|
||||||
|
name=${line%% *}
|
||||||
|
url=${line#* }
|
||||||
|
log="$state_dir/$name.log"
|
||||||
|
|
||||||
|
code=$(curl -fsS --max-time 10 -o /dev/null -w '%{http_code}' "$url" 2>/dev/null || true)
|
||||||
|
if [ -z "$code" ] || [ "$code" = "000" ]; then
|
||||||
|
code="000"
|
||||||
|
up=0
|
||||||
|
elif [ "${code:0:1}" = "2" ] || [ "${code:0:1}" = "3" ]; then
|
||||||
|
up=1
|
||||||
|
else
|
||||||
|
up=0
|
||||||
|
fi
|
||||||
|
printf '%s %s %s\n' "$now" "$up" "$code" >> "$log"
|
||||||
|
|
||||||
|
awk -v cutoff="$retention_cutoff" '$1 >= cutoff' "$log" > "$log.tmp"
|
||||||
|
mv "$log.tmp" "$log"
|
||||||
|
done <<< "$SERVICES"
|
||||||
|
|
||||||
|
# Render. bucket_size and cell_count are parameters so we can add
|
||||||
|
# hour/minute granularity rows later without restructuring the awk.
|
||||||
|
render_row() {
|
||||||
|
local log_file="$1"
|
||||||
|
local now_arg="$2"
|
||||||
|
local bucket_size="$3"
|
||||||
|
local cells="$4"
|
||||||
|
|
||||||
|
if [ ! -s "$log_file" ]; then
|
||||||
|
local pad
|
||||||
|
pad=$(printf '%*s' "$cells" '' | tr ' ' '?')
|
||||||
|
printf '%s 0.0 unknown\n' "$pad"
|
||||||
|
return
|
||||||
|
fi
|
||||||
|
|
||||||
|
awk -v now="$now_arg" -v bucket="$bucket_size" -v cells="$cells" '
|
||||||
|
BEGIN {
|
||||||
|
bucket_origin = int(now / bucket) * bucket
|
||||||
|
window_start = bucket_origin - (cells - 1) * bucket
|
||||||
|
window_end = bucket_origin + bucket
|
||||||
|
last_ok = -1
|
||||||
|
}
|
||||||
|
{
|
||||||
|
ts = $1; ok = $2
|
||||||
|
if (ts >= window_start && ts < window_end) {
|
||||||
|
idx = int((ts - window_start) / bucket)
|
||||||
|
if (idx >= 0 && idx < cells) {
|
||||||
|
if (ok == 1) up[idx]++; else down[idx]++
|
||||||
|
}
|
||||||
|
}
|
||||||
|
last_ok = ok
|
||||||
|
}
|
||||||
|
END {
|
||||||
|
bar = ""; total_up = 0; total_all = 0
|
||||||
|
for (i = 0; i < cells; i++) {
|
||||||
|
u = (i in up) ? up[i] : 0
|
||||||
|
d = (i in down) ? down[i] : 0
|
||||||
|
if (u + d == 0) bar = bar "?"
|
||||||
|
else if (d == 0) bar = bar "#"
|
||||||
|
else if (u == 0) bar = bar "_"
|
||||||
|
else bar = bar "."
|
||||||
|
total_up += u; total_all += u + d
|
||||||
|
}
|
||||||
|
pct = (total_all == 0) ? 0 : (100 * total_up / total_all)
|
||||||
|
state = (last_ok == 1) ? "up" : (last_ok == 0) ? "down" : "unknown"
|
||||||
|
printf "%s %.1f %s\n", bar, pct, state
|
||||||
|
}' "$log_file"
|
||||||
|
}
|
||||||
|
|
||||||
|
day_bucket=86400
|
||||||
|
|
||||||
|
tmp="$OUTPUT_PATH.tmp"
|
||||||
|
{
|
||||||
|
printf '# updated %s\n\n' "$(date -u -d "@$now" '+%Y-%m-%d %H:%M:%S UTC')"
|
||||||
|
|
||||||
|
while IFS= read -r line; do
|
||||||
|
[ -z "$line" ] && continue
|
||||||
|
name=${line%% *}
|
||||||
|
log="$state_dir/$name.log"
|
||||||
|
read -r bar pct state < <(render_row "$log" "$now" "$day_bucket" "$DISPLAY_DAYS")
|
||||||
|
printf '%-20s %s %-7s %5s%%\n' "$name" "$bar" "$state" "$pct"
|
||||||
|
done <<< "$SERVICES"
|
||||||
|
|
||||||
|
printf '\nlegend: # up . degraded _ down ? no data\n'
|
||||||
|
} > "$tmp"
|
||||||
|
|
||||||
|
mv "$tmp" "$OUTPUT_PATH"
|
||||||
Loading…
Add table
Add a link
Reference in a new issue