Add script for ZFS snapshots (#136)

lstrojny · web-flow · commit fc283fee8607 · 2023-05-26T15:40:29.000+02:00
Signed-off-by: Lars Strojny &lt;lars@strojny.net&gt;
diff --git a/mock/fixtures/zfs_list_-p_-H_-t_snapshot_-o_name,used,creation b/mock/fixtures/zfs_list_-p_-H_-t_snapshot_-o_name,used,creation
@@ -0,0 +1,4 @@
+zpool/vol/0@snapshot-name	0	1685082363
+zpool/vol/0@snapshot-name	128	1685085436
+zpool/vol1@snapshot-name	0	1685099827
+zpool/vol1@snapshot-name	256	1685100606
diff --git a/mock/zfs b/mock/zfs
@@ -0,0 +1,6 @@
+#!/usr/bin/env bash
+
+# zfs mock script for testing zfs snapshot provider
+
+fixtures_dir=$(dirname "$0")/fixtures
+cat "${fixtures_dir}/zfs_list_-p_-H_-t_snapshot_-o_name,used,creation"
diff --git a/zfs-snapshots.py b/zfs-snapshots.py
@@ -0,0 +1,101 @@
+#!/usr/bin/env python3
+import os
+import subprocess
+from functools import reduce, partial
+from itertools import groupby
+from operator import itemgetter, add
+from prometheus_client import CollectorRegistry, Gauge, generate_latest
+
+
+def row_to_metric(metric: Gauge, row):
+    return metric.labels(pool=row[0][0], volume=row[0][1]).set(row[1])
+
+
+def collect_metrics(metric: Gauge, it) -> None:
+    list(map(partial(row_to_metric, metric), it))
+
+
+def zfs_parse_line(line):
+    cols = line.split("\t")
+    rest, snapshot = cols[0].rsplit("@", 1)
+    pool = rest
+    volume = None
+    if "/" in rest:
+        pool, volume = rest.split("/", 1)
+        volume = "/" + volume
+    return pool, volume, snapshot, *map(int, cols[1:])
+
+
+def zfs_list_snapshots():
+    cmd = [
+        "zfs",
+        "list",
+        "-p",
+        "-H",
+        "-t",
+        "snapshot",
+        "-o",
+        "name,used,creation",
+    ]
+    # zfs list can be relatively slow (couple of seconds)
+    # Use Popen to incrementally read from stdout to not waste further time
+    popen = subprocess.Popen(
+        cmd, stdout=subprocess.PIPE, env=dict(os.environ, LC_ALL="C")
+    )
+    for stdout_line in iter(popen.stdout.readline, ""):
+        stdout_line = stdout_line.strip()
+        if stdout_line == b"":
+            break
+        yield stdout_line.decode("utf-8")
+    return_code = popen.wait()
+    if return_code:
+        raise subprocess.CalledProcessError(return_code, cmd)
+
+
+def aggregate_rows(rows, index, operator):
+    return map(
+        lambda row: (row[0], reduce(operator, map(itemgetter(index), row[1]), 0)), rows
+    )
+
+
+NAMESPACE = "zfs_snapshot"
+LABEL_NAMES = ["pool", "volume"]
+
+
+def main():
+    registry = CollectorRegistry()
+    latest_time_metric = Gauge(
+        "latest_time",
+        "Timestamp of the latest snapshot",
+        labelnames=LABEL_NAMES,
+        namespace=NAMESPACE,
+        registry=registry,
+        unit="seconds",
+    )
+    space_used_metric = Gauge(
+        "space_used",
+        "Space used by snapshots in bytes",
+        labelnames=LABEL_NAMES,
+        namespace=NAMESPACE,
+        registry=registry,
+        unit="bytes",
+    )
+
+    snapshots = map(zfs_parse_line, zfs_list_snapshots())
+    per_fs = list(
+        map(
+            lambda row: (row[0], list(row[1])), groupby(snapshots, lambda row: row[0:2])
+        )
+    )
+
+    space_used = aggregate_rows(per_fs, -2, add)
+    latest_time = aggregate_rows(per_fs, -1, max)
+
+    collect_metrics(latest_time_metric, latest_time)
+    collect_metrics(space_used_metric, space_used)
+
+    print(generate_latest(registry).decode(), end="")
+
+
+if __name__ == "__main__":
+    main()