Another big round of refactoring and cleaning...

This commit is contained in:
2025-07-11 17:55:26 +02:00
parent aa61bf2a44
commit 168c5c0da6
323 changed files with 761 additions and 811 deletions

View File

@@ -0,0 +1,16 @@
# sys-hlth-btrfs
## Description
Checks the health of all mounted Btrfs filesystems by inspecting device error counters.
## Features
- Iterates over every Btrfs filesystem.
- Runs `btrfs device stats` and alerts if any error counters are non-zero.
- Hooks into systemd and a timer for regular checks.
- On failure, calls `sys-alm-compose.cymais@…` for notification.
## Usage
Just include this role in your playbook; it will:
1. Deploy a small shell script under `{{ path_administrator_scripts }}/sys-hlth-btrfs/`.
2. Install a `.service` and `.timer` unit.
3. Send alerts via `sys-alm-compose` if any filesystem shows errors.

View File

@@ -0,0 +1,11 @@
#!/bin/bash
exit_code=0
for path in $(btrfs filesystem show | awk '/ path /{print $NF}')
do
echo "Checking health for $path..."
result=$(btrfs device stats $path)
echo "$result"
regex='\.(.*)_errs(\s*)[1-9]'
[[ "$result" =~ $regex ]] && echo "Errors found!" && exit_code=1;
done
exit $exit_code

View File

@@ -0,0 +1,5 @@
- name: "reload sys-hlth-btrfs.cymais.service"
systemd:
name: sys-hlth-btrfs.cymais.service
enabled: yes
daemon_reload: yes

View File

@@ -0,0 +1,24 @@
---
galaxy_info:
author: "Kevin Veen-Birkenbach"
description: "Health-check for Btrfs filesystems, alerts on any device error counters."
company: |
Kevin Veen-Birkenbach
Consulting & Coaching Solutions
https://www.veen.world
license: "CyMaIS NonCommercial License (CNCL)"
license_url: "https://s.veen.world/cncl"
min_ansible_version: "2.9"
platforms:
- name: Archlinux
versions: ["rolling"]
galaxy_tags:
- monitor
- btrfs
- health
- systemd
- filesystem
repository: "https://s.veen.world/cymais"
documentation: "https://s.veen.world/cymais"
dependencies:
- sys-alm-compose

View File

@@ -0,0 +1,26 @@
- name: "create {{docker_health_btrfs_folder}}"
file:
path: "{{docker_health_btrfs_folder}}"
state: directory
mode: 0755
- name: create sys-hlth-btrfs.sh
copy:
src: sys-hlth-btrfs.sh
dest: "{{docker_health_btrfs_folder}}sys-hlth-btrfs.sh"
- name: create sys-hlth-btrfs.cymais.service
template:
src: sys-hlth-btrfs.service.j2
dest: /etc/systemd/system/sys-hlth-btrfs.cymais.service
notify: reload sys-hlth-btrfs.cymais.service
- name: "set 'service_name' to '{{ role_name }}'"
set_fact:
service_name: "{{ role_name }}"
- name: "include role for sys-timer for {{service_name}}"
include_role:
name: sys-timer
vars:
on_calendar: "{{on_calendar_health_btrfs}}"

View File

@@ -0,0 +1,7 @@
[Unit]
Description=Check btrfs status
OnFailure=sys-alm-compose.cymais@%n.service
[Service]
Type=oneshot
ExecStart=/bin/bash {{docker_health_btrfs_folder}}sys-hlth-btrfs.sh

View File

@@ -0,0 +1 @@
docker_health_btrfs_folder: '{{path_administrator_scripts}}sys-hlth-btrfs/'