From 8190523c30d8105c60960cec478e5ecf60784bef Mon Sep 17 00:00:00 2001 From: Rodrigo Arias Mallo Date: Tue, 14 Jan 2025 12:01:00 +0100 Subject: [PATCH] Add script to monitor GPFS MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Reviewed-by: Aleix Boné --- m/hut/gpfs-probe.nix | 31 +++++++++++++++++++++++++++++++ m/hut/gpfs-probe.sh | 18 ++++++++++++++++++ m/hut/monitoring.nix | 5 ++++- 3 files changed, 53 insertions(+), 1 deletion(-) create mode 100644 m/hut/gpfs-probe.nix create mode 100755 m/hut/gpfs-probe.sh diff --git a/m/hut/gpfs-probe.nix b/m/hut/gpfs-probe.nix new file mode 100644 index 0000000..d4a0d98 --- /dev/null +++ b/m/hut/gpfs-probe.nix @@ -0,0 +1,31 @@ +{ pkgs, config, lib, ... }: +let + gpfs-probe-script = pkgs.runCommand "gpfs-probe.sh" { } + '' + cp ${./gpfs-probe.sh} $out; + chmod +x $out + '' + ; +in +{ + # Use a new user to handle the SSH keys + users.groups.ssh-robot = { }; + users.users.ssh-robot = { + description = "SSH Robot"; + isNormalUser = true; + home = "/var/lib/ssh-robot"; + }; + + systemd.services.gpfs-probe = { + description = "Daemon to report GPFS latency via SSH"; + path = [ pkgs.openssh pkgs.netcat ]; + after = [ "network.target" ]; + wantedBy = [ "default.target" ]; + serviceConfig = { + Type = "simple"; + ExecStart = "${pkgs.socat}/bin/socat TCP4-LISTEN:9966,fork EXEC:${gpfs-probe-script}"; + User = "ssh-robot"; + Group = "ssh-robot"; + }; + }; +} diff --git a/m/hut/gpfs-probe.sh b/m/hut/gpfs-probe.sh new file mode 100755 index 0000000..b8f7f82 --- /dev/null +++ b/m/hut/gpfs-probe.sh @@ -0,0 +1,18 @@ +#!/bin/sh + +N=500 + +t=$(timeout 5 ssh bsc015557@glogin2.bsc.es "timeout 3 command time -f %e touch /gpfs/projects/bsc15/bsc015557/gpfs.{1..$N} 2>&1; rm -f /gpfs/projects/bsc15/bsc015557/gpfs.{1..$N}") + +if [ -z "$t" ]; then + t="5.00" +fi + +cat <