Kapitel 13/Tutorial.md aktualisiert

This commit is contained in:
2025-09-17 20:13:26 +00:00
parent 5a122145d9
commit 6d27408f23

View File

@@ -125,7 +125,7 @@ SFTP_USER=sftp_uploader
SFTP_KEY=/home/clipper/.ssh/nc_sftp_ed25519 SFTP_KEY=/home/clipper/.ssh/nc_sftp_ed25519
DROP_BASE="/mnt/hdd/incoming" DROP_BASE="/mnt/hdd/incoming"
CLIPPER_PEAK_THRESHOLD=0.85 CLIPPER_PEAK_THRESHOLD=0.85
CLIPPER_MATCH_TOLERANCE=4.0
CLIPPER_IN=/srv/clipper/watch CLIPPER_IN=/srv/clipper/watch
CLIPPER_OUT=/srv/clipper/out CLIPPER_OUT=/srv/clipper/out
@@ -826,86 +826,112 @@ Das folgende Schaubild zeigt dir die konkrete Verkabelung
``` ```
```bash ```bash
#!/usr/bin/env bash #!/bin/bash
set -euo pipefail set -euo pipefail
. /etc/clipper/clipper.env # Umgebungsvariablen laden
if [ -f "/etc/clipper/clipper.env" ]; then
set -a
. "/etc/clipper/clipper.env"
set +a
else
echo "[ERROR] Environment file not found: /etc/clipper/clipper.env" >&2
exit 1
fi
ID="${1:?need VOD id}" # Erwartete Umgebungsvariablen prüfen
: "${CLIPPER_PEAK_THRESHOLD:?Environment variable CLIPPER_PEAK_THRESHOLD is not set.}"
: "${CLIPPER_TMP:?Environment variable CLIPPER_TMP is not set.}"
: "${CLIPPER_LOG:?Environment variable CLIPPER_LOG is not set.}"
VOD_IN_MP4="${CLIPPER_OUT}/${ID}/original/${ID}.mp4" # ID aus dem Aufruf übernehmen
OUT_BASE="${CLIPPER_OUT}/${ID}" VOD_ID="$1"
ANALYSIS="${OUT_BASE}/analysis"
LOGDIR="${CLIPPER_LOG}/${ID}"
mkdir -p "$ANALYSIS" "$LOGDIR" VOD_PATH="/srv/clipper/out/$VOD_ID/original/$VOD_ID.mp4"
exec > >(tee -a "${LOGDIR}/analyze.log") 2>&1 TMP_DIR="$CLIPPER_TMP/$VOD_ID"
echo "== Analyze $ID ==" TMP_AUDIO="$TMP_DIR/audio.wav"
LOG_DIR="$CLIPPER_LOG/$VOD_ID"
TMP_LOG_AUDIO="$LOG_DIR/audio.log"
TMP_JSON="$TMP_DIR/candidates.json"
echo "[FFMPEG] Szenewechselanalyse läuft..." mkdir -p "$TMP_DIR" "$LOG_DIR"
ffmpeg -hide_banner -loglevel error -i "${VOD_IN_MP4}" \ exec > >(tee -a "${LOG_DIR}/analyze.log") 2>&1
-vf "scale=-2:360,select=gt(scene\,0.30),showinfo" -an -f null - \ echo "== Analyze $VOD_ID =="
2> "${LOGDIR}/sceneinfo.log" echo "[INFO] VOD gefunden: $VOD_PATH"
echo "[INFO] Extrahiere WAV aus $VOD_PATH → $TMP_AUDIO"
echo "[FFMPEG] Audiostatistik läuft..." # Audio extrahieren mit Logging
ffmpeg -hide_banner -loglevel error -i "${VOD_IN_MP4}" \ ffmpeg -v warning -i "$VOD_PATH" -ac 1 -ar 16000 -vn "$TMP_AUDIO" 2> "$TMP_LOG_AUDIO"
-vn -ac 1 -ar 16000 \ echo "[OK] Audio extrahiert: $TMP_AUDIO ($(du -h "$TMP_AUDIO" | cut -f1))"
-af "astats=metadata=1:reset=2,ametadata=print:key=lavfi.astats.Overall.RMS_level" \
-f null - \
2> "${LOGDIR}/astats.log" || true
ANALYSIS="$ANALYSIS" LOGDIR="$LOGDIR" python3 - <<'PY' echo "[INFO] Verwende Schwelle: $CLIPPER_PEAK_THRESHOLD"
import os, re, json, sys echo "[INFO] Starte Python-Analyse..."
from datetime import datetime
def log(msg): # Python-Analyse
timestamp = datetime.now().strftime("%F %T") /srv/clipper/.venv/bin/python3 - <<EOF
print(f"[PY] [{timestamp}] {msg}") import os
import json
import numpy as np
import soundfile as sf
import librosa
out = os.environ["ANALYSIS"] path = "$TMP_AUDIO"
logdir = os.environ["LOGDIR"] outfile = "$TMP_JSON"
threshold = float(os.getenv("CLIPPER_PEAK_THRESHOLD", "0.85"))
scene_ts = []
log("Lese sceneinfo.log...")
try: try:
with open(os.path.join(logdir, "sceneinfo.log"), errors="ignore") as f: y, sr = librosa.load(path, sr=None, mono=True)
for line in f:
m = re.search(r"pts_time:([0-9]+(?:\.[0-9]+)?)", line)
if m:
scene_ts.append(float(m.group(1)))
except Exception as e: except Exception as e:
log(f"Fehler beim Lesen von sceneinfo.log: {e}") print("[ERROR] Laden fehlgeschlagen:", e)
sys.exit(1) exit(1)
log(f"{len(scene_ts)} Szenenwechsel gefunden.") if len(y) == 0:
print("[WARN] Keine Audio-Daten vorhanden.")
with open(outfile, 'w') as f:
json.dump([], f)
print(f"[DONE] {outfile} geschrieben mit 0 Clip(s)")
exit(0)
has_audio = False frame_length = sr // 2
ap = os.path.join(logdir, "astats.log") energy = np.array([
if os.path.exists(ap): np.sum(np.abs(y[i:i+frame_length]))
log("Prüfe astats.log auf Audiodaten...") for i in range(0, len(y), frame_length)
with open(ap, errors="ignore") as f: ])
has_audio = "RMS_level" in f.read()
log(f"Audioanalyse: {'gefunden' if has_audio else 'nicht vorhanden'}") cutoff = np.quantile(energy, threshold)
high_energy = np.where(energy > cutoff)[0]
cands = [{ if len(high_energy) == 0:
"start": max(0.0, t - 2.0), print("[INFO] Keine Peaks über Schwelle gefunden.")
"end": t + 6.0, with open(outfile, 'w') as f:
"score": round(0.6 + (0.1 if has_audio else 0), 2), json.dump([], f)
"tags": ["scene-cut"] + (["audio-peak"] if has_audio else []) print(f"[DONE] {outfile} geschrieben mit 0 Clip(s)")
} for t in scene_ts] exit(0)
target = os.path.join(out, "candidates.json") # Zeiträume berechnen
try: candidates = []
with open(target, "w", encoding="utf-8") as f: t_start = None
json.dump(cands, f, ensure_ascii=False, indent=2) for i in range(len(energy)):
log(f"{len(cands)} Kandidaten gespeichert → {target}") t = i * frame_length / sr
except Exception as e: if energy[i] > cutoff:
log(f"Fehler beim Schreiben von candidates.json: {e}") if t_start is None:
sys.exit(2) t_start = t
PY elif t_start is not None:
t_end = t
if t_end - t_start > 5:
candidates.append({"start": round(t_start, 2), "end": round(t_end, 2)})
t_start = None
echo "== Done $ID ==" if t_start is not None:
t_end = len(y) / sr
if t_end - t_start > 5:
candidates.append({"start": round(t_start, 2), "end": round(t_end, 2)})
with open(outfile, 'w') as f:
json.dump(candidates, f)
print(f"[DONE] {outfile} geschrieben mit {len(candidates)} Clip(s)")
EOF
``` ```
1. **SSH Node Analyze VOD** (Node-Name: Analyze VOD) 1. **SSH Node Analyze VOD** (Node-Name: Analyze VOD)
- Node-Typ: SSH - Node-Typ: SSH