seisee/precompute_all_v4.py

import json, sys, os, numpy as np, h5py
from pathlib import Path
from datetime import datetime
from tqdm import tqdm

INDEX_PATH = Path("/mnt/kingston/seismic_webapp/data/index.json")
OUTPUT_DIR = Path("/mnt/kingston/seismic_webapp/data/rms_cache")
SAMPLE_RATE = 200

def fix_path(p):
    p = p.replace('\\', '/')
    if p.startswith('F:/'): return '/mnt/kingston/' + p[3:]
    if p.startswith('E:/'): return '/mnt/data_sdb1/' + p[3:]
    return p

def compute_rms(h5_path):
    h5_path = fix_path(h5_path)
    if not os.path.exists(h5_path): return None
    try:
        with h5py.File(h5_path, 'r') as f:
            ds = f['adc_values']
            start_ts = int(ds.attrs.get('timestamp', 0))
            if start_ts == 0: return None
            # On prend 5000 samples pour un RMS représentatif
            samples = ds[0:5000]
            rms = float(np.sqrt(np.mean(samples.astype(np.float64)**2)))
            return [{'ts': start_ts, 'rms': rms}]
    except: return None

def main():
    with open(INDEX_PATH, 'r') as f: index = json.load(f)
    nodes = index.get('nodes', {})
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)

    # Toutes les dates du système
    all_dates = set()
    for n in nodes.values():
        if 'dates' in n: all_dates.update(n['dates'].keys())

    print(f"Dates à traiter: {sorted(list(all_dates))}")

    channel = "ch0"
    for date in sorted(list(all_dates)):
        output_file = OUTPUT_DIR / f"rms_{date}_{channel}.json"
        # On force la régénération pour être sûr d'avoir tout
        print(f"Processing {date}...")
        results = {}
        for nid, node in tqdm(nodes.items(), desc=f"Nodes {date}"):
            files = node.get('dates', {}).get(date, [])
            # On cherche les fichiers data prioritaires
            target = next((f for f in files if '_data_' in f['path'] and f'_{channel}_' in f['path']), None)
            if not target and files: target = files[0] # Fallback

            if target:
                data = compute_rms(target['path'])
                if data: results[nid] = data

        if results:
            with open(output_file, 'w') as f:
                json.dump({'date':date, 'channel':channel, 'nodes':results}, f)
            print(f"Sauvegardé {output_file.name}: {len(results)} nodes")

if __name__ == '__main__': main()