codec-re: quiet bundle decodes FULLY (17k samples, zero errors)

User asked the right question: do events without 30 NN blocks decode fully? Answer: YES. event-a: Tran 3328 ✓ Vert 3328 ✓ Long 3328 ✓ (28 segments, 0 '30 NN') event-c: Tran 1280 ✓ Vert 1280 ✓ Long 1280 ✓ (12 segments, 0 '30 NN') event-d: Tran 1280 ✓ Vert 1280 ✓ Long 1280 ✓ (12 segments, 0 '30 NN') 17,664 ADC samples decoded byte-exact against BW's ASCII export. Zero divergences across event-a, event-c, event-d. This means the codec is FULLY SOLVED for any event without 30 NN blocks. The remaining gap is the 30 NN block format only — used for high-amplitude regions where deltas exceed int8 range. For quiet events (or quiet stretches of loud events), the decoder is complete. 9 new regression tests bring the total to 55, all passing. Files: tests/test_waveform_codec.py + docs/waveform_codec_re_status.md + new analysis/verify_quiet_bundle.py.
2026-05-12 04:07:55 +00:00
parent 07675626dc
commit ce5dc640ba
3 changed files with 108 additions and 12 deletions
@@ -261,6 +261,28 @@ MULTICHANNEL_FIXTURES = [
    (os.path.join(os.path.dirname(__file__), "fixtures", "5-11-26", "M529LL1L.JQ0"), "Vert", 258),
    # SP0 (loud all): Long all 3 segments byte-exact (1536 samples).
    (os.path.join(os.path.dirname(__file__), "fixtures", "5-11-26", "M529LL1A.SP0"), "Long", 1536),
+    # 5-8-26 quiet bundle: events without 30 NN blocks decode FULLY across all channels.
+    # event-a: 3328 samples × 3 channels = 9984 samples, all byte-exact.
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-a", "M529LKVQ.6S0"), "Tran", 3328),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-a", "M529LKVQ.6S0"), "Vert", 3328),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-a", "M529LKVQ.6S0"), "Long", 3328),
+    # event-c: 1280 samples × 3 channels
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-c", "M529LK44.AB0"), "Tran", 1280),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-c", "M529LK44.AB0"), "Vert", 1280),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-c", "M529LK44.AB0"), "Long", 1280),
+    # event-d: 1280 samples × 3 channels
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-d", "M529LK2V.470"), "Tran", 1280),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-d", "M529LK2V.470"), "Vert", 1280),
+    (os.path.join(os.path.dirname(__file__), "fixtures", "decode-re-5-8-26",
+                  "event-d", "M529LK2V.470"), "Long", 1280),
 ]


@@ -325,9 +347,16 @@ def _full_truth(path):

 def _full_truth_channel(path, channel):
    """Load one channel's samples (in 16-count units) from the BW ASCII export."""
-    import re
+    import glob, re
    col_idx = {"Tran": 0, "Vert": 1, "Long": 2, "MicL": 3}[channel]
-    with open(path + ".TXT", "r", encoding="utf-8", errors="replace") as f:
+    # event-a's TXT has a typo ("M59" vs "M529") — pick the .TXT in the same dir
+    # rather than assuming exact-name correspondence.
+    txt_path = path + ".TXT"
+    if not os.path.exists(txt_path):
+        candidates = glob.glob(os.path.join(os.path.dirname(path), "*.TXT"))
+        if candidates:
+            txt_path = candidates[0]
+    with open(txt_path, "r", encoding="utf-8", errors="replace") as f:
        lines = f.read().splitlines()
    header_idx = None
    for i, line in enumerate(lines):