tsvm/mon2taud.py

#!/usr/bin/env python3
"""mon2taud.py — Convert Monotone (.MON) tracker modules to TSVM Taud (.taud)

Usage:
    python3 mon2taud.py input.MON output.taud [-v]

Monotone is Calvin "Trixter" French's tracker for the PC speaker / Tandy /
TI-99 SN76489. It has no user-defined instruments (the only instrument is
the beeper), 1..12 voices, 64 rows per pattern, ProTracker-flavoured 2-byte
cells and a reduced 8-effect set: 0,1,2,3,4,B,D,F.

This converter:
    - synthesises a single 32-byte squarewave instrument (instrument #1)
    - splits each Monotone pattern (64 × N voices) into N Taud patterns
    - converts notes (A0=27.5 Hz chromatic) to Taud 4096-TET centred on C4
    - maps the 8 Monotone effects to their closest Taud equivalents
    - approximates Hz/tick slides (1xx/2xx/3xx) at an A4=440 Hz reference

Limits: numVoices ≤ 20, numPatterns × numVoices ≤ 4095.
"""

import argparse
import gzip
import math
import struct
import sys

from taud_common import (
    set_verbose, vprint,
    TAUD_MAGIC, TAUD_VERSION, TAUD_HEADER_SIZE, TAUD_SONG_ENTRY,
    SAMPLEBIN_SIZE, INSTBIN_SIZE, SAMPLEINST_SIZE,
    PATTERN_ROWS, PATTERN_BYTES, NUM_PATTERNS_MAX, NUM_CUES, CUE_SIZE, NUM_VOICES,
    NOTE_NOP, NOTE_KEYOFF, NOTE_CUT, TAUD_C4,
    TOP_NONE, TOP_A, TOP_B, TOP_C, TOP_E, TOP_F, TOP_G, TOP_H, TOP_J,
    SEL_SET, SEL_FINE,
    J_SEMI_TABLE,
    encode_cue, deduplicate_patterns, encode_song_entry,
)


# ── Monotone constants ───────────────────────────────────────────────────────

MON_MAGIC_PREFIX  = b'\x08MONOTONE'        # only the first 9 bytes are stable
MON_HEADER_SIZE   = 0x15F                  # 92 magic + 3 meta + 256 order list
MON_PATTERN_ROWS  = 64                     # rows per Monotone pattern
MON_CELL_BYTES    = 2                      # one little-endian 16-bit word per cell

# Effect-code (3-bit) → ProTracker-style letter, following the format-doc table.
MON_EFFECT_LETTERS = ['0', '1', '2', '3', '4', 'B', 'D', 'F']

# Note value 1 = A0; C4 sits at value 40 (A0 + 39 semitones).
MON_NOTE_C4 = 40

# Slides are linear-in-Hz on Monotone but linear-in-4096-TET on Taud. Take A4
# (440 Hz) as the reference: 1 Hz at A4 ≈ 12/(440·ln 2) semitones, scaled by
# 4096/12 to Taud units, i.e. 4096/(440·ln 2) ≈ 13.43 units per Hz. The exact
# factor varies as 440/f, so the converted slide rate is wrong by a factor of
# two for every octave the sounding note lies away from A4 (the module
# docstring lists this approximation).
SLIDE_UNITS_PER_HZ = 12.0 / (440.0 * math.log(2.0)) * 4096.0 / 12.0


# ── Taud container ───────────────────────────────────────────────────────────

# Converter signature placed in the Taud header; assemble_taud() pads or
# truncates it to exactly 14 bytes before writing.
SIGNATURE = b"mon2taud/TSVM "    # 14 bytes


# ── Monotone parser ──────────────────────────────────────────────────────────

class MonRow:
    """One decoded Monotone pattern cell (a single voice on a single row).

    Fields, all initialised to zero:
      note        0 = empty, 0x7F = note off, else 1..126
      effect      0..7 (raw 3-bit code)
      effect_arg  0..63 (6-bit data)
    """

    __slots__ = ('note', 'effect', 'effect_arg')

    def __init__(self):
        # Every field starts out as the "empty" value.
        for field in MonRow.__slots__:
            setattr(self, field, 0)


def parse_mon(data: bytes):
    """Parse a raw Monotone (.MON) file image.

    Validates the header, builds the effective order list and decodes every
    pattern the order list references. Any validation failure terminates the
    process through sys.exit() with an "error: ..." message.

    Returns a dict with keys:
      'song_len'    header byte at 0x5C
      'num_voices'  header byte at 0x5D (accepted range 1..12)
      'order_list'  first song_len order entries with 0xFF slots removed
      'n_patterns'  highest referenced pattern index + 1
      'patterns'    patterns[pi][voice][row] -> MonRow
    """
    if not len(data) >= MON_HEADER_SIZE:
        sys.exit(f"error: file too short ({len(data)} bytes); "
                 f"need at least {MON_HEADER_SIZE} for the header")

    if not data[:9] == MON_MAGIC_PREFIX:
        sys.exit(f"error: bad magic; expected '\\x08MONOTONE', got {data[:9]!r}")

    song_len, num_voices = data[0x5C], data[0x5D]
    if not 1 <= num_voices <= 12:
        sys.exit(f"error: invalid voice count {num_voices} (expected 1..12)")

    # Effective order list: only the first song_len slots count, and 0xFF
    # entries are skip-slots (matches mtreader.lua and MT_PLAY.PAS' "ignore
    # 0xFF" semantics).
    order_list = [slot for slot in data[0x5F:0x15F][:song_len] if slot != 0xFF]
    if len(order_list) == 0:
        sys.exit("error: order list is empty after filtering 0xFF skip slots")

    n_patterns = 1 + max(order_list)
    row_stride = num_voices * MON_CELL_BYTES
    pattern_size = MON_PATTERN_ROWS * row_stride
    expected = MON_HEADER_SIZE + n_patterns * pattern_size
    if expected > len(data):
        sys.exit(f"error: file truncated; expected {expected} bytes for "
                 f"{n_patterns} patterns × {num_voices} voices, got {len(data)}")

    def decode_cell(offset):
        # Little-endian 16-bit cell: note(7) | effect(3) | data(6), MSB first.
        (word,) = struct.unpack_from('<H', data, offset)
        cell = MonRow()
        cell.note = (word >> 9) & 0x7F
        cell.effect = (word >> 6) & 0x07
        cell.effect_arg = word & 0x3F
        return cell

    # The file stores cells row-major (all voices of row 0, then row 1, ...);
    # the result is regrouped voice-major so each voice is a 64-row column.
    patterns = [
        [
            [
                decode_cell(base + r * row_stride + v * MON_CELL_BYTES)
                for r in range(MON_PATTERN_ROWS)
            ]
            for v in range(num_voices)
        ]
        for base in range(MON_HEADER_SIZE, expected, pattern_size)
    ]

    return {
        'song_len':   song_len,
        'num_voices': num_voices,
        'order_list': order_list,
        'n_patterns': n_patterns,
        'patterns':   patterns,
    }


# ── Note conversion (Monotone → Taud 4096-TET) ───────────────────────────────

def mon_note_to_taud(mon_note: int) -> int:
    """Translate a Monotone note value into a Taud note word.

    0 (empty cell) becomes NOTE_NOP and 0x7F (note off) becomes NOTE_CUT.
    Any other value is treated as a semitone index, re-centred so that
    MON_NOTE_C4 lands on TAUD_C4, scaled to 4096 steps per octave and clamped
    to the range 1..0xFFFD.
    """
    specials = {0: NOTE_NOP, 0x7F: NOTE_CUT}
    if mon_note in specials:
        return specials[mon_note]

    semitones_from_c4 = mon_note - MON_NOTE_C4
    pitch = TAUD_C4 + round(semitones_from_c4 * 4096.0 / 12.0)
    return min(max(pitch, 1), 0xFFFD)


# ── Effect mapping (Monotone 3-bit code + 6-bit data → Taud) ─────────────────

def encode_effect(eff_code: int, data: int) -> tuple:
    """Map one Monotone effect to a Taud effect.

    eff_code is the raw 3-bit effect code (only the low three bits are used)
    and data the 6-bit effect argument. Returns (taud_op, taud_arg16).
    """
    letter = MON_EFFECT_LETTERS[eff_code & 7]

    # 1xx / 2xx / 3xx: Hz-per-tick slides, rescaled to Taud pitch units.
    #   1 = slide up → F, 2 = slide down → E, 3 = tone portamento → G.
    slide_ops = {'1': TOP_F, '2': TOP_E, '3': TOP_G}
    if letter in slide_ops:
        return (slide_ops[letter], round(data * SLIDE_UNITS_PER_HZ) & 0xFFFF)

    # 0xy and 4xy both split the 6-bit argument into two 3-bit halves.
    if letter in ('0', '4'):
        hi = (data >> 3) & 0x7
        lo = data & 0x7
        if letter == '4':
            # Vibrato (hi = speed, lo = depth) → Taud H. Each 3-bit value
            # (0..7) is stretched to a byte (0..252) via × 0x24 (= 36).
            return (TOP_H, ((hi * 0x24) << 8) | (lo * 0x24))
        if data == 0:
            return (TOP_NONE, 0)
        # Non-zero argument on effect 0 → Taud J, halves mapped via J_SEMI_TABLE.
        return (TOP_J, (J_SEMI_TABLE[hi] << 8) | J_SEMI_TABLE[lo])

    if letter == 'B':                                # position jump → Taud B
        return (TOP_B, data & 0xFF)

    if letter == 'D':                                # pattern break → Taud C
        return (TOP_C, data & 0xFF)

    # Set speed → Taud A; a zero speed is invalid in Monotone and is dropped.
    if letter == 'F' and data != 0:
        return (TOP_A, (data & 0xFF) << 8)

    return (TOP_NONE, 0)


# ── Squarewave instrument synthesis ──────────────────────────────────────────

# 32-byte single-cycle 50%-duty square; played at 8372 Hz at C4 → 261.6 Hz tone.
SQUARE_SAMPLE = b'\xFF' * 16 + b'\x00' * 16
SQUARE_C2SPD  = 8372

def build_sample_inst_bin() -> bytes:
    """Build the uncompressed sample bin followed by the instrument bin.

    The sample bin holds the square wave at offset 0 and zeros elsewhere.
    The instrument bin has only instrument #1 (the 256-byte record at offset
    256) filled in; every other record stays zero.
    """
    sample_bin = bytearray(SAMPLEBIN_SIZE)
    sample_bin[:len(SQUARE_SAMPLE)] = SQUARE_SAMPLE

    inst_bin = bytearray(INSTBIN_SIZE)
    base = 256                       # instrument #1 (slot 0 always blank)
    wave_len = len(SQUARE_SAMPLE)

    # The first 23 bytes of the record are contiguous, so they go in as a
    # single packed write ('<' = little-endian, no padding).
    struct.pack_into(
        '<IHHHHHBHHHBB', inst_bin, base,
        0,             # +0   sample ptr
        wave_len,      # +4   length
        SQUARE_C2SPD,  # +6   rate at C4
        0,             # +8   play start
        0,             # +10  loop start
        wave_len,      # +12  loop end
        0x01,          # +14  forward loop
        0x2020,        # +15  vol-env: P (bit 13) | b (bit 5)
        0,             # +17  pan-env flags (P=0 → mixer skips)
        0,             # +19  pitch-env flags (P=0 → mixer skips)
        63,            # +21  vol env pt 0 = full
        0,             # +22
    )

    # Remaining fields are isolated single bytes further into the record.
    lone_bytes = (
        (171, 0xA0),   # IGV
        (177, 0x80),   # default pan = centre
        (182, 0xFF),   # filter cutoff off
        (183, 0xFF),   # filter resonance off
        (186, 0x01),   # NNA: cut
    )
    for offset, value in lone_bytes:
        inst_bin[base + offset] = value

    return bytes(sample_bin + inst_bin)


# ── Pattern build ────────────────────────────────────────────────────────────

def build_taud_pattern(grid: list, voice: int) -> bytes:
    """Render one voice of a Monotone pattern as a Taud pattern.

    grid is one parsed pattern (grid[voice][row] -> MonRow). Each row becomes
    an 8-byte record: note (u16), instrument, volume, pan, effect op (bytes)
    and effect argument (u16), all little-endian.
    """
    out = bytearray(PATTERN_BYTES)

    # Monotone has neither a volume nor a pan column, so both carry a
    # "FINE 0" no-op, except that row 0 pins the pan to centre.
    no_op = (SEL_FINE << 6) | 0
    pan_centre = (SEL_SET << 6) | 32

    for r, cell in enumerate(grid[voice]):
        note_taud = mon_note_to_taud(cell.note)
        op, arg = encode_effect(cell.effect, cell.effect_arg)
        struct.pack_into(
            '<HBBBBH', out, r * 8,
            note_taud,
            # Instrument #1 is triggered only by a real note (1..0x7E).
            int(1 <= cell.note <= 0x7E),
            no_op,
            pan_centre if r == 0 else no_op,
            op & 0xFF,
            arg & 0xFFFF,
        )

    return bytes(out)


def build_cue_sheet(order_list: list, num_voices: int, pat_remap: dict) -> bytes:
    """Build the cue sheet: one cue per order-list entry, the rest left blank.

    Order entry `o` plays the Taud patterns originally numbered
    o*num_voices .. o*num_voices + num_voices - 1, translated through
    pat_remap. Entries beyond NUM_CUES are dropped. Byte 30 of the last cue
    written is set to 0x01 (the halt instruction).
    """
    sheet = bytearray(NUM_CUES * CUE_SIZE)

    # Start from a sheet made entirely of empty cues.
    for slot in range(NUM_CUES):
        start = slot * CUE_SIZE
        sheet[start:start + CUE_SIZE] = encode_cue([], 0)

    used_orders = order_list[:NUM_CUES]
    for slot, order in enumerate(used_orders):
        first_pat = order * num_voices
        mapped = [pat_remap[first_pat + v] for v in range(num_voices)]
        start = slot * CUE_SIZE
        sheet[start:start + CUE_SIZE] = encode_cue(mapped, 0)

    if used_orders:
        final_slot = len(used_orders) - 1
        sheet[final_slot * CUE_SIZE + 30] = 0x01

    return bytes(sheet)


# ── Initial speed scan ───────────────────────────────────────────────────────

def find_initial_speed(patterns: list, order_list: list, num_voices: int) -> int:
    """Return the song's starting speed in ticks per row.

    Looks at row 0 of the first pattern in the order list and returns the
    argument of the first non-zero Fxx found, scanning voices in ascending
    order. Falls back to `max(num_voices, 4)` (the default tempo per
    MT_PLAY.PAS:238-239) when there is no such effect, the order list is
    empty, or its first entry points past the available patterns.
    """
    fallback = max(num_voices, 4)
    if not order_list or order_list[0] >= len(patterns):
        return fallback

    opening = patterns[order_list[0]]
    first_row = (opening[v][0] for v in range(num_voices))
    speeds = (
        cell.effect_arg
        for cell in first_row
        if cell.effect == 7 and 0 < cell.effect_arg < 0x40    # Fxx (idx 7)
    )
    return next(speeds, fallback)


# ── Top-level assembly ───────────────────────────────────────────────────────

def assemble_taud(mon: dict) -> bytes:
    """Assemble a complete Taud file image from a parsed Monotone module.

    mon is the dict produced by parse_mon(). The result is, in order: the
    Taud header, the gzip-compressed sample+instrument bin, a single song
    entry, the gzip-compressed pattern bin and the gzip-compressed cue sheet.

    Progress is reported through vprint(). Exits via sys.exit() if the number
    of generated patterns would exceed NUM_PATTERNS_MAX.
    """
    num_voices, patterns, order_list, n_patterns = (
        mon[key] for key in ('num_voices', 'patterns', 'order_list', 'n_patterns')
    )

    if NUM_VOICES < num_voices:
        vprint(f"  warning: {num_voices} voices > {NUM_VOICES}; truncating")
        num_voices = NUM_VOICES

    # Each Monotone pattern fans out into one Taud pattern per voice.
    orig_count = n_patterns * num_voices
    if orig_count > NUM_PATTERNS_MAX:
        sys.exit(
            f"error: {n_patterns} patterns × {num_voices} voices = "
            f"{n_patterns*num_voices} > {NUM_PATTERNS_MAX} Taud limit"
        )

    vprint(f"  voices: {num_voices}, mon patterns: {n_patterns}, "
           f"taud patterns: {n_patterns * num_voices}")

    speed = find_initial_speed(patterns, order_list, num_voices)
    vprint(f"  initial speed (ticks/row): {speed}")

    vprint("  building sample/instrument bin…")
    sampleinst_raw = build_sample_inst_bin()
    assert len(sampleinst_raw) == SAMPLEINST_SIZE
    # mtime=0 keeps the gzip streams byte-reproducible between runs.
    compressed = gzip.compress(sampleinst_raw, compresslevel=9, mtime=0)
    comp_size = len(compressed)
    vprint(f"  sample+inst bin: {SAMPLEINST_SIZE} → {comp_size} bytes (gzip)")

    vprint("  building pattern bin…")
    # Pattern-major, voice-minor: Taud pattern index = pi * num_voices + v.
    pat_bin = b''.join(
        build_taud_pattern(patterns[pi], v)
        for pi in range(n_patterns)
        for v in range(num_voices)
    )
    assert len(pat_bin) == orig_count * PATTERN_BYTES

    vprint("  deduplicating patterns…")
    pat_bin, pat_remap, num_taud_pats = deduplicate_patterns(pat_bin, orig_count)
    vprint(f"  patterns: {orig_count} → {num_taud_pats} unique "
           f"({orig_count - num_taud_pats} deduplicated)")

    vprint("  building cue sheet…")
    cue_sheet = build_cue_sheet(order_list, num_voices, pat_remap)
    assert len(cue_sheet) == NUM_CUES * CUE_SIZE

    pat_comp, cue_comp = (
        gzip.compress(bytes(blob), compresslevel=9, mtime=0)
        for blob in (pat_bin, cue_sheet)
    )
    vprint(f"  pattern bin: {len(pat_bin)} → {len(pat_comp)} bytes (gzip)")
    vprint(f"  cue sheet:   {len(cue_sheet)} → {len(cue_comp)} bytes (gzip)")

    # Header: magic, version, num_songs=1, comp_size of sample+inst, projOff=0, sig.
    header = b''.join((
        TAUD_MAGIC,
        bytes((TAUD_VERSION, 1)),
        struct.pack('<I', comp_size),
        bytes(4),
        SIGNATURE.ljust(14, b' ')[:14],     # signature field is exactly 14 bytes
    ))
    assert len(header) == TAUD_HEADER_SIZE

    # BPM 150 + ticks=mon_speed → row rate = 60/mon_speed (matches Monotone).
    bpm_stored = 150 - 24
    # bit 2 reserved (was 'm' fadeout-zero policy; removed). Monotone has no
    # instrument-level fadeout, so every Taud instrument carries fadeout=0
    # ("no fade") — notes retire on sample-end or pattern note-cut instead.
    flags_byte = 0x00

    song_table = encode_song_entry(
        # Song data begins right after the header, the compressed
        # sample+instrument bin and the one-entry song table.
        song_offset         = TAUD_HEADER_SIZE + comp_size + TAUD_SONG_ENTRY,
        num_voices          = num_voices,
        num_patterns        = num_taud_pats,
        bpm_stored          = bpm_stored,
        tick_rate           = speed,
        base_note           = 0xA000,
        base_freq           = SQUARE_C2SPD,
        flags_byte          = flags_byte,
        pat_bin_comp_size   = len(pat_comp),
        cue_sheet_comp_size = len(cue_comp),
        global_vol          = 0xFF,
        mixing_vol          = round(180 / num_voices),
    )
    assert len(song_table) == TAUD_SONG_ENTRY

    return b''.join((header, compressed, song_table, pat_comp, cue_comp))


# ── Main ─────────────────────────────────────────────────────────────────────

def main():
    """Command-line entry point: read a .MON file, convert it, write a .taud.

    Positional arguments are the input and output paths; -v/--verbose turns
    on progress messages. A failure to read the input or write the output is
    reported as a one-line "error: ..." message through sys.exit(), the same
    way parse_mon() and assemble_taud() report their failures, instead of
    escaping as a traceback.
    """
    ap = argparse.ArgumentParser(description=__doc__,
                                 formatter_class=argparse.RawDescriptionHelpFormatter)
    ap.add_argument('input',  help='Input .MON file')
    ap.add_argument('output', help='Output .taud file')
    ap.add_argument('-v', '--verbose', action='store_true',
                    help='Print conversion details to stderr')
    args = ap.parse_args()

    set_verbose(args.verbose)

    # Missing file, directory given as input, permission problems, ...
    try:
        with open(args.input, 'rb') as f:
            data = f.read()
    except OSError as exc:
        sys.exit(f"error: cannot read '{args.input}': {exc}")

    vprint(f"parsing '{args.input}' ({len(data)} bytes)…")
    mon = parse_mon(data)
    vprint(f"  songLen={mon['song_len']}, voices={mon['num_voices']}, "
           f"patterns={mon['n_patterns']}, orders={len(mon['order_list'])}")

    taud = assemble_taud(mon)

    # The whole image is built in memory first, so a conversion error never
    # leaves a half-written output file behind.
    try:
        with open(args.output, 'wb') as f:
            f.write(taud)
    except OSError as exc:
        sys.exit(f"error: cannot write '{args.output}': {exc}")

    print(f"wrote {len(taud)} bytes to '{args.output}'")
    if args.verbose:
        print(f"  magic ok: {taud[:8].hex()}", file=sys.stderr)


if __name__ == '__main__':
    main()