working TAV-DT decoder

2026-03-14 23:16:06 +09:00 · 2025-12-02 14:13:57 +09:00
parent 196b9a0c01
commit 046fa98025
5 changed files with 1018 additions and 93 deletions
--- a/video_encoder/tav_inspector.c
+++ b/video_encoder/tav_inspector.c
@@ -1,6 +1,7 @@
 // TAV Packet Inspector - Comprehensive packet analysis tool for TAV files
 // to compile: gcc -o tav_inspector tav_inspector.c -lzstd -lm
 // Created by CuriousTorvald and Claude on 2025-10-14
+// Updated 2025-12-02: Added TAV-DT (Digital Tape) format support
 #include <stdio.h>
 #include <stdint.h>
 #include <stdlib.h>
@@ -9,6 +10,10 @@
 #include <getopt.h>
 #include <zstd.h>

+// TAV-DT sync patterns: first 4 bytes of every DT packet header, compared MSB-first (big endian)
+#define TAV_DT_SYNC_NTSC  0xE3537A1F  // NTSC: 720x480
+#define TAV_DT_SYNC_PAL   0xD193A745  // PAL: 720x576
+
 // Frame mode constants (from TAV spec)
 #define FRAME_MODE_SKIP  0x00
 #define FRAME_MODE_INTRA 0x01
@@ -110,6 +115,24 @@ typedef struct {
    int summary_only;
 } display_options_t;

+// Read `count` items of `size` bytes into `dest`: from the DT payload buffer when
+// `payload` is non-NULL (advancing *offset past the bytes copied), else from `fp`.
+// Returns items read; 0 if the payload lacks the bytes (*offset is left unchanged).
+static size_t read_packet_data(void *dest, size_t size, size_t count, FILE *fp,
+                               uint8_t *payload, uint32_t payload_size, uint32_t *offset) {
+    if (!payload) {
+        return fread(dest, size, count, fp);  // TAV mode: read from file
+    }
+    // DT mode: compare against the remaining bytes so no product or sum can wrap
+    if ((size != 0 && count > SIZE_MAX / size) || *offset > payload_size ||
+        size * count > payload_size - *offset) {
+        return 0;  // Not enough data
+    }
+    memcpy(dest, payload + *offset, size * count);
+    *offset += (uint32_t)(size * count);  // fits: bounded by payload_size above
+    return count;
+}
+
 const char* get_packet_type_name(uint8_t type) {
    switch (type) {
        case TAV_PACKET_IFRAME: return "I-FRAME";
@@ -479,24 +502,87 @@ int main(int argc, char *argv[]) {
        printf("==================================================\n\n");
    }

-    // Read TAV header (32 bytes)
+    // Detect format: TAV (with magic) or TAV-DT (with sync pattern)
    uint8_t header[32];
-    if (fread(header, 1, 32, fp) != 32) {
-        fprintf(stderr, "Error: Failed to read TAV header\n");
+    int is_dt_format = 0;
+    uint16_t dt_width = 0, dt_height = 0;
+    uint8_t dt_framerate = 0;
+    uint8_t dt_quality = 0;
+    int dt_is_interlaced = 0;
+    int dt_is_ntsc_framerate = 0;
+
+    // Read first 4 bytes to check format
+    uint8_t format_check[4];
+    if (fread(format_check, 1, 4, fp) != 4) {
+        fprintf(stderr, "Error: Failed to read file header\n");
        fclose(fp);
        return 1;
    }

-    // Verify magic number
-    const char *magic = "\x1F\x54\x53\x56\x4D\x54\x41\x56";  // "\x1FTSVM TAV"
-    if (memcmp(header, magic, 8) != 0) {
-        fprintf(stderr, "Error: Invalid TAV magic number\n");
-        fclose(fp);
-        return 1;
+    // Check if it's a TAV-DT sync pattern
+    uint32_t sync = (format_check[0] << 24) | (format_check[1] << 16) |
+                    (format_check[2] << 8) | format_check[3];
+
+    if (sync == TAV_DT_SYNC_NTSC || sync == TAV_DT_SYNC_PAL) {
+        // TAV-DT format detected
+        is_dt_format = 1;
+        dt_width = (sync == TAV_DT_SYNC_NTSC) ? 720 : 720;
+        dt_height = (sync == TAV_DT_SYNC_NTSC) ? 480 : 576;
+
+        // Read rest of DT packet header (12 more bytes = 16 total)
+        uint8_t dt_header[12];
+        if (fread(dt_header, 1, 12, fp) != 12) {
+            fprintf(stderr, "Error: Failed to read TAV-DT packet header\n");
+            fclose(fp);
+            return 1;
+        }
+
+        dt_framerate = dt_header[0];
+        uint8_t flags = dt_header[1];
+        dt_is_interlaced = flags & 0x01;
+        dt_is_ntsc_framerate = flags & 0x02;
+        dt_quality = (flags >> 4) & 0x0F;
+
+        // Rewind to start of first packet so the loop can process it
+        fseek(fp, -(4 + 12), SEEK_CUR);  // Go back 16 bytes (full DT packet header)
+
+        if (!opts.summary_only) {
+            printf("TAV-DT Header (Headerless Streaming Format):\n");
+            printf("  Format:           %s %s\n",
+                   (sync == TAV_DT_SYNC_NTSC) ? "NTSC" : "PAL",
+                   dt_is_interlaced ? "interlaced" : "progressive");
+            printf("  Resolution:       %dx%d\n", dt_width, dt_height);
+            printf("  Frame rate:       %d fps", dt_framerate);
+            if (dt_is_ntsc_framerate) printf(" (NTSC)");
+            printf("\n");
+            printf("  Quality index:    %d (0-5)\n", dt_quality);
+            printf("  Total frames:     Unknown (streaming format)\n");
+            printf("  Wavelet:          1 (CDF 9/7, fixed for DT)\n");
+            printf("  Decomp levels:    4 spatial + 2 temporal (fixed for DT)\n");
+            printf("  Entropy coder:    EZBC (fixed for DT)\n");
+            printf("  Channel layout:   YCoCg-R (fixed for DT)\n");
+            printf("\n");
+        }
+    } else {
+        // Regular TAV format - rewind and read full header
+        rewind(fp);
+        if (fread(header, 1, 32, fp) != 32) {
+            fprintf(stderr, "Error: Failed to read TAV header\n");
+            fclose(fp);
+            return 1;
+        }
+
+        // Verify magic number
+        const char *magic = "\x1F\x54\x53\x56\x4D\x54\x41\x56";  // "\x1FTSVM TAV"
+        if (memcmp(header, magic, 8) != 0) {
+            fprintf(stderr, "Error: Invalid TAV magic number\n");
+            fclose(fp);
+            return 1;
+        }
    }

-    if (!opts.summary_only) {
-        // Parse header fields
+    if (!opts.summary_only && !is_dt_format) {
+        // Parse header fields (TAV format only)
        uint8_t version = header[8];
        uint8_t base_version = (version > 8) ? (version - 8) : version;
        uint8_t temporal_motion_coder = (version > 8) ? 1 : 0;
@@ -581,13 +667,76 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
    while (!feof(fp)) {
        long packet_offset = ftell(fp);
        uint8_t packet_type;
-        if (fread(&packet_type, 1, 1, fp) != 1) break;
+        uint8_t *packet_payload = NULL;
+        uint32_t payload_size = 0;
+        uint32_t payload_offset = 1;  // Start at 1 to skip packet type byte in DT mode
+
+        if (is_dt_format) {
+            // TAV-DT: Read 16-byte packet header
+            uint8_t dt_pkt_header[16];
+            if (fread(dt_pkt_header, 1, 16, fp) != 16) break;
+
+            // Parse DT packet header
+            uint32_t sync_check = (dt_pkt_header[0] << 24) | (dt_pkt_header[1] << 16) |
+                                  (dt_pkt_header[2] << 8) | dt_pkt_header[3];
+            payload_size = dt_pkt_header[8] | (dt_pkt_header[9] << 8) |
+                          (dt_pkt_header[10] << 16) | (dt_pkt_header[11] << 24);
+
+            // Verify sync pattern
+            if (sync_check != TAV_DT_SYNC_NTSC && sync_check != TAV_DT_SYNC_PAL) {
+                if (!opts.summary_only) {
+                    fprintf(stderr, "Warning: Invalid sync pattern 0x%08X at offset 0x%lX\n",
+                           sync_check, packet_offset);
+                }
+                break;
+            }
+
+            // Read packet payload
+            packet_payload = malloc(payload_size);
+            if (!packet_payload || fread(packet_payload, 1, payload_size, fp) != payload_size) {
+                free(packet_payload);
+                break;
+            }
+
+            // TAV-DT payload structure: [timecode(8)][TAD_packets...][video_packet]
+            // Skip past timecode (8 bytes) and any TAD packets to find the video packet
+            payload_offset = 8;  // Skip timecode
+
+            // Skip TAD audio packets (if any)
+            while (payload_offset < payload_size && packet_payload[payload_offset] == TAV_PACKET_AUDIO_TAD) {
+                payload_offset++;  // Skip packet type
+                if (payload_offset + 6 > payload_size) break;
+
+                // Skip past TAD packet header to get to payload size
+                payload_offset += 2;  // sample_count
+                uint32_t tad_payload_size = packet_payload[payload_offset] |
+                                           (packet_payload[payload_offset+1] << 8) |
+                                           (packet_payload[payload_offset+2] << 16) |
+                                           (packet_payload[payload_offset+3] << 24);
+                payload_offset += 4;  // payload_size field
+                payload_offset += tad_payload_size;  // Skip TAD payload
+            }
+
+            // Extract video packet type (should be at current offset)
+            if (payload_offset < payload_size) {
+                packet_type = packet_payload[payload_offset];
+                payload_offset++;  // Move past packet type for subsequent reads
+            } else {
+                packet_type = 0x00;  // No video packet
+            }
+        } else {
+            // Regular TAV: Read packet type directly
+            if (fread(&packet_type, 1, 1, fp) != 1) break;
+        }

        int display = should_display_packet(packet_type, &opts);

        if (!opts.summary_only && display) {
            printf("Packet %d (offset 0x%lX): Type 0x%02X (%s)",
                   packet_num, packet_offset, packet_type, get_packet_type_name(packet_type));
+            if (is_dt_format) {
+                printf(" [DT payload: %u bytes]", payload_size);
+            }
        }

        switch (packet_type) {
@@ -618,7 +767,7 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
            case TAV_PACKET_TIMECODE: {
                stats.timecode_count++;
                uint64_t timecode_ns;
-                if (fread(&timecode_ns, sizeof(uint64_t), 1, fp) != 1) break;
+                if (read_packet_data(&timecode_ns, sizeof(uint64_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                if (!opts.summary_only && display) {
                    double timecode_sec = timecode_ns / 1000000000.0;
@@ -630,22 +779,25 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
            case TAV_PACKET_GOP_UNIFIED: case TAV_PACKET_GOP_UNIFIED_MOTION: {
                // Unified GOP packet: [gop_size][motion_vectors...][compressed_size][data]
                uint8_t gop_size;
-                if (fread(&gop_size, 1, 1, fp) != 1) break;
+                if (read_packet_data(&gop_size, 1, 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                // Read motion vectors
                uint32_t size0 = 0;
                if (packet_type == TAV_PACKET_GOP_UNIFIED_MOTION) {
-                    if (fread(&size0, sizeof(uint32_t), 1, fp) != 1) { break; }
+                    if (read_packet_data(&size0, sizeof(uint32_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) { break; }
                    stats.total_video_bytes += size0;
                    stats.gop_unified_motion_count++;
-                    fseek(fp, size0, SEEK_CUR);
+                    if (!packet_payload) fseek(fp, size0, SEEK_CUR);
+                    else payload_offset += size0;
                }

                // Read compressed data size
                uint32_t size1;
-                if (fread(&size1, sizeof(uint32_t), 1, fp) != 1) { break; }
+                if (read_packet_data(&size1, sizeof(uint32_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) { break; }
                stats.total_video_bytes += size1;
-                fseek(fp, size1, SEEK_CUR);
+                if (!packet_payload) fseek(fp, size1, SEEK_CUR);
+                // else: data is already in payload buffer, skip ahead
+                else payload_offset += size1;


                stats.total_gop_frames += gop_size;
@@ -664,7 +816,7 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
            case TAV_PACKET_GOP_SYNC: {
                // GOP sync packet: [frame_count]
                uint8_t frame_count;
-                if (fread(&frame_count, 1, 1, fp) != 1) break;
+                if (read_packet_data(&frame_count, 1, 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                stats.gop_sync_count++;
                current_frame += frame_count;  // Advance frame counter
@@ -783,23 +935,23 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};

                // Read sample count
                uint16_t sample_count0;
-                if (fread(&sample_count0, sizeof(uint16_t), 1, fp) != 1) break;
+                if (read_packet_data(&sample_count0, sizeof(uint16_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                // Read payload_size + 7
                uint32_t payload_size_plus_7;
-                if (fread(&payload_size_plus_7, sizeof(uint32_t), 1, fp) != 1) break;
+                if (read_packet_data(&payload_size_plus_7, sizeof(uint32_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                // Read sample count
                uint16_t sample_count;
-                if (fread(&sample_count, sizeof(uint16_t), 1, fp) != 1) break;
+                if (read_packet_data(&sample_count, sizeof(uint16_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                // Read quantiser index
                uint8_t quantiser;
-                if (fread(&quantiser, sizeof(uint8_t), 1, fp) != 1) break;
+                if (read_packet_data(&quantiser, sizeof(uint8_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                // Read compressed size
                uint32_t compressed_size;
-                if (fread(&compressed_size, sizeof(uint32_t), 1, fp) != 1) break;
+                if (read_packet_data(&compressed_size, sizeof(uint32_t), 1, fp, packet_payload, payload_size, &payload_offset) != 1) break;

                stats.total_audio_bytes += compressed_size;
                stats.audio_tad_bytes += compressed_size;
@@ -810,7 +962,8 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
                }

                // Skip compressed data
-                fseek(fp, compressed_size, SEEK_CUR);
+                if (!packet_payload) fseek(fp, compressed_size, SEEK_CUR);
+                else payload_offset += compressed_size;
                break;
            }

@@ -948,6 +1101,11 @@ static const char* TEMPORAL_WAVELET[] = {"Haar", "CDF 5/3"};
            printf("\n");
        }

+        // Free DT packet payload if allocated
+        if (packet_payload) {
+            free(packet_payload);
+        }
+
        packet_num++;
    }