1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
# Container / file format patterns.
#
# ARCHITECTURE NOTE (v0.2):
# Container detection has two paths:
#
# PATH A — Extension (primary, highest priority):
#   The tokenizer strips the file extension into `TokenStream.extension`.
#   The pipeline emits a Container span directly from that field.
#   This replaces the EXT_REGEX approach in the legacy container.rs.
#
# PATH B — Standalone token (fallback, lower priority):
#   When a container token appears mid-filename (e.g., "MP4-GROUP", "[mkv]"),
#   the TOML token rules below catch it.
#   This replaces EXT_STANDALONE in the legacy container.rs.
#
# Once the pipeline emits PATH A spans natively, container.rs can be removed.
# NOTE(review): presumably the property name attached to every match produced
# by the rules in this file — confirm against the rule loader.
= "container"
# ── Video containers ──────────────────────────────────────────────────────────
# One entry per recognized container token; all values are written lowercase.
# NOTE(review): matching is presumably case-insensitive, since the PATH B
# example in the header uses "MP4-GROUP" — confirm in the matcher.
[]
= "mkv"
= "mp4"
= "m4v"
= "avi"
= "wmv"
= "flv"
= "mov"
= "webm"
= "ogm"
= "ogv"
# NOTE(review): "ts" is also a common release-name tag for TELESYNC sources;
# confirm that a mid-filename "TS" is disambiguated before this rule applies.
= "ts"
= "m2ts"
= "mts"
= "mpg"
= "mpeg"
= "vob"
= "divx"
= "3gp"
= "3g2"
= "asf"
= "rm"
= "rmvb"
= "mk3d"
# ── Subtitle containers ───────────────────────────────────────────────────────
# Subtitle file formats, listed alongside the video containers.
= "srt"
= "ass"
= "ssa"
# NOTE(review): "sub" can also appear in filenames as a "subbed" marker —
# confirm that the standalone-token path does not misclassify it.
= "sub"
= "sup"
= "idx"
= "vtt"
= "smi"
# ── Other recognized formats ──────────────────────────────────────────────────
# Non-media companion files: "nfo" (release info text) and "nzb" (Usenet index).
= "nfo"
= "nzb"