1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
# Video codec patterns.
#
# Exact entries: case-insensitive token lookup (HashMap, no regex).
# Pattern entries: regex crate patterns matched against individual tokens.
#
# All matching happens against isolated tokens (post-tokenizer), so word
# boundary assertions are NOT needed.
= "video_codec"
[]
# Simple token → value mappings (case-insensitive).
# Several spellings collapse onto one canonical label, so the same value
# appears on more than one line. Canonical labels produced by this table:
# H.264, H.265, Xvid, DivX, VP7, VP8, VP9 and AV1.
= "H.264"
= "H.264"
= "H.265"
= "H.265"
= "H.265"
= "Xvid"
= "DivX"
= "DivX"
= "VP7"
= "VP8"
= "VP8"
= "VP9"
= "AV1"
# Two further spellings that also resolve to H.264.
= "H.264"
= "H.264"
[[]]
# HEVC with suffix: hevc10, HEVC_YUV420P10, etc.
# Use word chars only (no dots/dashes) to avoid matching compound tokens
# like "HEVC.Atmos-GROUP" or "HEVC-MZABI" in multi-token windows.
# The `+` demands at least one character after "hevc", so a bare "hevc"
# token never matches this entry.
= '(?i)^hevc[a-zA-Z0-9_]+$'
= "H.265"
[[]]
# H.264 with optional dot/dash separator: h.264, x-264, etc.
# Either an `x` or an `h` prefix is accepted. Because the separator is
# optional, the unseparated forms x264 and h264 match as well.
= '(?i)^[xh][.-]?264$'
= "H.264"
[[]]
# H.265 with optional dot/dash separator.
# Either an `x` or an `h` prefix is accepted; the separator may be absent,
# so x265, h265, h.265 and x-265 all match.
= '(?i)^[xh][.-]?265$'
= "H.265"
[[]]
# H.263
# An `x` or `h` prefix, then an optional dot or dash, then 263
# (h263, h.263, x-263). Anchored at both ends, so the whole token must match.
= '(?i)^[xh][.-]?263$'
= "H.263"
[[]]
# MPEG-2 / Mpeg2 / H.262
# The `e` is optional, so both the "mpeg" and "mpg" spellings match, with an
# optional dot or dash before the 2 (mpeg2, mpg2, mpeg-2, mpg.2).
= '(?i)^mpe?g[.-]?2$'
= "MPEG-2"
[[]]
# H.262 / x262 with optional dot/dash separator, reported as MPEG-2
# (H.262 is the ITU-T designation of the MPEG-2 video standard).
= '(?i)^[xh][.-]?262$'
= "MPEG-2"
[[]]
# VC-1
# Matches the token with or without a dot/dash before the 1: vc1, vc-1, vc.1.
= '(?i)^vc[.-]?1$'
= "VC-1"
[[]]
# MPEG-4 AVC variants.
# Optional dash between "mpeg" and "4", optional trailing "hd":
# mpeg4avc, mpeg-4avc, mpeg4avchd, mpeg-4avchd.
# No separator is permitted between the 4 and "avc".
= '(?i)^mpeg-?4avc(?:hd)?$'
= "H.264"
[[]]
# RealVideo (Rv10, Rv20, etc.)
# Requires exactly two digits after "rv". Every match reports the plain
# label "RealVideo"; the digits are not carried into the value.
= '(?i)^rv\d{2}$'
= "RealVideo"
[[]]
# H.264 glued to source suffix: WEB-DLx264, HDx264, Ripx264
# Only the end of the token is anchored: there is no leading `^`, so any
# text may precede DL/Rip/HD.
# NOTE(review): presumably deliberate, so that prefixes such as "WEB-" are
# tolerated — confirm before adding a start anchor.
= '(?i)(?:DL|Rip|HD)x264$'
= "H.264"
[[]]
# DVDDivX compound.
# Anchored at both ends, so only the whole token "dvddivx" (any letter case)
# matches; it is reported as DivX.
= '(?i)^dvddivx$'
= "DivX"