# pinyin weight-derivation rules.
# Mirrors wubi/tools/weights/rules.toml — same normalization parameters,
# applied globally (pinyin v0.2 has no layers; layered ranking lands at v0.3).
# NOTE(review): the table header below is empty and none of the assignments
# in this table has a key on the left of `=`, so the file does not parse as
# TOML as shown. The identifiers look stripped; restore them from the code
# that consumes this file (or from the wubi rules file this one mirrors)
# rather than guessing — TODO confirm the intended names.
[]
# Cap on per-entry freq_score. 65535 is the largest value a u16 can hold, so
# a capped score occupies at most 16 bits of a u64; at v0.3 it is combined
# with the layer base into the FST value.
= 65535
# Log base for count compression (2.71828 approximates e). Currently unused:
# the code takes the natural log via .ln(), which this value matches.
# Recorded for forward-compat audits.
= 2.71828
# Floor below which a raw weighted count is treated as zero. Filters
# Aho-Corasick noise from short, common substrings that appear only once or
# twice in a huge corpus.
= 1
# Reserved. The only aggregation currently supported is a sum across corpora,
# with each corpus weighted by manifest.weight.
= "sum"