{
"kind": "neural",
"alpha": 0.03,
"experts": [
{
"name": "rwkv",
"kind": "rwkv",
"method": "cfg:hidden=64,layers=1,intermediate=64,decay_rank=16,a_rank=16,v_rank=16,g_rank=16,seed=22,train=adam,lr=0.0009,stride=1;policy:schedule=0..1%:train(scope=all,opt=adam,lr=0.001,stride=1,bptt=1,clip=0,momentum=0.9)|1%..5%:train(scope=head,opt=adam,lr=0.001,stride=1,bptt=1,clip=0,momentum=0.9)|5%..7%:train(scope=all,opt=adam,lr=0.001,stride=1,bptt=1,clip=0,momentum=0.9)",
"log_prior": 0.0
},
{
"name": "classical",
"kind": "mixture",
"log_prior": 0.0,
"spec": {
"kind": "neural",
"alpha": 0.03,
"experts": [
{
"name": "rosa",
"kind": "rosaplus",
"max_order": -1,
"log_prior": 0.0
},
{
"name": "ctw",
"kind": "ctw",
"depth": 24,
"log_prior": 0.0
},
{
"name": "ppmd",
"kind": "ppmd",
"order": 10,
"memory_mb": 64,
"log_prior": 0.0
},
{
"name": "match",
"kind": "match",
"log_prior": 0.0
},
{
"name": "sparse",
"kind": "sparse-match",
"log_prior": 0.0
},
{
"name": "cal-ctw",
"kind": "calibrated",
"context": "text",
"bins": 33,
"learning_rate": 0.02,
"bias_clip": 4.0,
"log_prior": 0.0,
"base": {
"kind": "ctw",
"depth": 24
}
},
{
"name": "cal-ppmd",
"kind": "calibrated",
"context": "text-repeat",
"bins": 33,
"learning_rate": 0.02,
"bias_clip": 4.0,
"log_prior": 0.0,
"base": {
"kind": "ppmd",
"order": 10,
"memory_mb": 64
}
}
]
}
}
]
}