Distillation-Outerlinks / outerlink_config.json
RecursiveMAS's picture
upload model
90fe4c3 verified
{
"format_version": 1,
"paradigm": "distillation",
"tasks": {
"math": {
"task": "math",
"legacy_config_filename": "outer_adapter_config(math).json",
"adapters": [
{
"legacy_key": "outer_el",
"legacy_filename": "outer_el.pt",
"filename": "Expert-Learner-Outerlink(math).pt",
"source_role": "Expert",
"target_role": "Learner",
"adapter_type": "outer_ln_res_adapter",
"in_dim": 4096,
"out_dim": 2560
},
{
"legacy_key": "outer_le",
"legacy_filename": "outer_le.pt",
"filename": "Learner-Expert-Outerlink(math).pt",
"source_role": "Learner",
"target_role": "Expert",
"adapter_type": "outer_ln_res_adapter",
"in_dim": 2560,
"out_dim": 4096
}
]
},
"code": {
"task": "code",
"legacy_config_filename": "outer_adapter_config(code).json",
"adapters": [
{
"legacy_key": "outer_el",
"legacy_filename": "outer_el.pt",
"filename": "Expert-Learner-Outerlink(code).pt",
"source_role": "Expert",
"target_role": "Learner",
"adapter_type": "outer_ln_res_adapter",
"in_dim": 4096,
"out_dim": 2560
},
{
"legacy_key": "outer_le",
"legacy_filename": "outer_le.pt",
"filename": "Learner-Expert-Outerlink(code).pt",
"source_role": "Learner",
"target_role": "Expert",
"adapter_type": "outer_ln_res_adapter",
"in_dim": 2560,
"out_dim": 4096
}
]
}
}
}