{
  "format_version": 1,
  "paradigm": "distillation",
  "tasks": {
    "math": {
      "task": "math",
      "legacy_config_filename": "outer_adapter_config(math).json",
      "adapters": [
        {
          "legacy_key": "outer_el",
          "legacy_filename": "outer_el.pt",
          "filename": "Expert-Learner-Outerlink(math).pt",
          "source_role": "Expert",
          "target_role": "Learner",
          "adapter_type": "outer_ln_res_adapter",
          "in_dim": 4096,
          "out_dim": 2560
        },
        {
          "legacy_key": "outer_le",
          "legacy_filename": "outer_le.pt",
          "filename": "Learner-Expert-Outerlink(math).pt",
          "source_role": "Learner",
          "target_role": "Expert",
          "adapter_type": "outer_ln_res_adapter",
          "in_dim": 2560,
          "out_dim": 4096
        }
      ]
    },
    "code": {
      "task": "code",
      "legacy_config_filename": "outer_adapter_config(code).json",
      "adapters": [
        {
          "legacy_key": "outer_el",
          "legacy_filename": "outer_el.pt",
          "filename": "Expert-Learner-Outerlink(code).pt",
          "source_role": "Expert",
          "target_role": "Learner",
          "adapter_type": "outer_ln_res_adapter",
          "in_dim": 4096,
          "out_dim": 2560
        },
        {
          "legacy_key": "outer_le",
          "legacy_filename": "outer_le.pt",
          "filename": "Learner-Expert-Outerlink(code).pt",
          "source_role": "Learner",
          "target_role": "Expert",
          "adapter_type": "outer_ln_res_adapter",
          "in_dim": 2560,
          "out_dim": 4096
        }
      ]
    }
  }
}
|