RecursiveMAS committed on
Commit
90fe4c3
·
verified ·
1 Parent(s): 24951b6

upload model

Browse files
Expert-Learner-Outerlink(code).pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6479fea5f1d3ccaf7d7c28bf9eeb60dc0d903f545fe7e435c375e003227710b6
3
+ size 89180373
Expert-Learner-Outerlink(math).pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4993c4a66fc03544ba2c2bfaf67cf969a8226cfdca6aa4245e5bddcdeae5199a
3
+ size 89180373
Learner-Expert-Outerlink(code).pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3809550498f94dffe307f51c6b574ff8ecb1c8b72cd08b5d958be7fd6e5a3bd
3
+ size 130086805
Learner-Expert-Outerlink(math).pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:562729bfed5fbadfca41da252bb086607e2722b2cd0189b2e794c4741382bbbe
3
+ size 130086805
README.md ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
4
+
5
+ Outerlink of the Distillation-Style MAS from the paper "Recursive Multi-Agent Systems".
outer_adapter_config(code).json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "outer_el_in_dim": 4096,
3
+ "outer_el_out_dim": 2560,
4
+ "outer_el_type": "outer_ln_res_adapter",
5
+ "outer_le_in_dim": 2560,
6
+ "outer_le_out_dim": 4096,
7
+ "outer_le_type": "outer_ln_res_adapter"
8
+ }
outer_adapter_config(math).json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "outer_el_in_dim": 4096,
3
+ "outer_el_out_dim": 2560,
4
+ "outer_el_type": "outer_ln_res_adapter",
5
+ "outer_le_in_dim": 2560,
6
+ "outer_le_out_dim": 4096,
7
+ "outer_le_type": "outer_ln_res_adapter"
8
+ }
outerlink_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "paradigm": "distillation",
4
+ "tasks": {
5
+ "math": {
6
+ "task": "math",
7
+ "legacy_config_filename": "outer_adapter_config(math).json",
8
+ "adapters": [
9
+ {
10
+ "legacy_key": "outer_el",
11
+ "legacy_filename": "outer_el.pt",
12
+ "filename": "Expert-Learner-Outerlink(math).pt",
13
+ "source_role": "Expert",
14
+ "target_role": "Learner",
15
+ "adapter_type": "outer_ln_res_adapter",
16
+ "in_dim": 4096,
17
+ "out_dim": 2560
18
+ },
19
+ {
20
+ "legacy_key": "outer_le",
21
+ "legacy_filename": "outer_le.pt",
22
+ "filename": "Learner-Expert-Outerlink(math).pt",
23
+ "source_role": "Learner",
24
+ "target_role": "Expert",
25
+ "adapter_type": "outer_ln_res_adapter",
26
+ "in_dim": 2560,
27
+ "out_dim": 4096
28
+ }
29
+ ]
30
+ },
31
+ "code": {
32
+ "task": "code",
33
+ "legacy_config_filename": "outer_adapter_config(code).json",
34
+ "adapters": [
35
+ {
36
+ "legacy_key": "outer_el",
37
+ "legacy_filename": "outer_el.pt",
38
+ "filename": "Expert-Learner-Outerlink(code).pt",
39
+ "source_role": "Expert",
40
+ "target_role": "Learner",
41
+ "adapter_type": "outer_ln_res_adapter",
42
+ "in_dim": 4096,
43
+ "out_dim": 2560
44
+ },
45
+ {
46
+ "legacy_key": "outer_le",
47
+ "legacy_filename": "outer_le.pt",
48
+ "filename": "Learner-Expert-Outerlink(code).pt",
49
+ "source_role": "Learner",
50
+ "target_role": "Expert",
51
+ "adapter_type": "outer_ln_res_adapter",
52
+ "in_dim": 2560,
53
+ "out_dim": 4096
54
+ }
55
+ ]
56
+ }
57
+ }
58
+ }