RecursiveMAS committed on
Commit
3f09a92
·
verified ·
1 Parent(s): 377e70a

upload model

Browse files
README.md ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ ---
4
+
5
+ Outerlink adapter weights for the deliberation-style multi-agent system (MAS) from the paper "Recursive Multi-Agent Systems".
Reflector-Toolcaller-Outerlink.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1951461655ffcaccdde4ed9c70be19d6054065ed92ced21ca525c05efc170fd0
3
+ size 65581269
Toolcaller-Reflector-Outerlink.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e3a20dc5201f1d9552daa57aecb381b8830208837d4604bb806373f051f4ff2
3
+ size 65581269
outer_adapter_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "mas_shape": "deliberation",
3
+ "mas_task": "math",
4
+ "non_last_loss_weight": 0.1,
5
+ "num_recursive_rounds": 3,
6
+ "outer_rt_in_dim": 2560,
7
+ "outer_rt_out_dim": 2560,
8
+ "outer_rt_type": "outer_ln_res_adapter",
9
+ "outer_tr_in_dim": 2560,
10
+ "outer_tr_out_dim": 2560,
11
+ "outer_tr_type": "outer_ln_res_adapter",
12
+ "preserve_inner_input_grad": 1,
13
+ "reflector_inner_aligner_path": "checkpoints/innerloop_deliberation/deliberation_arpo_v1_reflector_qwen35_4b_ln_res/checkpoint-10000",
14
+ "reflector_model_name_or_path": "Qwen/Qwen3.5-4B",
15
+ "supervise_final_only": 0,
16
+ "toolcaller_inner_aligner_path": "checkpoints/innerloop_deliberation/deliberation_arpo_v1_toolcaller_qwen35_4b_ln_res/checkpoint-10000",
17
+ "toolcaller_model_name_or_path": "Qwen/Qwen3.5-4B"
18
+ }
outerlink_config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format_version": 1,
3
+ "paradigm": "deliberation",
4
+ "legacy_config_filename": "outer_adapter_config.json",
5
+ "meta": {
6
+ "mas_shape": "deliberation",
7
+ "mas_task": "math",
8
+ "num_recursive_rounds": 3,
9
+ "non_last_loss_weight": 0.1,
10
+ "preserve_inner_input_grad": 1,
11
+ "supervise_final_only": 0
12
+ },
13
+ "adapters": [
14
+ {
15
+ "legacy_key": "outer_rt",
16
+ "legacy_filename": "outer_rt.pt",
17
+ "filename": "Reflector-Toolcaller-Outerlink.pt",
18
+ "source_role": "Reflector",
19
+ "target_role": "Toolcaller",
20
+ "adapter_type": "outer_ln_res_adapter",
21
+ "in_dim": 2560,
22
+ "out_dim": 2560
23
+ },
24
+ {
25
+ "legacy_key": "outer_tr",
26
+ "legacy_filename": "outer_tr.pt",
27
+ "filename": "Toolcaller-Reflector-Outerlink.pt",
28
+ "source_role": "Toolcaller",
29
+ "target_role": "Reflector",
30
+ "adapter_type": "outer_ln_res_adapter",
31
+ "in_dim": 2560,
32
+ "out_dim": 2560
33
+ }
34
+ ]
35
+ }