Hzfinfdu committed on
Commit
b743eca
·
verified ·
1 Parent(s): 9ab845c

Upload folder using huggingface_hub

Browse files
Llama3_1Base-LXR-8x/checkpoints/final.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ac3d9482d565a6c219f2d293b1a9dd91cbacf7f05080426450dbe7adad11be6
3
  size 536945024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f291f55c9ce1547b312502c8ecd02993b7ccb2dc92fd0f135fac2f99ed3cb1ba
3
  size 536945024
Llama3_1Base-LXR-8x/hyperparams.json CHANGED
@@ -2,8 +2,8 @@
2
  "device": "cuda:0",
3
  "seed": 42,
4
  "dtype": "torch.bfloat16",
5
- "hook_point_in": "blocks.6.hook_resid_post",
6
- "hook_point_out": "blocks.6.hook_resid_post",
7
  "use_decoder_bias": true,
8
  "apply_decoder_bias_to_pre_encoder": false,
9
  "expansion_factor": 8,
@@ -11,11 +11,11 @@
11
  "d_sae": 32768,
12
  "bias_init_method": "all_zero",
13
  "act_fn": "jumprelu",
14
- "jump_relu_threshold": 0.1552734375,
15
  "norm_activation": "dataset-wise",
16
  "dataset_average_activation_norm": {
17
- "in": 5.34375,
18
- "out": 5.34375
19
  },
20
  "decoder_exactly_fixed_norm": false,
21
  "sparsity_include_decoder_norm": true,
 
2
  "device": "cuda:0",
3
  "seed": 42,
4
  "dtype": "torch.bfloat16",
5
+ "hook_point_in": "blocks.7.hook_resid_post",
6
+ "hook_point_out": "blocks.7.hook_resid_post",
7
  "use_decoder_bias": true,
8
  "apply_decoder_bias_to_pre_encoder": false,
9
  "expansion_factor": 8,
 
11
  "d_sae": 32768,
12
  "bias_init_method": "all_zero",
13
  "act_fn": "jumprelu",
14
+ "jump_relu_threshold": 0.1826171875,
15
  "norm_activation": "dataset-wise",
16
  "dataset_average_activation_norm": {
17
+ "in": 5.90625,
18
+ "out": 5.90625
19
  },
20
  "decoder_exactly_fixed_norm": false,
21
  "sparsity_include_decoder_norm": true,