SAELens
Juliushanhanhan committed on
Commit
868cb67
1 Parent(s): 53425c3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +7 -17
README.md CHANGED
@@ -31,22 +31,12 @@ sae, cfg_dict, sparsity = SAE.from_pretrained("Juliushanhanhan/llama-3-8b-it-res
31
  ## Citation
32
 
33
  ```
34
- @misc{saelens2024llama38b,
35
- author = {SAELens, Jiatong Han},
36
- title = {Llama-3-8B SAEs (layer 25, Post-MLP Residual Stream)},
37
- year = {2024},
38
- publisher = {HuggingFace},
39
- url = {https://huggingface.co/Juliushanhanhan/llama-3-8b-it-res},
40
- note = {Model trained on the post-MLP residual stream of the 25th layer of Llama-3-8B. Feature visualizations are available at \url{https://www.neuronpedia.org/llama3-8b-it}. The wandb run is recorded at \url{https://wandb.ai/jiatongg/sae_semantic_entropy/runs/ruuu0izg?nw=nwuserjiatongg}.},
41
  }
42
-
43
- @misc{juliushanhanhan2024openwebtext,
44
- author = {Juliushanhanhan},
45
- title = {OpenWebText-1B Llama3 Tokenized CXT 1024},
46
- year = {2024},
47
- publisher = {HuggingFace},
48
- url = {https://huggingface.co/datasets/Juliushanhanhan/openwebtext-1b-llama3-tokenized-cxt-1024},
49
- note = {Dataset used for training the Llama-3-8B SAEs.},
50
- }
51
-
52
  ```
 
31
  ## Citation
32
 
33
  ```
34
+ @misc {jiatong_han_2024,
35
+ author = { {Jiatong Han} },
36
+ title = { llama-3-8b-it-res (Revision 53425c3) },
37
+ year = 2024,
38
+ url = { https://huggingface.co/Juliushanhanhan/llama-3-8b-it-res },
39
+ doi = { 10.57967/hf/2889 },
40
+ publisher = { Hugging Face }
41
  }
 
 
 
 
 
 
 
 
 
 
42
  ```