Text Generation
Transformers
Safetensors
English
Japanese
llama
conversational
text-generation-inference
Inference Endpoints
maym15 committed on
Commit
18f2bea
·
verified ·
1 Parent(s): 4b64f49

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +2 -2
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/gs/bs/tga-okazaki/ma/ckpts/llama-3.1-swallow-v0.3-exp-4-5_LR_2.5e-5_MINLR_2.5e-6_WD_0.1_42",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -35,6 +35,6 @@
35
  "tie_word_embeddings": false,
36
  "torch_dtype": "bfloat16",
37
  "transformers_version": "4.46.2",
38
- "use_cache": false,
39
  "vocab_size": 128256
40
  }
 
1
  {
2
+ "_name_or_path": "tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.3",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
35
  "tie_word_embeddings": false,
36
  "torch_dtype": "bfloat16",
37
  "transformers_version": "4.46.2",
38
+ "use_cache": true,
39
  "vocab_size": 128256
40
  }