fazeelzafar committed on
Commit 72b2651
1 Parent(s): 51a342c

Upload LlamaForCausalLM

Files changed (2)
  1. config.json +7 -3
  2. model.safetensors +2 -2
config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "unsloth/tinyllama-bnb-4bit",
+  "_name_or_path": "mrm8488/tinyllama-bnb-4bit-ft-codeAlpaca",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -11,7 +11,7 @@
   "hidden_size": 2048,
   "initializer_range": 0.02,
   "intermediate_size": 5632,
-  "max_position_embeddings": 2048,
+  "max_position_embeddings": 4096,
   "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 22,
@@ -33,11 +33,15 @@
     "quant_method": "bitsandbytes"
   },
   "rms_norm_eps": 1e-05,
-  "rope_scaling": null,
+  "rope_scaling": {
+    "factor": 2.0,
+    "type": "linear"
+  },
   "rope_theta": 10000.0,
   "tie_word_embeddings": false,
   "torch_dtype": "float16",
   "transformers_version": "4.38.2",
+  "unsloth_version": "2024.1",
   "use_cache": true,
   "vocab_size": 32000
 }
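
The substantive change in this config is the context window: max_position_embeddings doubles from 2048 to 4096, and rope_scaling goes from null to linear scaling with factor 2.0, which compresses position indices back into the range the base model saw during pretraining. A minimal sketch of that effect, assuming the standard Llama RoPE formulation (head_dim = hidden_size / num_attention_heads = 2048 / 32 = 64; the function name here is illustrative, not from this repo or transformers):

import torch

def rotary_angles(seq_len, head_dim=64, rope_theta=10000.0, factor=2.0):
    # Standard RoPE inverse frequencies: rope_theta^(-2i/d) for even i.
    inv_freq = 1.0 / (rope_theta ** (torch.arange(0, head_dim, 2).float() / head_dim))
    # Linear scaling: each position index t is replaced by t / factor
    # before the rotary angles are computed.
    positions = torch.arange(seq_len).float() / factor
    return torch.outer(positions, inv_freq)  # shape: (seq_len, head_dim // 2)

angles = rotary_angles(4096)
# With factor=2.0, position 4096 produces the angles position 2048 would
# have produced unscaled -- matching the 2048 -> 4096 change in this commit.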
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5af7f5da90b8b199890b7e3fa19810145c1b2f1db7655843ea83154ff580b541
-size 762453341
+oid sha256:9f5f5032c250a1d66e8ab6ead9267b9600a237ebb7d1229d3597d3737bcf754c
+size 762453346
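
Since both the bitsandbytes quantization_config and the linear rope_scaling live in config.json, transformers 4.38+ should pick them up automatically when the checkpoint is loaded. A hedged sketch; "<repo-id>" is a placeholder for this repository's Hub id, which the diff does not name:

from transformers import AutoModelForCausalLM, AutoTokenizer

# "<repo-id>" is hypothetical -- substitute the actual Hub id of this model.
# Loading the prequantized 4-bit weights requires bitsandbytes installed.
model = AutoModelForCausalLM.from_pretrained("<repo-id>", device_map="auto")
tokenizer = AutoTokenizer.from_pretrained("<repo-id>")

# Both values below come straight from the config.json changed above.
print(model.config.rope_scaling)             # {'factor': 2.0, 'type': 'linear'}
print(model.config.max_position_embeddings)  # 4096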