Upload GPTNeoXForCausalLM
Browse files
- README.md +17 -25
- config.json +3 -2
- generation_config.json +1 -1
- model.safetensors +3 -0
README.md
CHANGED
@@ -1,39 +1,31 @@
|
|
1 |
---
|
2 |
language: en
|
|
|
3 |
tags:
|
4 |
- b1ade
|
5 |
-
|
|
|
|
|
6 |
widget:
|
7 |
-
- text:
|
8 |
-
context: <math>
|
9 |
-
question: <Evaluate -24 + -24 + 15*2.>
|
10 |
-
answer: <
|
11 |
example_title: Math
|
12 |
-
- text:
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
detached, grunting style, in the end he comes through convincingly as a
|
25 |
-
passionate, dedicated man. The plot is a little weak in demostrating his
|
26 |
-
conversion from trapper to animal coservationist. Good film, highly
|
27 |
-
recommended.>
|
28 |
-
answer: <
|
29 |
example_title: Sentiment
|
30 |
- inference:
|
31 |
- parameters:
|
32 |
- max_new_tokens: 512
|
33 |
- top_p=0.99
|
34 |
-
datasets:
|
35 |
-
- Open-Orca/OpenOrca
|
36 |
-
- WizardLM/WizardLM_evol_instruct_V2_196k
|
37 |
---
|
38 |
|
39 |
|
|
|
1 |
---
|
2 |
language: en
|
3 |
+
license: mit
|
4 |
tags:
|
5 |
- b1ade
|
6 |
+
datasets:
|
7 |
+
- Open-Orca/OpenOrca
|
8 |
+
- WizardLM/WizardLM_evol_instruct_V2_196k
|
9 |
widget:
|
10 |
+
- text: "context: <math>\n question: <Evaluate -24 + -24 + 15*2.>\n answer: <"
|
|
|
|
|
|
|
11 |
example_title: Math
|
12 |
+
- text: "context: <You are a helpful assistant, who always provide explanation. Think\
|
13 |
+
\ like you are answering to a five year old.>\n question: <Determine the sentiment:\n\
|
14 |
+
\nWe viewed the vcr and found it to be fascinating. Not knowing anything about\
|
15 |
+
\ this true story, I thought: Oh, no, P.Brosnan as an American Indian, what a\
|
16 |
+
\ bad choice until I discovered the truth about Grey Owl. The film does a good\
|
17 |
+
\ job of demonstrating the dignity of these native peoples and undermining the\
|
18 |
+
\ racist myths about them. And Annie Galipeau, WOW, what a beauty, and very convincing\
|
19 |
+
\ as an Indian woman (I believe she is French-Canadian; she sure reverts to the\
|
20 |
+
\ all-too familiar speech of such). In spite, of Brosnan's detached, grunting\
|
21 |
+
\ style, in the end he comes through convincingly as a passionate, dedicated man.\
|
22 |
+
\ The plot is a little weak in demostrating his conversion from trapper to animal\
|
23 |
+
\ coservationist. Good film, highly recommended.>\n answer: <"
|
|
|
|
|
|
|
|
|
|
|
24 |
example_title: Sentiment
|
25 |
- inference:
|
26 |
- parameters:
|
27 |
- max_new_tokens: 512
|
28 |
- top_p=0.99
|
|
|
|
|
|
|
29 |
---
|
30 |
|
31 |
|
config.json
CHANGED
@@ -1,8 +1,9 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"GPTNeoXForCausalLM"
|
5 |
],
|
|
|
6 |
"attention_dropout": 0.0,
|
7 |
"bos_token_id": 0,
|
8 |
"classifier_dropout": 0.1,
|
@@ -22,7 +23,7 @@
|
|
22 |
"rotary_pct": 0.25,
|
23 |
"tie_word_embeddings": false,
|
24 |
"torch_dtype": "bfloat16",
|
25 |
-
"transformers_version": "4.
|
26 |
"use_cache": true,
|
27 |
"use_parallel_residual": true,
|
28 |
"vocab_size": 50304
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "tmp_trainer_scratch/checkpoint-376000/",
|
3 |
"architectures": [
|
4 |
"GPTNeoXForCausalLM"
|
5 |
],
|
6 |
+
"attention_bias": true,
|
7 |
"attention_dropout": 0.0,
|
8 |
"bos_token_id": 0,
|
9 |
"classifier_dropout": 0.1,
|
|
|
23 |
"rotary_pct": 0.25,
|
24 |
"tie_word_embeddings": false,
|
25 |
"torch_dtype": "bfloat16",
|
26 |
+
"transformers_version": "4.37.2",
|
27 |
"use_cache": true,
|
28 |
"use_parallel_residual": true,
|
29 |
"vocab_size": 50304
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 0,
|
4 |
"eos_token_id": 0,
|
5 |
-
"transformers_version": "4.
|
6 |
}
|
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 0,
|
4 |
"eos_token_id": 0,
|
5 |
+
"transformers_version": "4.37.2"
|
6 |
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3918114d8b0889fd527ead5ed62df6deb07edacc6d4ea428230178529580fd
|
3 |
+
size 2023586384
|