muirkat committed on
Commit
4d5bdd3
1 Parent(s): 04ad92a
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
README.md ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ tags:
4
+ - generated_from_trainer
5
+ model-index:
6
+ - name: tolkien-mythopoeic-gen
7
+ results:
8
+ - task:
9
+ name: Causal Language Modeling
10
+ type: text-generation
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # tolkien-mythopoeic-gen
17
+
18
+ This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 3.5110
21
+
22
+ ## Model description
23
+
24
+ More information needed
25
+
26
+ ## Intended uses & limitations
27
+
28
+ More information needed
29
+
30
+ ## Training and evaluation data
31
+
32
+ More information needed
33
+
34
+ ## Training procedure
35
+
36
+ ### Training hyperparameters
37
+
38
+ The following hyperparameters were used during training:
39
+ - learning_rate: 2e-05
40
+ - train_batch_size: 16
41
+ - eval_batch_size: 16
42
+ - seed: 42
43
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
+ - lr_scheduler_type: linear
45
+ - num_epochs: 3.0
46
+
47
+ ### Training results
48
+
49
+ | Training Loss | Epoch | Step | Validation Loss |
50
+ |:-------------:|:-----:|:----:|:---------------:|
51
+ | 3.5732 | 1.0 | 145 | 3.5110 |
52
+ | 3.5713 | 2.0 | 290 | 3.5110 |
53
+ | 3.5718 | 3.0 | 435 | 3.5110 |
54
+
55
+
56
+ ### Framework versions
57
+
58
+ - Transformers 4.10.2
59
+ - Pytorch 1.9.0+cu102
60
+ - Tokenizers 0.10.3
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "gpt2",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "gradient_checkpointing": false,
12
+ "initializer_range": 0.02,
13
+ "layer_norm_epsilon": 1e-05,
14
+ "model_type": "gpt2",
15
+ "n_ctx": 1024,
16
+ "n_embd": 768,
17
+ "n_head": 12,
18
+ "n_inner": null,
19
+ "n_layer": 12,
20
+ "n_positions": 1024,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_weights": true,
23
+ "summary_activation": null,
24
+ "summary_first_dropout": 0.1,
25
+ "summary_proj_to_labels": true,
26
+ "summary_type": "cls_index",
27
+ "summary_use_proj": true,
28
+ "task_specific_params": {
29
+ "text-generation": {
30
+ "do_sample": true,
31
+ "max_length": 50
32
+ }
33
+ },
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "use_cache": true,
37
+ "vocab_size": 50257
38
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2169b18f89c16392db042c084938a3aa345a71f65287b59ae513433837b78a86
3
+ size 510403817
runs/Sep17_20-58-12_809f1a19f9e4/1631912379.7387805/events.out.tfevents.1631912379.809f1a19f9e4.75.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a94c320bd98345251aab768df353934219e2ae40711f6878b1993a37f8ac706
3
+ size 4201
runs/Sep17_20-58-12_809f1a19f9e4/1631912910.4550812/events.out.tfevents.1631912910.809f1a19f9e4.75.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71f92b6f510dc35ce2872317d4fae88a63edc938b3e6703e966931dde1a0ea2f
3
+ size 4201
runs/Sep17_20-58-12_809f1a19f9e4/events.out.tfevents.1631912379.809f1a19f9e4.75.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba3bf1a53b62a018beada61d2cb77ab46724ca8e6ce0f5ff37375e50d8bf0210
3
+ size 4798
runs/Sep17_20-58-12_809f1a19f9e4/events.out.tfevents.1631912910.809f1a19f9e4.75.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f14bc528b9c6d0ec088248c7f3625901854aafcb70a701de159029abcf232c4d
3
+ size 4798
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0a0129ffff269672b0c20ccad0119362f29a869a42ba838a9a8ddc16c7ab28a
3
+ size 2671