floriangardin committed on
Commit
2c18c2b
1 Parent(s): b93e3a0

musiclang/musiclang-bpe

Browse files
Files changed (5) hide show
  1. README.md +15 -16
  2. config.json +4 -4
  3. generation_config.json +2 -2
  4. model.safetensors +2 -2
  5. training_args.bin +1 -1
README.md CHANGED
@@ -11,9 +11,9 @@ should probably proofread and complete it, then remove this comment. -->
11
 
12
  # model
13
 
14
- This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 0.9350
17
 
18
  ## Model description
19
 
@@ -46,20 +46,19 @@ The following hyperparameters were used during training:
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:-----:|:---------------:|
49
- | 2.799 | 0.07 | 2000 | 2.6594 |
50
- | 1.5819 | 0.13 | 4000 | 1.4878 |
51
- | 1.3252 | 0.2 | 6000 | 1.2718 |
52
- | 1.2293 | 0.27 | 8000 | 1.1748 |
53
- | 1.141 | 0.34 | 10000 | 1.1004 |
54
- | 1.093 | 0.4 | 12000 | 1.0582 |
55
- | 1.0601 | 0.47 | 14000 | 1.0282 |
56
- | 1.0285 | 0.54 | 16000 | 0.9957 |
57
- | 1.002 | 0.61 | 18000 | 0.9794 |
58
- | 0.9876 | 0.67 | 20000 | 0.9605 |
59
- | 0.9903 | 0.74 | 22000 | 0.9489 |
60
- | 0.9698 | 0.81 | 24000 | 0.9418 |
61
- | 0.962 | 0.88 | 26000 | 0.9370 |
62
- | 0.9598 | 0.94 | 28000 | 0.9350 |
63
 
64
 
65
  ### Framework versions
 
11
 
12
  # model
13
 
14
+ This model is a fine-tuned version of [](https://huggingface.co/) on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 1.0360
17
 
18
  ## Model description
19
 
 
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:-----:|:---------------:|
49
+ | 3.1667 | 0.07 | 2000 | 3.1054 |
50
+ | 1.8298 | 0.14 | 4000 | 1.7209 |
51
+ | 1.4726 | 0.22 | 6000 | 1.4237 |
52
+ | 1.3446 | 0.29 | 8000 | 1.2875 |
53
+ | 1.2647 | 0.36 | 10000 | 1.2120 |
54
+ | 1.2023 | 0.43 | 12000 | 1.1621 |
55
+ | 1.185 | 0.51 | 14000 | 1.1240 |
56
+ | 1.1308 | 0.58 | 16000 | 1.0957 |
57
+ | 1.1057 | 0.65 | 18000 | 1.0736 |
58
+ | 1.0894 | 0.72 | 20000 | 1.0555 |
59
+ | 1.087 | 0.8 | 22000 | 1.0439 |
60
+ | 1.0829 | 0.87 | 24000 | 1.0372 |
61
+ | 1.0566 | 0.94 | 26000 | 1.0360 |
 
62
 
63
 
64
  ### Framework versions
config.json CHANGED
@@ -4,9 +4,9 @@
4
  "GPT2LMHeadModel"
5
  ],
6
  "attn_pdrop": 0.1,
7
- "bos_token_id": 30000,
8
  "embd_pdrop": 0.1,
9
- "eos_token_id": 30000,
10
  "initializer_range": 0.02,
11
  "layer_norm_epsilon": 1e-05,
12
  "model_type": "gpt2",
@@ -15,7 +15,7 @@
15
  "n_inner": null,
16
  "n_layer": 10,
17
  "n_positions": 4096,
18
- "padding_token_id": 30000,
19
  "reorder_and_upcast_attn": false,
20
  "resid_pdrop": 0.1,
21
  "scale_attn_by_inverse_layer_idx": false,
@@ -28,5 +28,5 @@
28
  "torch_dtype": "float32",
29
  "transformers_version": "4.37.2",
30
  "use_cache": true,
31
- "vocab_size": 30001
32
  }
 
4
  "GPT2LMHeadModel"
5
  ],
6
  "attn_pdrop": 0.1,
7
+ "bos_token_id": 1,
8
  "embd_pdrop": 0.1,
9
+ "eos_token_id": 1,
10
  "initializer_range": 0.02,
11
  "layer_norm_epsilon": 1e-05,
12
  "model_type": "gpt2",
 
15
  "n_inner": null,
16
  "n_layer": 10,
17
  "n_positions": 4096,
18
+ "padding_token_id": 1,
19
  "reorder_and_upcast_attn": false,
20
  "resid_pdrop": 0.1,
21
  "scale_attn_by_inverse_layer_idx": false,
 
28
  "torch_dtype": "float32",
29
  "transformers_version": "4.37.2",
30
  "use_cache": true,
31
+ "vocab_size": 30000
32
  }
generation_config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_from_model_config": true,
3
- "bos_token_id": 30000,
4
- "eos_token_id": 30000,
5
  "transformers_version": "4.37.2"
6
  }
 
1
  {
2
  "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 1,
5
  "transformers_version": "4.37.2"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22726d5d220ff7c2d8b4bda44044f456543da712c6f13abceb7ebfbdf291e29c
3
- size 254962056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e91ec2e5db8defd484c25027a4f99b039f5e416917f7cbfade856f1fcf1154a
3
+ size 254959656
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db2daf1ba377eb851dad0905d389222e965f048ff071e14d1039b7e459c05c67
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84fd46c4d64452c3ae2ae1094579da98c0405b2f53b95a5f1906bbe659ae8c78
3
  size 4664