delvan committed on
Commit
042b7f4
1 Parent(s): d67905a

Changing to a less trained GPT-small

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "microsoft/DialoGPT-medium",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -12,10 +12,10 @@
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
- "n_embd": 1024,
16
- "n_head": 16,
17
  "n_inner": null,
18
- "n_layer": 24,
19
  "n_positions": 1024,
20
  "resid_pdrop": 0.1,
21
  "scale_attn_weights": true,
 
1
  {
2
+ "_name_or_path": "microsoft/DialoGPT-small",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
  "n_inner": null,
18
+ "n_layer": 12,
19
  "n_positions": 1024,
20
  "resid_pdrop": 0.1,
21
  "scale_attn_weights": true,
eval_results.txt CHANGED
@@ -1 +1 @@
1
- perplexity = tensor(4.2456)
 
1
+ perplexity = tensor(7.6071)
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a6b6de3faf2650b64408d34ab235d237b05155f6fbbb0e12031ddd2ee21faf4
3
- size 1444530764
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adc0a105f61321dba53dd3301745b6ddadb39ad32e39511859e137852c9eff79
3
+ size 510378337
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "microsoft/DialoGPT-medium", "errors": "replace", "tokenizer_class": "GPT2Tokenizer"}
 
1
+ {"unk_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "bos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "microsoft/DialoGPT-small", "errors": "replace", "tokenizer_class": "GPT2Tokenizer"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ae5414c5ca6649ce87c5f94c3714ce3217628bbfe91d62fc790a3d81965de43
3
- size 1077
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bb4c7a39872e0b554db507498a5d91a912208989ed0e1921b8312384f54c87b
3
+ size 1083