patrickvonplaten committed on
Commit
f53f6af
1 Parent(s): 577db6b

Training in progress, step 400

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "anton-l/distilhubert",
3
  "activation_dropout": 0.0,
4
  "apply_spec_augment": false,
5
  "architectures": [
@@ -43,6 +43,7 @@
43
  "feat_extract_activation": "gelu",
44
  "feat_extract_norm": "group",
45
  "feat_proj_dropout": 0.0,
 
46
  "final_dropout": 0.0,
47
  "gradient_checkpointing": false,
48
  "hidden_act": "gelu",
1
  {
2
+ "_name_or_path": "ntu-spml/distilhubert",
3
  "activation_dropout": 0.0,
4
  "apply_spec_augment": false,
5
  "architectures": [
43
  "feat_extract_activation": "gelu",
44
  "feat_extract_norm": "group",
45
  "feat_proj_dropout": 0.0,
46
+ "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
48
  "gradient_checkpointing": false,
49
  "hidden_act": "gelu",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f45733908b4d346cd571f50573ebff4fb8a1dab88c2e59c605cb09c1c7c686f9
3
- size 94089804
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34af1a498aa9c0cc4e74d1319415a0570ebba2653986964a73bfcafb9d72df8b
3
+ size 94084922
runs/Oct27_23-22-06_brutasse/1635377008.532898/events.out.tfevents.1635377008.brutasse.8534.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05a86d600e9501ec13493ec9cbd88086b01e925ffbfa24256bc8ce800fc98d41
3
+ size 4544
runs/Oct27_23-22-06_brutasse/events.out.tfevents.1635377008.brutasse.8534.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f7c0a3dd9b0e011a269631a1ae8c16c656bd72ed590debb3704ab82d2b76f1
3
+ size 11457
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e61d5815111f8a234da1968e1dd6ae9e05e335f7bdd1086bc8319722fcc8a0f
3
  size 2863
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d91af76e55961ed6d42bc6636da82263b9218c6d7ec6c8988bf273631911759
3
  size 2863