ChrisGeishauser committed on
Commit
e8d30de
1 Parent(s): 0268bc5

Upload 3 files

Browse files
Files changed (4) hide show
  1. .gitattributes +1 -0
  2. config_saved.json +1 -0
  3. supervised.pol.mdl +3 -0
  4. train_INFO.log +29 -0
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ supervised.pol.mdl filter=lfs diff=lfs merge=lfs -text
config_saved.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"args": {"seed": 0, "eval_freq": 1, "dataset_name": "sgd", "model_path": ""}, "config": {"batchsz": 64, "epoch": 1, "gamma": 0.99, "policy_lr": 5e-06, "supervised_lr": 1e-05, "entropy_weight": 0.01, "value_lr": 0.0001, "save_dir": "save", "log_dir": "log", "save_per_epoch": 5000, "hidden_size": 256, "load": "save/best", "logging_mode": "INFO", "use_cer": true, "memory_size": 5000, "behaviour_cloning_weight": 0.1, "supervised_weight": 0.0, "online_offline_ratio": 0.2, "smoothed_value_function": false, "use_reservoir_sampling": false, "seed": 0, "lambda": 1, "tau": 0.001, "policy_freq": 1, "print_per_batch": 400, "c": 1.0, "rho_bar": 1, "max_length": 10, "noisy_linear": false, "dataset_name": "sgd", "data_percentage": 1.0, "dialogue_order": 0, "multiwoz_like": false, "regularization_weight": 0.0, "enc_input_dim": 128, "enc_nhead": 2, "enc_d_hid": 128, "enc_nlayers": 4, "enc_dropout": 0.1, "dec_input_dim": 128, "dec_nhead": 2, "dec_d_hid": 128, "dec_nlayers": 2, "dec_dropout": 0.0, "action_embedding_dim": 128, "domain_embedding_dim": 64, "value_embedding_dim": 12, "node_embedding_dim": 128, "roberta_path": "", "node_attention": true, "semantic_descriptions": true, "freeze_roberta": true, "use_pooled": false, "mean": true, "roberta_actions": true, "independent_descriptions": true, "random_matrix": false, "distance_metric": false, "verbose": false, "ignore_features": [], "domains_removed": ["hospital", "police", "train", "hotel", "attraction", "taxi"], "only_active_values": false, "permuted_data": false, "need_weights": false, "cls_dim": 128, "independent": true, "old_critic": false, "pos_weight": 5, "weight_decay": 1e-05}, "policy_config": null}
supervised.pol.mdl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a52f1b3ef34f075c3932d80e6d569157a307ff19796421996e393e7f8ea7bc5f
3
+ size 9331458
train_INFO.log ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Visible device: cuda
2
+ Seed used: 0
3
+ Batch size: 64
4
+ Epochs: 1
5
+ Learning rate: 1e-05
6
+ Entropy weight: 0.01
7
+ Regularization weight: 0.0
8
+ Only use multiwoz like domains: False
9
+ We use: 100.0% of the data
10
+ Dialogue order used: 0
11
+ Vectorizer: Data set used is sgd
12
+ We filter state by active domains: True
13
+ Vectorizer: Data set used is sgd
14
+ Embedding semantic descriptions: True
15
+ Embedded descriptions successfully. Size: torch.Size([1678, 768])
16
+ Data set used for descriptions: sgd
17
+ We use Roberta to embed actions.
18
+ Didnt load a model
19
+ Start training
20
+ Epoch: 0
21
+ Average actions: 1.684490442276001
22
+ Average target actions: 2.024200201034546
23
+ Precision: 0.3306945737954022
24
+ Recall: 0.27521008403361347
25
+ F1: 0.3004118891239007
26
+ <<dialog policy>> epoch 0: saved network to mdl
27
+ Best Precision: 0.3306945737954022
28
+ Best Recall: 0.27521008403361347
29
+ Best F1: 0.3004118891239007