tomekkorbak committed on
Commit
076c81a
1 Parent(s): d446344

update model card README.md

Browse files
Files changed (1) hide show
  1. README.md +188 -0
README.md ADDED
@@ -0,0 +1,188 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ license: mit
5
+ tags:
6
+ - generated_from_trainer
7
+ datasets:
8
+ - tomekkorbak/detoxify-pile-chunk3-0-50000
9
+ - tomekkorbak/detoxify-pile-chunk3-50000-100000
10
+ - tomekkorbak/detoxify-pile-chunk3-100000-150000
11
+ - tomekkorbak/detoxify-pile-chunk3-150000-200000
12
+ - tomekkorbak/detoxify-pile-chunk3-200000-250000
13
+ - tomekkorbak/detoxify-pile-chunk3-250000-300000
14
+ - tomekkorbak/detoxify-pile-chunk3-300000-350000
15
+ - tomekkorbak/detoxify-pile-chunk3-350000-400000
16
+ - tomekkorbak/detoxify-pile-chunk3-400000-450000
17
+ - tomekkorbak/detoxify-pile-chunk3-450000-500000
18
+ - tomekkorbak/detoxify-pile-chunk3-500000-550000
19
+ - tomekkorbak/detoxify-pile-chunk3-550000-600000
20
+ - tomekkorbak/detoxify-pile-chunk3-600000-650000
21
+ - tomekkorbak/detoxify-pile-chunk3-650000-700000
22
+ - tomekkorbak/detoxify-pile-chunk3-700000-750000
23
+ - tomekkorbak/detoxify-pile-chunk3-750000-800000
24
+ - tomekkorbak/detoxify-pile-chunk3-800000-850000
25
+ - tomekkorbak/detoxify-pile-chunk3-850000-900000
26
+ - tomekkorbak/detoxify-pile-chunk3-900000-950000
27
+ - tomekkorbak/detoxify-pile-chunk3-950000-1000000
28
+ - tomekkorbak/detoxify-pile-chunk3-1000000-1050000
29
+ - tomekkorbak/detoxify-pile-chunk3-1050000-1100000
30
+ - tomekkorbak/detoxify-pile-chunk3-1100000-1150000
31
+ - tomekkorbak/detoxify-pile-chunk3-1150000-1200000
32
+ - tomekkorbak/detoxify-pile-chunk3-1200000-1250000
33
+ - tomekkorbak/detoxify-pile-chunk3-1250000-1300000
34
+ - tomekkorbak/detoxify-pile-chunk3-1300000-1350000
35
+ - tomekkorbak/detoxify-pile-chunk3-1350000-1400000
36
+ - tomekkorbak/detoxify-pile-chunk3-1400000-1450000
37
+ - tomekkorbak/detoxify-pile-chunk3-1450000-1500000
38
+ - tomekkorbak/detoxify-pile-chunk3-1500000-1550000
39
+ - tomekkorbak/detoxify-pile-chunk3-1550000-1600000
40
+ - tomekkorbak/detoxify-pile-chunk3-1600000-1650000
41
+ - tomekkorbak/detoxify-pile-chunk3-1650000-1700000
42
+ - tomekkorbak/detoxify-pile-chunk3-1700000-1750000
43
+ - tomekkorbak/detoxify-pile-chunk3-1750000-1800000
44
+ - tomekkorbak/detoxify-pile-chunk3-1800000-1850000
45
+ - tomekkorbak/detoxify-pile-chunk3-1850000-1900000
46
+ - tomekkorbak/detoxify-pile-chunk3-1900000-1950000
47
+ model-index:
48
+ - name: cranky_jang
49
+ results: []
50
+ ---
51
+
52
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
53
+ should probably proofread and complete it, then remove this comment. -->
54
+
55
+ # cranky_jang
56
+
57
+ This model was trained from scratch on the tomekkorbak/detoxify-pile-chunk3-0-50000, the tomekkorbak/detoxify-pile-chunk3-50000-100000, the tomekkorbak/detoxify-pile-chunk3-100000-150000, the tomekkorbak/detoxify-pile-chunk3-150000-200000, the tomekkorbak/detoxify-pile-chunk3-200000-250000, the tomekkorbak/detoxify-pile-chunk3-250000-300000, the tomekkorbak/detoxify-pile-chunk3-300000-350000, the tomekkorbak/detoxify-pile-chunk3-350000-400000, the tomekkorbak/detoxify-pile-chunk3-400000-450000, the tomekkorbak/detoxify-pile-chunk3-450000-500000, the tomekkorbak/detoxify-pile-chunk3-500000-550000, the tomekkorbak/detoxify-pile-chunk3-550000-600000, the tomekkorbak/detoxify-pile-chunk3-600000-650000, the tomekkorbak/detoxify-pile-chunk3-650000-700000, the tomekkorbak/detoxify-pile-chunk3-700000-750000, the tomekkorbak/detoxify-pile-chunk3-750000-800000, the tomekkorbak/detoxify-pile-chunk3-800000-850000, the tomekkorbak/detoxify-pile-chunk3-850000-900000, the tomekkorbak/detoxify-pile-chunk3-900000-950000, the tomekkorbak/detoxify-pile-chunk3-950000-1000000, the tomekkorbak/detoxify-pile-chunk3-1000000-1050000, the tomekkorbak/detoxify-pile-chunk3-1050000-1100000, the tomekkorbak/detoxify-pile-chunk3-1100000-1150000, the tomekkorbak/detoxify-pile-chunk3-1150000-1200000, the tomekkorbak/detoxify-pile-chunk3-1200000-1250000, the tomekkorbak/detoxify-pile-chunk3-1250000-1300000, the tomekkorbak/detoxify-pile-chunk3-1300000-1350000, the tomekkorbak/detoxify-pile-chunk3-1350000-1400000, the tomekkorbak/detoxify-pile-chunk3-1400000-1450000, the tomekkorbak/detoxify-pile-chunk3-1450000-1500000, the tomekkorbak/detoxify-pile-chunk3-1500000-1550000, the tomekkorbak/detoxify-pile-chunk3-1550000-1600000, the tomekkorbak/detoxify-pile-chunk3-1600000-1650000, the tomekkorbak/detoxify-pile-chunk3-1650000-1700000, the tomekkorbak/detoxify-pile-chunk3-1700000-1750000, the tomekkorbak/detoxify-pile-chunk3-1750000-1800000, the tomekkorbak/detoxify-pile-chunk3-1800000-1850000, the 
tomekkorbak/detoxify-pile-chunk3-1850000-1900000 and the tomekkorbak/detoxify-pile-chunk3-1900000-1950000 datasets.
58
+
59
+ ## Model description
60
+
61
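+ A model trained from scratch using the `gpt2` configuration and tokenizer with the `AWR` objective (alpha 0.5, beta 10); see the full config below. More information needed.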
62
+
63
+ ## Intended uses & limitations
64
+
65
+ More information needed
66
+
67
+ ## Training and evaluation data
68
+
69
+ More information needed
70
+
71
+ ## Training procedure
72
+
73
+ ### Training hyperparameters
74
+
75
+ The following hyperparameters were used during training:
76
+ - learning_rate: 0.001
77
+ - train_batch_size: 16
78
+ - eval_batch_size: 8
79
+ - seed: 42
80
+ - gradient_accumulation_steps: 64
81
+ - total_train_batch_size: 1024
82
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
83
+ - lr_scheduler_type: linear
84
+ - lr_scheduler_warmup_ratio: 0.01
85
+ - training_steps: 3147
86
+ - mixed_precision_training: Native AMP
87
+
88
+ ### Framework versions
89
+
90
+ - Transformers 4.20.1
91
+ - PyTorch 1.11.0+cu113
92
+ - Datasets 2.5.1
93
+ - Tokenizers 0.11.6
94
+
95
+
96
+ # Full config
97
+ {'dataset': {'datasets': ['tomekkorbak/detoxify-pile-chunk3-0-50000',
98
+ 'tomekkorbak/detoxify-pile-chunk3-50000-100000',
99
+ 'tomekkorbak/detoxify-pile-chunk3-100000-150000',
100
+ 'tomekkorbak/detoxify-pile-chunk3-150000-200000',
101
+ 'tomekkorbak/detoxify-pile-chunk3-200000-250000',
102
+ 'tomekkorbak/detoxify-pile-chunk3-250000-300000',
103
+ 'tomekkorbak/detoxify-pile-chunk3-300000-350000',
104
+ 'tomekkorbak/detoxify-pile-chunk3-350000-400000',
105
+ 'tomekkorbak/detoxify-pile-chunk3-400000-450000',
106
+ 'tomekkorbak/detoxify-pile-chunk3-450000-500000',
107
+ 'tomekkorbak/detoxify-pile-chunk3-500000-550000',
108
+ 'tomekkorbak/detoxify-pile-chunk3-550000-600000',
109
+ 'tomekkorbak/detoxify-pile-chunk3-600000-650000',
110
+ 'tomekkorbak/detoxify-pile-chunk3-650000-700000',
111
+ 'tomekkorbak/detoxify-pile-chunk3-700000-750000',
112
+ 'tomekkorbak/detoxify-pile-chunk3-750000-800000',
113
+ 'tomekkorbak/detoxify-pile-chunk3-800000-850000',
114
+ 'tomekkorbak/detoxify-pile-chunk3-850000-900000',
115
+ 'tomekkorbak/detoxify-pile-chunk3-900000-950000',
116
+ 'tomekkorbak/detoxify-pile-chunk3-950000-1000000',
117
+ 'tomekkorbak/detoxify-pile-chunk3-1000000-1050000',
118
+ 'tomekkorbak/detoxify-pile-chunk3-1050000-1100000',
119
+ 'tomekkorbak/detoxify-pile-chunk3-1100000-1150000',
120
+ 'tomekkorbak/detoxify-pile-chunk3-1150000-1200000',
121
+ 'tomekkorbak/detoxify-pile-chunk3-1200000-1250000',
122
+ 'tomekkorbak/detoxify-pile-chunk3-1250000-1300000',
123
+ 'tomekkorbak/detoxify-pile-chunk3-1300000-1350000',
124
+ 'tomekkorbak/detoxify-pile-chunk3-1350000-1400000',
125
+ 'tomekkorbak/detoxify-pile-chunk3-1400000-1450000',
126
+ 'tomekkorbak/detoxify-pile-chunk3-1450000-1500000',
127
+ 'tomekkorbak/detoxify-pile-chunk3-1500000-1550000',
128
+ 'tomekkorbak/detoxify-pile-chunk3-1550000-1600000',
129
+ 'tomekkorbak/detoxify-pile-chunk3-1600000-1650000',
130
+ 'tomekkorbak/detoxify-pile-chunk3-1650000-1700000',
131
+ 'tomekkorbak/detoxify-pile-chunk3-1700000-1750000',
132
+ 'tomekkorbak/detoxify-pile-chunk3-1750000-1800000',
133
+ 'tomekkorbak/detoxify-pile-chunk3-1800000-1850000',
134
+ 'tomekkorbak/detoxify-pile-chunk3-1850000-1900000',
135
+ 'tomekkorbak/detoxify-pile-chunk3-1900000-1950000'],
136
+ 'is_split_by_sentences': True},
137
+ 'generation': {'force_call_on': [25354],
138
+ 'metrics_configs': [{}, {'n': 1}, {'n': 2}, {'n': 5}],
139
+ 'scenario_configs': [{'generate_kwargs': {'do_sample': True,
140
+ 'max_length': 128,
141
+ 'min_length': 10,
142
+ 'temperature': 0.7,
143
+ 'top_k': 0,
144
+ 'top_p': 0.9},
145
+ 'name': 'unconditional',
146
+ 'num_samples': 2048},
147
+ {'generate_kwargs': {'do_sample': True,
148
+ 'max_length': 128,
149
+ 'min_length': 10,
150
+ 'temperature': 0.7,
151
+ 'top_k': 0,
152
+ 'top_p': 0.9},
153
+ 'name': 'challenging_rtp',
154
+ 'num_samples': 2048,
155
+ 'prompts_path': 'resources/challenging_rtp.jsonl'}],
156
+ 'scorer_config': {'device': 'cuda:0'}},
157
+ 'kl_gpt3_callback': {'force_call_on': [25354],
158
+ 'max_tokens': 64,
159
+ 'num_samples': 4096},
160
+ 'model': {'from_scratch': True,
161
+ 'gpt2_config_kwargs': {'reorder_and_upcast_attn': True,
162
+ 'scale_attn_by': True},
163
+ 'model_kwargs': {'value_head_config': {'is_detached': False}},
164
+ 'path_or_name': 'gpt2'},
165
+ 'objective': {'alpha': 0.5, 'beta': 10, 'name': 'AWR'},
166
+ 'tokenizer': {'path_or_name': 'gpt2'},
167
+ 'training': {'dataloader_num_workers': 0,
168
+ 'effective_batch_size': 1024,
169
+ 'evaluation_strategy': 'no',
170
+ 'fp16': True,
171
+ 'hub_model_id': 'cranky_jang',
172
+ 'hub_strategy': 'all_checkpoints',
173
+ 'learning_rate': 0.001,
174
+ 'logging_first_step': True,
175
+ 'logging_steps': 1,
176
+ 'num_tokens': 3300000000,
177
+ 'output_dir': 'training_output104340',
178
+ 'per_device_train_batch_size': 16,
179
+ 'push_to_hub': True,
180
+ 'remove_unused_columns': False,
181
+ 'save_steps': 25354,
182
+ 'save_strategy': 'steps',
183
+ 'seed': 42,
184
+ 'warmup_ratio': 0.01,
185
+ 'weight_decay': 0.1}}
186
+
187
+ # Wandb URL
188
+ https://wandb.ai/tomekkorbak/apo/runs/37cxyfb2