model update
Browse files- config.json +1 -1
- eval/metric.first.answer.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.first.answer.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.first.answer.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.first.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.first.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.last.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.last.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.last.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.long.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.long.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.long.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.middle.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.middle.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.middle.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.short.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.short.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/metric.short.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json +1 -0
- eval/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval/samples.test.hyp.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval/samples.test.hyp.sentence_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval/samples.validation.hyp.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- eval/samples.validation.hyp.sentence_answer.question.asahi417_qg_squadshifts.amazon.txt +0 -0
- pytorch_model.bin +2 -2
- tokenizer_config.json +1 -1
- trainer_config.json +1 -0
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"add_prefix": true,
|
4 |
"architectures": [
|
5 |
"T5ForConditionalGeneration"
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "t5-small",
|
3 |
"add_prefix": true,
|
4 |
"architectures": [
|
5 |
"T5ForConditionalGeneration"
|
eval/metric.first.answer.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.04290566129938567, "Bleu_2": 0.013053374665617686, "Bleu_3": 0.004627188561090198, "Bleu_4": 0.0019199816607240786, "METEOR": 0.05189936204343655, "ROUGE_L": 0.05350355677017498, "BERTScore": 0.8152750407897152, "MoverScore": 0.5051068235474198}, "test": {"Bleu_1": 0.04481589542142716, "Bleu_2": 0.014121203784322248, "Bleu_3": 0.005936629808173858, "Bleu_4": 0.002994793670824618, "METEOR": 0.052031642408706856, "ROUGE_L": 0.05530195153707644, "BERTScore": 0.8176489767517845, "MoverScore": 0.5049897780978438}}
|
eval/metric.first.answer.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03612839366515709, "Bleu_2": 0.01116952817389538, "Bleu_3": 0.0047731681167366875, "Bleu_4": 0.002184159866779065, "METEOR": 0.040572153636078044, "ROUGE_L": 0.03453086893568191, "BERTScore": 0.7804537044422141, "MoverScore": 0.5027725998161208}, "test": {"Bleu_1": 0.035713011947928, "Bleu_2": 0.011901015684313369, "Bleu_3": 0.005348024767184312, "Bleu_4": 0.002925686102006162, "METEOR": 0.03893999820800414, "ROUGE_L": 0.035950601628877005, "BERTScore": 0.7794891686296714, "MoverScore": 0.5022117505274228}}
|
eval/metric.first.answer.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.07604584860650049, "Bleu_2": 0.033596061392643414, "Bleu_3": 0.017061678428897983, "Bleu_4": 0.009968373866813422, "METEOR": 0.052111850077991705, "ROUGE_L": 0.06506860627129887, "BERTScore": 0.750528070496992, "MoverScore": 0.5110558106033206}, "test": {"Bleu_1": 0.0822782352027326, "Bleu_2": 0.04059886616248794, "Bleu_3": 0.02335872841144139, "Bleu_4": 0.01444897550966233, "METEOR": 0.054213014539944274, "ROUGE_L": 0.06922636855397667, "BERTScore": 0.7465991752681246, "MoverScore": 0.5115809834602486}}
|
eval/metric.first.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.043116677392207245, "Bleu_2": 0.013170705505483141, "Bleu_3": 0.004675227675292343, "Bleu_4": 0.0019412941966986921, "METEOR": 0.05206199705925229, "ROUGE_L": 0.05374112204796383, "BERTScore": 0.8151429012143538, "MoverScore": 0.5051581469544685}, "test": {"Bleu_1": 0.045631512158907074, "Bleu_2": 0.014495610094339766, "Bleu_3": 0.006016757914670315, "Bleu_4": 0.002993000643302378, "METEOR": 0.05265268648700494, "ROUGE_L": 0.055881379876925555, "BERTScore": 0.817735575513811, "MoverScore": 0.5049508670556511}}
|
eval/metric.first.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03624252408408709, "Bleu_2": 0.011260729966972879, "Bleu_3": 0.004820151411066952, "Bleu_4": 0.0022074834534034846, "METEOR": 0.040554605600931944, "ROUGE_L": 0.034537394137885154, "BERTScore": 0.7804314222072531, "MoverScore": 0.5027822526483483}, "test": {"Bleu_1": 0.03633982648551272, "Bleu_2": 0.012015230269655026, "Bleu_3": 0.005322987797950195, "Bleu_4": 0.0029127471280701875, "METEOR": 0.03912983626636803, "ROUGE_L": 0.036253412494811794, "BERTScore": 0.7794026645046798, "MoverScore": 0.5020943299559956}}
|
eval/metric.first.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.0763758231420463, "Bleu_2": 0.033916478645778035, "Bleu_3": 0.017228753374083347, "Bleu_4": 0.010066800004813903, "METEOR": 0.052260075359249245, "ROUGE_L": 0.06543701661170866, "BERTScore": 0.7498494936278992, "MoverScore": 0.5109176559258664}, "test": {"Bleu_1": 0.08523020409847731, "Bleu_2": 0.04234884887704143, "Bleu_3": 0.024398335447912943, "Bleu_4": 0.015161513452290607, "METEOR": 0.055491290065925195, "ROUGE_L": 0.07098243982330889, "BERTScore": 0.7459425859796279, "MoverScore": 0.5116814254947332}}
|
eval/metric.last.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.04318461917673051, "Bleu_2": 0.013194704574756572, "Bleu_3": 0.004673865561205807, "Bleu_4": 0.0019386107196008996, "METEOR": 0.05216346982690336, "ROUGE_L": 0.05371733654954279, "BERTScore": 0.8152713727000301, "MoverScore": 0.5051376096965516}, "test": {"Bleu_1": 0.04548876409355573, "Bleu_2": 0.014276939570918938, "Bleu_3": 0.005870371340139266, "Bleu_4": 0.002880383666774421, "METEOR": 0.052571653721727264, "ROUGE_L": 0.05580163039454399, "BERTScore": 0.8176188937145633, "MoverScore": 0.5049757873609766}}
|
eval/metric.last.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03624252408408709, "Bleu_2": 0.011260729966972879, "Bleu_3": 0.004820151411066952, "Bleu_4": 0.0022074834534034846, "METEOR": 0.040554605600931944, "ROUGE_L": 0.034537394137885154, "BERTScore": 0.7804314293378701, "MoverScore": 0.5027822526483483}, "test": {"Bleu_1": 0.03633982648551272, "Bleu_2": 0.012015230269655026, "Bleu_3": 0.005322987797950195, "Bleu_4": 0.0029127471280701875, "METEOR": 0.03912983626636803, "ROUGE_L": 0.036253412494811794, "BERTScore": 0.7794026651828777, "MoverScore": 0.5020943299559956}}
|
eval/metric.last.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.07623634441442052, "Bleu_2": 0.033793047141879515, "Bleu_3": 0.01717965703983972, "Bleu_4": 0.010041982233439363, "METEOR": 0.05227462473304259, "ROUGE_L": 0.06526642804080211, "BERTScore": 0.7501313740856077, "MoverScore": 0.5109041491453634}, "test": {"Bleu_1": 0.08457351023533864, "Bleu_2": 0.041681380166993506, "Bleu_3": 0.02387056007162457, "Bleu_4": 0.014816030462875508, "METEOR": 0.05499395607679083, "ROUGE_L": 0.07047058703732026, "BERTScore": 0.7458811996959729, "MoverScore": 0.5115901248568412}}
|
eval/metric.long.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.04319420132639622, "Bleu_2": 0.013197693494815303, "Bleu_3": 0.004674945249651668, "Bleu_4": 0.0019390673022873675, "METEOR": 0.05216176610258244, "ROUGE_L": 0.05371733654954279, "BERTScore": 0.8151580313232047, "MoverScore": 0.5051189018475749}, "test": {"Bleu_1": 0.04570762878826776, "Bleu_2": 0.014547708495636033, "Bleu_3": 0.006068327438522486, "Bleu_4": 0.0030446950651127525, "METEOR": 0.05285644460594556, "ROUGE_L": 0.056105497624388004, "BERTScore": 0.8174572320084759, "MoverScore": 0.5048283919231693}}
|
eval/metric.long.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03624252408408709, "Bleu_2": 0.011260729966972879, "Bleu_3": 0.004820151411066952, "Bleu_4": 0.0022074834534034846, "METEOR": 0.040554605600931944, "ROUGE_L": 0.034537394137885154, "BERTScore": 0.7804314247303945, "MoverScore": 0.5027822526483483}, "test": {"Bleu_1": 0.03633982648551272, "Bleu_2": 0.012015230269655026, "Bleu_3": 0.005322987797950195, "Bleu_4": 0.0029127471280701875, "METEOR": 0.03912983626636803, "ROUGE_L": 0.036253412494811794, "BERTScore": 0.7794026629819334, "MoverScore": 0.5020943299559956}}
|
eval/metric.long.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.07651590895723834, "Bleu_2": 0.03395305595761596, "Bleu_3": 0.017243166303052154, "Bleu_4": 0.010074282853718327, "METEOR": 0.052376151921151345, "ROUGE_L": 0.06557340347103441, "BERTScore": 0.7498414388097868, "MoverScore": 0.5109775663786402}, "test": {"Bleu_1": 0.08532964574775115, "Bleu_2": 0.042284928813845046, "Bleu_3": 0.024285490536015752, "Bleu_4": 0.015040949045617947, "METEOR": 0.05584240863470676, "ROUGE_L": 0.07135539735686057, "BERTScore": 0.7465991082750405, "MoverScore": 0.5117052102923553}}
|
eval/metric.middle.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.04319420132639622, "Bleu_2": 0.013197693494815303, "Bleu_3": 0.004674945249651668, "Bleu_4": 0.0019390673022873675, "METEOR": 0.052137864057332256, "ROUGE_L": 0.05371733654954279, "BERTScore": 0.8151564011910211, "MoverScore": 0.5051188499624129}, "test": {"Bleu_1": 0.045636859155653436, "Bleu_2": 0.014427834629933531, "Bleu_3": 0.005982626503946396, "Bleu_4": 0.0029744280735005684, "METEOR": 0.05280098648266344, "ROUGE_L": 0.05607868356020809, "BERTScore": 0.8175508585443001, "MoverScore": 0.5048571838904148}}
|
eval/metric.middle.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03624252408408709, "Bleu_2": 0.011260729966972879, "Bleu_3": 0.004820151411066952, "Bleu_4": 0.0022074834534034846, "METEOR": 0.040554605600931944, "ROUGE_L": 0.034537394137885154, "BERTScore": 0.7804314252789035, "MoverScore": 0.5027822526483483}, "test": {"Bleu_1": 0.03633982648551272, "Bleu_2": 0.012015230269655026, "Bleu_3": 0.005322987797950195, "Bleu_4": 0.0029127471280701875, "METEOR": 0.03912983626636803, "ROUGE_L": 0.036253412494811794, "BERTScore": 0.7794026698790788, "MoverScore": 0.5020943299559956}}
|
eval/metric.middle.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.076398683591909, "Bleu_2": 0.0339127866008168, "Bleu_3": 0.017224262425249007, "Bleu_4": 0.01006347191887409, "METEOR": 0.05233066205652623, "ROUGE_L": 0.06548279012264836, "BERTScore": 0.7499170074433636, "MoverScore": 0.5109643170431181}, "test": {"Bleu_1": 0.08520490382065388, "Bleu_2": 0.042234661434540896, "Bleu_3": 0.024295370008397026, "Bleu_4": 0.015060108481865581, "METEOR": 0.055744955009394005, "ROUGE_L": 0.07121607766938139, "BERTScore": 0.7464687786756437, "MoverScore": 0.5117216698086959}}
|
eval/metric.short.sentence.paragraph_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.04310707480636354, "Bleu_2": 0.013167710710194604, "Bleu_3": 0.004674143483404549, "Bleu_4": 0.0019408351735300698, "METEOR": 0.05206366133877939, "ROUGE_L": 0.05374112204796383, "BERTScore": 0.8152562464307422, "MoverScore": 0.5051768548034452}, "test": {"Bleu_1": 0.04538323426360063, "Bleu_2": 0.014213060536575365, "Bleu_3": 0.005812033931171208, "Bleu_4": 0.0028226945926885585, "METEOR": 0.052344684481866785, "ROUGE_L": 0.055556660734854164, "BERTScore": 0.8178340481068761, "MoverScore": 0.5050756117958667}}
|
eval/metric.short.sentence.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.03624252408408709, "Bleu_2": 0.011260729966972879, "Bleu_3": 0.004820151411066952, "Bleu_4": 0.0022074834534034846, "METEOR": 0.040554605600931944, "ROUGE_L": 0.034537394137885154, "BERTScore": 0.7804314203423225, "MoverScore": 0.5027822526483483}, "test": {"Bleu_1": 0.03633982648551272, "Bleu_2": 0.012015230269655026, "Bleu_3": 0.005322987797950195, "Bleu_4": 0.0029127471280701875, "METEOR": 0.03912983626636803, "ROUGE_L": 0.036253412494811794, "BERTScore": 0.7794026727070364, "MoverScore": 0.5020943299559956}}
|
eval/metric.short.sentence.sentence_answer.question.asahi417_qg_squadshifts.amazon.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"validation": {"Bleu_1": 0.07621342108355411, "Bleu_2": 0.03379669579604187, "Bleu_3": 0.0171841237901245, "Bleu_4": 0.010045296654859997, "METEOR": 0.05220398702408211, "ROUGE_L": 0.0652206545298624, "BERTScore": 0.7500638603432778, "MoverScore": 0.5108574880281117}, "test": {"Bleu_1": 0.0844491080797464, "Bleu_2": 0.04175536795345092, "Bleu_3": 0.024001094555284125, "Bleu_4": 0.014940084682124804, "METEOR": 0.05467329259772323, "ROUGE_L": 0.07015062102976598, "BERTScore": 0.7451926632954257, "MoverScore": 0.5115565518029267}}
|
eval/samples.test.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval/samples.test.hyp.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval/samples.test.hyp.sentence_answer.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval/samples.validation.hyp.paragraph_answer.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval/samples.validation.hyp.paragraph_sentence.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
eval/samples.validation.hyp.sentence_answer.question.asahi417_qg_squadshifts.amazon.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1764557a426c6d867ba7b155baaaad95133001b5cd6079ebcd6cb9210f219156
|
3 |
+
size 242030331
|
tokenizer_config.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 100, "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"], "model_max_length": 512, "name_or_path": "
|
|
|
1 |
+
{"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 100, "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"], "model_max_length": 512, "name_or_path": "t5-small", "tokenizer_class": "T5Tokenizer"}
|
trainer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"dataset_path": "asahi417/qg_squadshifts", "dataset_name": "amazon", "input_types": ["paragraph_answer"], "output_types": ["question"], "prefix_types": ["qg"], "model": "t5-small", "max_length": 512, "max_length_output": 32, "epoch": 1, "batch": 32, "lr": 1e-05, "fp16": false, "random_seed": 1, "gradient_accumulation_steps": 4, "label_smoothing": 0.15}
|