Spaces:

jesseplusplus
/

easy-translate

Running

Iker commited on May 13, 2022

Commit

ed535ee

1 Parent(s): d3c75c1

Print in standard format

Files changed (1) hide show

translate.py CHANGED Viewed

@@ -138,7 +138,6 @@ def main(
             total=total_lines, desc="Dataset translation", leave=True, ascii=True
         ) as pbar, open(output_path, "w", encoding="utf-8") as output_file:
             with torch.no_grad():
-                first_batch = True
                 for batch in data_loader:
                     batch["input_ids"] = batch["input_ids"]
                     batch["attention_mask"] = batch["attention_mask"]
@@ -158,11 +157,8 @@ def main(
                     tgt_text = tokenizer.batch_decode(
                         generated_tokens, skip_special_tokens=True
                     )
-                    if not first_batch:
-                        print(file=output_file)
-                    else:
-                        first_batch = False
-                    print("\n".join(tgt_text), file=output_file, end="")
                     pbar.update(len(tgt_text))

             total=total_lines, desc="Dataset translation", leave=True, ascii=True
         ) as pbar, open(output_path, "w", encoding="utf-8") as output_file:
             with torch.no_grad():
                 for batch in data_loader:
                     batch["input_ids"] = batch["input_ids"]
                     batch["attention_mask"] = batch["attention_mask"]
                     tgt_text = tokenizer.batch_decode(
                         generated_tokens, skip_special_tokens=True
                     )
+                    print("\n".join(tgt_text), file=output_file)
                     pbar.update(len(tgt_text))