Iker committed on
Commit
ed535ee
·
1 Parent(s): d3c75c1

Print in standard format

Browse files
Files changed (1) hide show
  1. translate.py +2 -6
translate.py CHANGED
@@ -138,7 +138,6 @@ def main(
138
  total=total_lines, desc="Dataset translation", leave=True, ascii=True
139
  ) as pbar, open(output_path, "w", encoding="utf-8") as output_file:
140
  with torch.no_grad():
141
- first_batch = True
142
  for batch in data_loader:
143
  batch["input_ids"] = batch["input_ids"]
144
  batch["attention_mask"] = batch["attention_mask"]
@@ -158,11 +157,8 @@ def main(
158
  tgt_text = tokenizer.batch_decode(
159
  generated_tokens, skip_special_tokens=True
160
  )
161
- if not first_batch:
162
- print(file=output_file)
163
- else:
164
- first_batch = False
165
- print("\n".join(tgt_text), file=output_file, end="")
166
 
167
  pbar.update(len(tgt_text))
168
 
 
138
  total=total_lines, desc="Dataset translation", leave=True, ascii=True
139
  ) as pbar, open(output_path, "w", encoding="utf-8") as output_file:
140
  with torch.no_grad():
 
141
  for batch in data_loader:
142
  batch["input_ids"] = batch["input_ids"]
143
  batch["attention_mask"] = batch["attention_mask"]
 
157
  tgt_text = tokenizer.batch_decode(
158
  generated_tokens, skip_special_tokens=True
159
  )
160
+
161
+ print("\n".join(tgt_text), file=output_file)
 
 
 
162
 
163
  pbar.update(len(tgt_text))
164