Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
40 changes: 21 additions & 19 deletions poetry.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -70,7 +70,7 @@ tqdm = "^4.62.2"
sacrebleu = "^2.3.1"
ctranslate2 = "^3.5.1"
libclang = "14.0.6"
sil-machine = {extras = ["thot"], version = "1.8.7"}
sil-machine = {extras = ["thot"], version = "1.8.8"}
datasets = "^2.7.1"
torch = {version = "^2.4", source = "torch"}
sacremoses = "^0.0.53"
Expand Down
22 changes: 17 additions & 5 deletions silnlp/common/translator.py
Original file line number Diff line number Diff line change
Expand Up @@ -336,7 +336,7 @@ def translate_book(
trg_iso: str,
produce_multiple_translations: bool = False,
save_confidences: bool = False,
chapters: List[int] = [],
chapters: Optional[List[int]] = None,
trg_project: Optional[str] = None,
postprocess_handler: Optional[PostprocessHandler] = None,
experiment_ckpt_str: str = "",
Expand Down Expand Up @@ -372,7 +372,7 @@ def translate_usfm(
trg_iso: str,
produce_multiple_translations: bool = False,
save_confidences: bool = False,
chapters: List[int] = [],
chapters: Optional[List[int]] = None,
trg_project: Optional[str] = None,
postprocess_handler: Optional[PostprocessHandler] = None,
experiment_ckpt_str: str = "",
Expand Down Expand Up @@ -440,10 +440,21 @@ def translate_usfm(
for config in postprocess_handler.configs:

# Compile draft remarks
draft_src_str = f"project {src_file_text.project}" if src_from_project else f"file {src_file_path.name}"
draft_remark = f"This draft of {sentences.get_book()} was machine translated on {date.today()} from {draft_src_str} using model {experiment_ckpt_str}. It should be reviewed and edited carefully."
remarks: List[Tuple[int, str]] = []
postprocess_remark = config.get_postprocess_remark()
remarks = [draft_remark] + ([postprocess_remark] if postprocess_remark else [])
draft_src_str = f"project {src_file_text.project}" if src_from_project else f"file {src_file_path.name}"
chapters_for_remarks = (
chapters if chapters else sorted({sr.verse_ref.chapter_num for sr in scripture_refs})
)
for chapter_num in chapters_for_remarks:
draft_remark = (
f"This draft of {sentences.get_book()} {chapter_num} was machine translated on "
f"{date.today()} from {draft_src_str} using model {experiment_ckpt_str}. It should be "
f"reviewed and edited carefully."
)
remarks.append((chapter_num, draft_remark))
if postprocess_remark:
remarks.append((chapter_num, postprocess_remark))

# Insert translation into the USFM structure of an existing project
# If the target project is not the same as the translated file's original project,
Expand All @@ -460,6 +471,7 @@ def translate_usfm(
usfm_out = dest_updater.update_usfm(
book_id=src_file_text.id,
rows=config.rows,
chapters=chapters,
text_behavior=text_behavior,
paragraph_behavior=config.get_paragraph_behavior(),
embed_behavior=config.get_embed_behavior(),
Expand Down
2 changes: 1 addition & 1 deletion silnlp/nmt/translate.py
Original file line number Diff line number Diff line change
Expand Up @@ -163,7 +163,7 @@ def translate_books(
trg_iso,
produce_multiple_translations,
save_confidences,
chapters,
chapters if chapters else None,
trg_project,
postprocess_handler,
experiment_ckpt_str,
Expand Down