Skip to content

Commit e2d7c3b

Browse files
authored
Merge pull request #349 from funstory-ai/dev
feat: improve paragraph translation handling and unicode management in LLM processing
2 parents (3895911 + c4f907d), commit e2d7c3b

File tree

5 files changed

+19
-6
lines changed

5 files changed

+19
-6
lines changed

babeldoc/__init__.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -1 +1 @@
1-
__version__ = "0.3.41"
1+
__version__ = "0.3.42"

babeldoc/const.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
33
import subprocess
44
from pathlib import Path
55

6-
__version__ = "0.3.41"
6+
__version__ = "0.3.42"
77

88
CACHE_FOLDER = Path.home() / ".cache" / "babeldoc"
99

babeldoc/document_il/midend/il_translator_llm_only.py

+14-1
Original file line number | Diff line number | Diff line change
@@ -224,6 +224,7 @@ def translate_paragraph(
224224
try:
225225
inputs = []
226226
llm_translate_trackers = []
227+
paragraph_unicodes = []
227228
for i in range(len(batch_paragraph.paragraphs)):
228229
paragraph = batch_paragraph.paragraphs[i]
229230
tracker = batch_paragraph.trackers[i]
@@ -237,8 +238,16 @@ def translate_paragraph(
237238
should_translate_paragraph.append(i)
238239
llm_translate_trackers.append(llm_translate_tracker)
239240
inputs.append(
240-
(text, translate_input, paragraph, tracker, llm_translate_tracker)
241+
(
242+
text,
243+
translate_input,
244+
paragraph,
245+
tracker,
246+
llm_translate_tracker,
247+
paragraph_unicodes,
248+
)
241249
)
250+
paragraph_unicodes.append(paragraph.unicode)
242251
if not inputs:
243252
return
244253
json_format_input = []
@@ -454,6 +463,8 @@ def translate_paragraph(
454463
paragraph_token_count = self.calc_token_count(
455464
inputs[id_][2].unicode
456465
)
466+
paragraph_unicodes = inputs[id_][5]
467+
inputs[id_][2].unicode = paragraph_unicodes[id_]
457468
executor.submit(
458469
self.il_translator.translate_paragraph,
459470
inputs[id_][2],
@@ -473,6 +484,8 @@ def translate_paragraph(
473484
for llm_translate_tracker in llm_translate_trackers:
474485
llm_translate_tracker.set_error_message(error_message)
475486
llm_translate_tracker.set_fallback_to_translate()
487+
for input_ in inputs:
488+
input_[2].unicode = input_[5]
476489
if not should_translate_paragraph:
477490
should_translate_paragraph = list(
478491
range(len(batch_paragraph.paragraphs))

babeldoc/main.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@
2323
from babeldoc.translation_config import WatermarkOutputMode
2424

2525
logger = logging.getLogger(__name__)
26-
__version__ = "0.3.41"
26+
__version__ = "0.3.42"
2727

2828

2929
def create_parser():

pyproject.toml

+2-2
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
[project]
22
name = "BabelDOC"
3-
version = "0.3.41"
3+
version = "0.3.42"
44
description = "Yet Another Document Translator"
55
license = "AGPL-3.0"
66
readme = "README.md"
@@ -150,7 +150,7 @@ pythonpath = [".", "src"]
150150
testpaths = ["tests"]
151151

152152
[bumpver]
153-
current_version = "0.3.41"
153+
current_version = "0.3.42"
154154
version_pattern = "MAJOR.MINOR.PATCH[.PYTAGNUM]"
155155

156156
[bumpver.file_patterns]

0 commit comments

Comments
 (0)