mirror of
https://github.com/HIllya51/LunaTranslator.git
synced 2024-12-29 16:44:13 +08:00
Fix empty sentence. (#839)
Properly handle empty sentences when splitting the original text.
This commit is contained in:
parent
cb418e4f7f
commit
345a288f74
@ -256,13 +256,16 @@ class TS(basetrans):
|
||||
return output_ids_py
|
||||
|
||||
def translate(self, content):
|
||||
delimiters = ['.','。','\n',':',':','?','?','!','!','……','「','」']
|
||||
content_split = [i for i in re.split('(['+''.join(delimiters)+'])', content) if i]
|
||||
delimiters = ['.','。','\n',':',':','?','?','!','!','…','「','」',]
|
||||
raw_split = [i.strip() for i in re.split('(['+''.join(delimiters)+'])', content)]
|
||||
content_split = [i for i in raw_split if i]
|
||||
translated_list = []
|
||||
i = 0
|
||||
while i < len(content_split):
|
||||
sentence = content_split[i]
|
||||
if i+1 < len(content_split):
|
||||
while i + 1 < len(content_split):
|
||||
if content_split[i+1] not in delimiters:
|
||||
break
|
||||
i += 1
|
||||
sentence += content_split[i]
|
||||
input_ids_py = self.encode_as_ids(sentence)
|
||||
|
Loading…
x
Reference in New Issue
Block a user