diff --git a/src/chat/utils/utils.py b/src/chat/utils/utils.py index e6c22a89..18542f9f 100644 --- a/src/chat/utils/utils.py +++ b/src/chat/utils/utils.py @@ -366,9 +366,12 @@ def split_into_sentences_w_remove_punctuation(text: str) -> list[str]: if not preliminary_final_sentences: return [] - if len_text < 12: split_strength = 0.2 - elif len_text < 32: split_strength = 0.5 - else: split_strength = 0.7 + if len_text < 12: + split_strength = 0.5 + elif len_text < 32: + split_strength = 0.7 + else: + split_strength = 0.9 merge_probability = 1.0 - split_strength if merge_probability == 1.0 and len(preliminary_final_sentences) > 1: