Skip to content

Commit

Permalink
Update step3_2_splitbymeaning.py
Browse files Browse the repository at this point in the history
  • Loading branch information
Huanshere committed Sep 12, 2024
1 parent 807592a commit 9e42551
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion core/step3_2_splitbymeaning.py
Original file line number Diff line number Diff line change
Expand Up @@ -79,7 +79,7 @@ def parallel_split_sentences(sentences, max_length, max_workers, nlp, retry_atte
for index, sentence in enumerate(sentences):
# Use tokenizer to split the sentence
tokens = tokenize_sentence(sentence, nlp)
- print("Tokenization result:", tokens)
+ # print("Tokenization result:", tokens)
num_parts = math.ceil(len(tokens) / max_length)
if len(tokens) > max_length:
future = executor.submit(split_sentence, sentence, num_parts, max_length, index=index, retry_attempt=retry_attempt)
Expand Down

0 comments on commit 9e42551

Please sign in to comment.