Fix indexing in tests in chunk_by_sentence_test
This commit is contained in:
parent
928e1075c6
commit
14dd60576e
1 changed file with 2 additions and 2 deletions
|
|
@@ -15,7 +15,7 @@ maximum_length_vals = [None, 8, 64]
|
|||
)
|
||||
def test_chunk_by_sentence_isomorphism(input_text, maximum_length):
|
||||
chunks = chunk_by_sentence(input_text, maximum_length)
|
||||
- reconstructed_text = "".join([chunk[2] for chunk in chunks])
|
||||
+ reconstructed_text = "".join([chunk[1] for chunk in chunks])
|
||||
assert (
|
||||
reconstructed_text == input_text
|
||||
), f"texts are not identical: {len(input_text) = }, {len(reconstructed_text) = }"
|
||||
|
|
@@ -33,7 +33,7 @@ def test_chunk_by_sentence_isomorphism(input_text, maximum_length):
|
|||
def test_paragraph_chunk_length(input_text, maximum_length):
|
||||
chunks = list(chunk_by_sentence(input_text, maximum_length))
|
||||
|
||||
- chunk_lengths = np.array([len(list(chunk_by_word(chunk[2]))) for chunk in chunks])
|
||||
+ chunk_lengths = np.array([len(list(chunk_by_word(chunk[1]))) for chunk in chunks])
|
||||
|
||||
larger_chunks = chunk_lengths[chunk_lengths > maximum_length]
|
||||
assert np.all(
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue