remove delimiter for naive parser
This commit is contained in:
parent
0cc0a91cbf
commit
4a053b8c08
1 changed file with 1 addition and 1 deletion
|
|
@@ -246,7 +246,7 @@ def naive_merge(sections, chunk_token_num=128, delimiter="\n。;!?"):
|
|||
tk_nums[-1] += tnum
|
||||
|
||||
for sec, pos in sections:
|
||||
add_chunk(sec[s: e], pos)
|
||||
add_chunk(sec, pos)
|
||||
continue
|
||||
s, e = 0, 1
|
||||
while e < len(sec):
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue