From 4e9d8f8e6f0f6221abb81d8495e1c1a5a63186c8 Mon Sep 17 00:00:00 2001
From: Kevin Hu
Date: Fri, 28 Nov 2025 17:57:49 +0800
Subject: [PATCH] Code format.

---
 agent/canvas.py     | 1 -
 rag/nlp/__init__.py | 2 +-
 2 files changed, 1 insertion(+), 2 deletions(-)

diff --git a/agent/canvas.py b/agent/canvas.py
index 2dfeb63e6..c8b6f9e38 100644
--- a/agent/canvas.py
+++ b/agent/canvas.py
@@ -13,7 +13,6 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
-import base64
 import json
 import logging
 import re
diff --git a/rag/nlp/__init__.py b/rag/nlp/__init__.py
index cc679bc53..334c63645 100644
--- a/rag/nlp/__init__.py
+++ b/rag/nlp/__init__.py
@@ -266,7 +266,7 @@ def is_chinese(text):
 
 def tokenize(d, txt, eng):
     d["content_with_weight"] = txt
-    t = re.sub(r"</?(table|td|caption|tr|th)( [^<>]{0,12})?>", " ", t)
+    t = re.sub(r"</?(table|td|caption|tr|th)( [^<>]{0,12})?>", " ", txt)
     d["content_ltks"] = rag_tokenizer.tokenize(t)
     d["content_sm_ltks"] = rag_tokenizer.fine_grained_tokenize(d["content_ltks"])
 