test escape characters (#171)

* test escape characters

* format

* tests

* run tests

* copyright
This commit is contained in:
Preston Rasmussen 2024-10-03 10:08:30 -04:00 committed by GitHub
parent ae9b5eca9c
commit ec2e51c5ec
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 40 additions and 2 deletions

View file

@ -25,7 +25,7 @@ def parse_db_date(neo_date: neo4j_time.DateTime | None) -> datetime | None:
def lucene_sanitize(query: str) -> str:
# Escape special characters from a query before passing into Lucene
# + - && || ! ( ) { } [ ] ^ " ~ * ? : \
# + - && || ! ( ) { } [ ] ^ " ~ * ? : \ /
escape_map = str.maketrans(
{
'+': r'\+',
@ -46,7 +46,7 @@ def lucene_sanitize(query: str) -> str:
'?': r'\?',
':': r'\:',
'\\': r'\\',
'/': r'\/'
'/': r'\/',
}
)

38
tests/helpers_test.py Normal file
View file

@ -0,0 +1,38 @@
"""
Copyright 2024, Zep Software, Inc.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""
import pytest
from graphiti_core.helpers import lucene_sanitize
def test_lucene_sanitize():
    """Check that ``lucene_sanitize`` returns the expected escaped query.

    Two cases are exercised: a query containing the Lucene special
    characters spelled out in the case itself, and a plain query that is
    expected to come back unchanged.
    """
    # Raw strings keep every backslash literal. The earlier non-raw literal
    # depended on invalid escape sequences such as '\+' and '\(' which Python
    # reports with a warning and plans to reject; the string values below are
    # identical to the ones those literals produced.
    queries = [
        (
            r'This has every secape character + - && || ! ( ) { } [ ] ^ " ~ * ? : \ /',
            r'This has every secape character \+ \- \&\& \|\| \! \( \) \{ \} \[ \] \^ \" \~ \* \? \: \\ \/',
        ),
        ('This has no escape characters', 'This has no escape characters'),
    ]

    for query, assert_result in queries:
        result = lucene_sanitize(query)
        assert assert_result == result
# Running this file as a script hands this same file to pytest.
if __name__ == '__main__':
    pytest.main(args=[__file__])