2e09234b68
Signed-off-by: wiseaidev <business@wiseai.dev> Signed-off-by: wiseaidev <business@wiseai.dev>
26 lines
823 B
Python
26 lines
823 B
Python
import re
|
|
from typing import Optional, Pattern
|
|
|
|
|
|
class TokenEscaper:
    """
    Escape punctuation within an input string.

    Every character matched by the configured regular expression is
    prefixed with a single backslash; all other characters are returned
    unchanged.
    """

    # Characters that RediSearch requires us to escape during queries.
    # Source: https://redis.io/docs/stack/search/reference/escaping/#the-rules-of-text-field-tokenization
    DEFAULT_ESCAPED_CHARS = r"[,.<>{}\[\]\\\"\':;!@#$%^&*()\-+=~\ ]"

    def __init__(self, escape_chars_re: Optional[Pattern] = None):
        """
        Create an escaper.

        Args:
            escape_chars_re: A compiled pattern whose matches should be
                escaped. When omitted (``None``), a pattern compiled from
                ``DEFAULT_ESCAPED_CHARS`` is used.
        """
        # Explicit None check: the question is "was a pattern supplied?",
        # not "is the supplied object truthy?".
        if escape_chars_re is not None:
            self.escaped_chars_re = escape_chars_re
        else:
            self.escaped_chars_re = re.compile(self.DEFAULT_ESCAPED_CHARS)

    def escape(self, value: str) -> str:
        """
        Return ``value`` with every matched character backslash-escaped.

        Args:
            value: The string to escape.

        Returns:
            A copy of ``value`` in which each match of
            ``self.escaped_chars_re`` is preceded by a backslash.
        """

        def prefix_with_backslash(match):
            # group(0) is the full matched text; emit it after one
            # literal backslash.
            return f"\\{match.group(0)}"

        return self.escaped_chars_re.sub(prefix_with_backslash, value)
|