You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
|
from ..char_classes import LIST_QUOTES
|
|
from ..punctuation import TOKENIZER_INFIXES as BASE_TOKENIZER_INFIXES
|
|
|
|
# Infix patterns, in order:
#   1. the literal characters "·" and "ㆍ", plus escaped "(" and ")";
#   2. a "~" that is preceded by a digit and followed by a digit or a hyphen
#      (for example the tilde in "3~5");
#   3. every entry of LIST_QUOTES (imported from ..char_classes);
#   4. every entry of BASE_TOKENIZER_INFIXES (imported from ..punctuation).
_infixes = (
    [
        "·",
        "ㆍ",
        r"\(",
        r"\)",
        r"(?<=[0-9])~(?=[0-9-])",
    ]
    + LIST_QUOTES
    + BASE_TOKENIZER_INFIXES
)
|
|
|
|
# Public alias for the private _infixes list assembled above; both names
# refer to the same list object.
TOKENIZER_INFIXES = _infixes
|