From 3c4f4bfd44f09a843dc07c9cc68d5b875e5e66a4 Mon Sep 17 00:00:00 2001 From: Chaoying <32626585+Chaoyingz@users.noreply.github.com> Date: Tue, 29 Mar 2022 09:16:21 +0800 Subject: [PATCH] Fix Chinese punctuation regex comment (#1012) --- qlib/utils/__init__.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/qlib/utils/__init__.py b/qlib/utils/__init__.py index 50fb785d8..eaacc613c 100644 --- a/qlib/utils/__init__.py +++ b/qlib/utils/__init__.py @@ -271,7 +271,11 @@ def parse_field(field): if not isinstance(field, str): field = str(field) - # Chinese Punctuation Regex: \nff08 = (, \nff09 = ), \nff1a = :, \n3001 = 。 + # Chinese punctuation regex: + # \u3001 -> 、 + # \uff1a -> : + # \uff08 -> ( + # \uff09 -> ) chinese_punctuation_regex = r"\u3001\uff1a\uff08\uff09" for pattern, new in [ (rf"\$\$([\w{chinese_punctuation_regex}]+)", r'PFeature("\1")'), # $$ must be before $