Skip to content

Commit daa0886

Browse files
authored
Merge pull request jdlorimer#146 from 3ter/remove-regex-deprecation-warnings
Remove 'DeprecationWarning: invalid escape sequence'
2 parents (da3f227 + 5144120), commit daa0886

File tree

2 files changed

+8
-8
lines changed

2 files changed

+8
-8
lines changed

chinese/lib/jieba/__init__.py

+6 -6
Original file line number | Diff line number | Diff line change
@@ -34,19 +34,19 @@
3434

3535
pool = None
3636

37-
re_userdict = re.compile('^(.+?)( [0-9]+)?( [a-z]+)?$', re.U)
37+
re_userdict = re.compile(r'^(.+?)( [0-9]+)?( [a-z]+)?$', re.U)
3838

39-
re_eng = re.compile('[a-zA-Z0-9]', re.U)
39+
re_eng = re.compile(r'[a-zA-Z0-9]', re.U)
4040

4141
# \u4E00-\u9FD5a-zA-Z0-9+#&\._ : All non-space characters. Will be handled with re_han
4242
# \r\n|\s : whitespace characters. Will not be handled.
4343
# re_han_default = re.compile("([\u4E00-\u9FD5a-zA-Z0-9+#&\._%]+)", re.U)
4444
# Adding "-" symbol in re_han_default
45-
re_han_default = re.compile("([\u4E00-\u9FD5a-zA-Z0-9+#&\._%\-]+)", re.U)
45+
re_han_default = re.compile(r'([\u4E00-\u9FD5a-zA-Z0-9+#&\._%\-]+)', re.U)
4646

47-
re_skip_default = re.compile("(\r\n|\s)", re.U)
48-
re_han_cut_all = re.compile("([\u4E00-\u9FD5]+)", re.U)
49-
re_skip_cut_all = re.compile("[^a-zA-Z0-9+#\n]", re.U)
47+
re_skip_default = re.compile(r'(\r\n|\s)', re.U)
48+
re_han_cut_all = re.compile(r'([\u4E00-\u9FD5]+)', re.U)
49+
re_skip_cut_all = re.compile(r'[^a-zA-Z0-9+#\n]', re.U)
5050

5151
def setLogLevel(log_level):
5252
global logger

chinese/lib/jieba/finalseg/__init__.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -74,8 +74,8 @@ def __cut(sentence):
7474
if nexti < len(sentence):
7575
yield sentence[nexti:]
7676

77-
re_han = re.compile("([\u4E00-\u9FD5]+)")
78-
re_skip = re.compile("([a-zA-Z0-9]+(?:\.\d+)?%?)")
77+
re_han = re.compile(r'([\u4E00-\u9FD5]+)')
78+
re_skip = re.compile(r'([a-zA-Z0-9]+(?:\.\d+)?%?)')
7979

8080

8181
def add_force_split(word):

0 commit comments

Comments (0)