99d0fb1a8a00c80c97271b2cc58d52c4fcff0032,jieba/__init__.py,Tokenizer,load_userdict,#Tokenizer#Any#,347
Before Change
line = ln.strip().decode("utf-8").lstrip("\ufeff")
if not line:
continue
tup = line.split(" ")
freq, tag = None, None
if len(tup) == 2:
if tup[1].isdigit():
freq = tup[1]
else:
tag = tup[1]
elif len(tup) > 2:
freq, tag = tup[1], tup[2]
self.add_word(tup[0], freq, tag)
except Exception:
raise ValueError(
"invalid dictionary entry in %s at Line %s: %s" % (
After Change
f = open(f, "rb")
for lineno, ln in enumerate(f, 1):
line = ln.strip()
if not isinstance(f, text_type):
try:
line = line.decode("utf-8").lstrip("\ufeff")
except UnicodeDecodeError:
raise ValueError("dictionary file %s must be utf-8" % f.name)
if not line:
continue
// match won't be None because there's at least one character
word, freq, tag = re_userdict.match(line).groups()
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 7
Instances
Project Name: fxsjy/jieba
Commit Name: 99d0fb1a8a00c80c97271b2cc58d52c4fcff0032
Time: 2015-11-09
Author: abcdoyle888@gmail.com
File Name: jieba/__init__.py
Class Name: Tokenizer
Method Name: load_userdict
Project Name: hyperspy/hyperspy
Commit Name: 904e72663b634ce65641c3c99e2219e91aefc671
Time: 2017-01-10
Author: eric.prestat@gmail.com
File Name: hyperspy/misc/date_time_tools.py
Class Name:
Method Name: update_date_time_in_metadata
Project Name: pantsbuild/pants
Commit Name: 6ffda41d1538a5f8e6eab953346a95505c84c40c
Time: 2014-01-17
Author: travis@twitter.com
File Name: src/python/twitter/pants/targets/python_binary.py
Class Name: PythonBinary
Method Name: __init__