0bcc8da0344cddc9dfff82a788df519c19489500,nltk/tokenize/treebank.py,TreebankWordTokenizer,span_tokenize,#TreebankWordTokenizer#Any#,147
Before Change
else:
tokens = raw_tokens
return align_tokens(tokens, text)
class TreebankWordDetokenizer(TokenizerI):
After Change
for word_token in self.tokenize(text):
if word_token in ("``", """"):
orig_idx = text.find(word_token, ix)
quote_idx = text.find(""", ix)
if orig_idx < 0:
real_token = """
elif quote_idx < 0:
real_token = word_token
elif orig_idx < quote_idx:
real_token = word_token
else:
real_token = """
else:
real_token = word_token
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 5
Instances
Project Name: nltk/nltk
Commit Name: 0bcc8da0344cddc9dfff82a788df519c19489500
Time: 2017-10-17
Author: lyyb46@gmail.com
File Name: nltk/tokenize/treebank.py
Class Name: TreebankWordTokenizer
Method Name: span_tokenize
Project Name: akkana/scripts
Commit Name: cc1d29a7a7a20a83a78a51a37eafa22ec9fa895d
Time: 2019-06-27
Author: akkana@shallowsky.com
File Name: newreads.py
Class Name: GoodreadsAPI
Method Name: books_by_author
Project Name: deepgram/kur
Commit Name: 697d56a33afbd2602414f894745a1cc144a53d06
Time: 2016-12-12
Author: ajsyp@syptech.net
File Name: setup.py
Class Name:
Method Name: readme