a8f7080fbcc91a80391f93c82e21238fc6f82823,tests/test_extract.py,ExtractTestCase,test_words_min_freq,#ExtractTestCase#,48
Before Change
self.assertEqual(observed, expected)
def test_words_min_freq(self):
expected = [
",", "I", "in", "in", "an", "for", ".", "For", ",", "we",
"the", "education", "in", "the", ".", "And", "an",
"education", "and", "he", """, "I", "we", "to", "in"]
observed = [tok.text for tok in extract.words(
self.spacy_doc, filter_stops=False, filter_punct=False, filter_nums=False,
min_freq=2)][:25]
self.assertEqual(observed, expected)
After Change
self.assertTrue(all(tok.pos_ == "NOUN" for tok in result))
def test_words_min_freq(self):
counts = collections.Counter()
counts.update(tok.lower_ for tok in self.spacy_doc)
result = [tok for tok in extract.words(
self.spacy_doc, filter_stops=False, filter_punct=False, filter_nums=False,
min_freq=2)]
self.assertTrue(all(counts[tok.lower_] >= 2 for tok in result))
In pattern: SUPERPATTERN
Frequency: 4
Non-data size: 7
Instances Project Name: chartbeat-labs/textacy
Commit Name: a8f7080fbcc91a80391f93c82e21238fc6f82823
Time: 2017-11-28
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_words_min_freq
Project Name: chartbeat-labs/textacy
Commit Name: a8f7080fbcc91a80391f93c82e21238fc6f82823
Time: 2017-11-28
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_ngrams_min_freq
Project Name: chartbeat-labs/textacy
Commit Name: f127dccf797744d04255582e89bfac5163da5e6e
Time: 2017-11-30
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_ngrams_min_freq
Project Name: chartbeat-labs/textacy
Commit Name: f127dccf797744d04255582e89bfac5163da5e6e
Time: 2017-11-30
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_words_min_freq