a8f7080fbcc91a80391f93c82e21238fc6f82823,tests/test_extract.py,ExtractTestCase,test_words_min_freq,#ExtractTestCase#,48

Before Change


        self.assertEqual(observed, expected)

    def test_words_min_freq(self):
        # Texts of the first 25 words expected from the fixture document when
        # stop words, punctuation and numbers are all retained and only the
        # min_freq=2 threshold is applied.
        expected = [
            ",", "I", "in", "in", "an", "for", ".", "For", ",", "we",
            "the", "education", "in", "the", ".", "And", "an",
            # The double-quote token is written with single quotes so the
            # literal cannot be misread as the start of a triple-quoted string.
            "education", "and", "he", '"', "I", "we", "to", "in"]
        # Only the leading 25 results are compared, matching len(expected).
        observed = [tok.text for tok in extract.words(
            self.spacy_doc, filter_stops=False, filter_punct=False, filter_nums=False,
            min_freq=2)][:25]
        self.assertEqual(observed, expected)

After Change


        self.assertTrue(all(tok.pos_ == "NOUN" for tok in result))

    def test_words_min_freq(self):
        # Frequency of every token in the document, keyed by lowercased form.
        lower_freqs = collections.Counter(
            token.lower_ for token in self.spacy_doc)
        # Keep stop words, punctuation and numbers so that min_freq is the
        # only filter being exercised.
        words = list(
            extract.words(
                self.spacy_doc,
                filter_stops=False,
                filter_punct=False,
                filter_nums=False,
                min_freq=2,
            )
        )
        # Each returned word must occur at least twice (case-insensitively).
        frequent_enough = all(
            lower_freqs[word.lower_] >= 2 for word in words)
        self.assertTrue(frequent_enough)
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 4

Non-data size: 7

Instances


Project Name: chartbeat-labs/textacy
Commit Name: a8f7080fbcc91a80391f93c82e21238fc6f82823
Time: 2017-11-28
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_words_min_freq


Project Name: chartbeat-labs/textacy
Commit Name: a8f7080fbcc91a80391f93c82e21238fc6f82823
Time: 2017-11-28
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_ngrams_min_freq


Project Name: chartbeat-labs/textacy
Commit Name: f127dccf797744d04255582e89bfac5163da5e6e
Time: 2017-11-30
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_ngrams_min_freq


Project Name: chartbeat-labs/textacy
Commit Name: f127dccf797744d04255582e89bfac5163da5e6e
Time: 2017-11-30
Author: burton@chartbeat.com
File Name: tests/test_extract.py
Class Name: ExtractTestCase
Method Name: test_words_min_freq