e998834136c5074583f528b7422c56ab57009c1f,nlp_architect/utils/text.py,SpacyTokenizer,__init__,#SpacyTokenizer#Any#,120

Before Change


            print("    python -m spacy download en_core_web_sm")
            print("")
            print("Spacy license:  MIT")
            print("Link to license: https://github.com/explosion/spaCy/blob/master/LICENSE")
            print("The terms and conditions of the data set license apply. Intel does not "
                  "grant any rights to the data files or database")
            sys.exit(0)

After Change


                  "https://creativecommons.org/licenses/by-sa/3.0/")
            response = input("To download the model from {}, "
                             + "please type YES: ".format(url))
            if response.lower().strip() == "yes":
                print("The terms and conditions of the data set license apply. Intel does not "
                      "grant any rights to the data files or database")
                print("Downloading Spacy model...")
                spacy_download(model)
                self.parser = spacy.load(model, disable=pipeline_opts)
            else:
                print("Download declined. Response received {} != YES. ".format(response))
                print("Please download the model manually")
                sys.exit(0)

    def tokenize(self, text):
        
        Tokenize a sentence into tokens
        Args:

In pattern: SUPERPATTERN

Frequency: 4

Non-data size: 4

Instances


Project Name: NervanaSystems/nlp-architect
Commit Name: e998834136c5074583f528b7422c56ab57009c1f
Time: 2018-05-09
Author: peter.izsak@intel.com
File Name: nlp_architect/utils/text.py
Class Name: SpacyTokenizer
Method Name: __init__


Project Name: hellohaptik/chatbot_ner
Commit Name: f271ea86878e4b01d3630bd296bc863928c0ca52
Time: 2019-09-30
Author: ruthvik@haptik.co
File Name: ner_v2/detectors/temporal/date/en/date_detection.py
Class Name: DateDetector
Method Name: _date_identification_everyday_except_weekends


Project Name: catalyst-cooperative/pudl
Commit Name: 4875e1c7fe16594cb2bf9fbb7ab04c0bae21424c
Time: 2019-07-08
Author: cgosnell@catalyst.coop
File Name: pudl/ETL_pkg.py
Class Name:
Method Name: _input_validate_epacems


Project Name: akkana/scripts
Commit Name: 3ae1e3fd5fad7676bdb48f94809a737648394f77
Time: 2020-07-27
Author: akkana@shallowsky.com
File Name: starstack.py
Class Name:
Method Name: register_all