bff5f111e188c26eff86d94249d5bf603f35d5e9,parlai/tasks/insuranceqa/build.py,,build,#Any#,71

Before Change


        build_data.untar(dpath, fname)

        // According to the author, V2 holds the latest data
        dpext = os.path.join(dpath, "insuranceQA-master/V2")

        // read vocab file
        vocab_path = os.path.join(dpext, "vocabulary")
        d_vocab = read_vocab(vocab_path)

        // read label2answer file
        label2answer_path_gz = os.path.join(dpext, "InsuranceQA.label2answer.token.encoded.gz")
        d_label_answer = read_label2answer(label2answer_path_gz, d_vocab)

        // TODO: right now it uses 100 by default, but 500, 1000, 1500 (number of label candidates) should also be available
        train_path_gz = os.path.join(dpext, "InsuranceQA.question.anslabel.token.100.pool.solr.train.encoded.gz")
        valid_path_gz = os.path.join(dpext, "InsuranceQA.question.anslabel.token.100.pool.solr.valid.encoded.gz")
        test_path_gz = os.path.join(dpext, "InsuranceQA.question.anslabel.token.100.pool.solr.test.encoded.gz")

        create_fb_format(dpath, "train", train_path_gz, d_vocab, d_label_answer)
        create_fb_format(dpath, "valid", valid_path_gz, d_vocab, d_label_answer)
        create_fb_format(dpath, "test", test_path_gz, d_vocab, d_label_answer)

After Change


        // Download the data from github.
        fname = "insuranceqa.zip"
        url = "https://github.com/shuzi/insuranceQA/archive/master.zip"
        print("[downloading data from: " + url + "]")
        build_data.download(url, dpath, fname)
        build_data.untar(dpath, fname)

        ParseInsuranceQAV1.build(dpath)
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 10

Instances


Project Name: facebookresearch/ParlAI
Commit Name: bff5f111e188c26eff86d94249d5bf603f35d5e9
Time: 2017-07-13
Author: chao@wayblazer.com
File Name: parlai/tasks/insuranceqa/build.py
Class Name:
Method Name: build


Project Name: facebookresearch/ParlAI
Commit Name: bff5f111e188c26eff86d94249d5bf603f35d5e9
Time: 2017-07-13
Author: chao@wayblazer.com
File Name: parlai/tasks/insuranceqa/build.py
Class Name:
Method Name: build


Project Name: pyprob/pyprob
Commit Name: 2728afcd57721b34f95ba575507a3db6c86c1f4c
Time: 2018-02-21
Author: atilimgunes.baydin@gmail.com
File Name: tests/test_model_remote.py
Class Name:
Method Name:


Project Name: yangyanli/PointCNN
Commit Name: 161b24af716a1e7a3221fce2903544ac1429387d
Time: 2018-06-08
Author: yangyan.lee@gmail.com
File Name: evaluation/eval_s3dis.py
Class Name:
Method Name: