2137c84c95286a1c888140cf425c27ff087271bb,solutionbox/structured_data/mltoolbox/_structured_data/preprocess/local_preprocess.py,,run_numerical_categorical_analysis,#Any#Any#,70

Before Change


    # label2,count
    # ...
    # where label1 is the most frequent label, and label2 is the 2nd most, etc.
    labels = "\n".join(["%s,%d" % (label, count)
                        for label, count in sorted(six.iteritems(label_count),
                                                   key=lambda x: x[1],
                                                   reverse=True)])
    file_io.write_string_to_file(
        os.path.join(args.output_dir, CATEGORICAL_ANALYSIS_FILE % name),
        labels)

After Change



  # Write the vocab files. Each label is on its own line.
  for name, unique_labels in six.iteritems(categorical_results):
    labels = "\n".join(list(unique_labels))
    file_io.write_string_to_file(
        os.path.join(args.output_dir, CATEGORICAL_ANALYSIS_FILE % name),
        labels)
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 5

Non-data size: 4

Instances


Project Name: googledatalab/pydatalab
Commit Name: 2137c84c95286a1c888140cf425c27ff087271bb
Time: 2017-04-21
Author: brandondutra@google.com
File Name: solutionbox/structured_data/mltoolbox/_structured_data/preprocess/local_preprocess.py
Class Name:
Method Name: run_numerical_categorical_analysis


Project Name: CamDavidsonPilon/lifelines
Commit Name: 52f0b3557df5bafee7830e4ac2e04ca7f1a82c37
Time: 2020-07-24
Author: cam.davidson.pilon@gmail.com
File Name: lifelines/fitters/__init__.py
Class Name: ParametricRegressionFitter
Method Name: _create_design_info_and_matrices


Project Name: PyThaiNLP/pythainlp
Commit Name: 02bc05643816935e205611ee95c90fcf057b9cef
Time: 2020-02-09
Author: wannaphong@yahoo.com
File Name: pythainlp/tokenize/etcc.py
Class Name:
Method Name:


Project Name: chartbeat-labs/textacy
Commit Name: 465e3da40350f30c2ef965b72531fb33666fa388
Time: 2019-03-20
Author: burtdewilde@gmail.com
File Name: tests/test_extract.py
Class Name:
Method Name: test_subject_verb_object_triples


Project Name: pytorch/pytorch
Commit Name: 64255294ba92089e2acabde78293e057a1c5d144
Time: 2021-03-08
Author: chenlai@fb.com
File Name: .circleci/cimodel/data/simple/macos_definitions.py
Class Name: MacOsJob
Method Name: gen_tree