2137c84c95286a1c888140cf425c27ff087271bb,solutionbox/structured_data/mltoolbox/_structured_data/preprocess/local_preprocess.py,,run_numerical_categorical_analysis,#Any#Any#,70
Before Change
// label2,count
// ...
// where label1 is the most frequent label, and label2 is the 2nd most, etc.
labels = "\n".join(["%s,%d" % (label, count)
for label, count in sorted(six.iteritems(label_count),
key=lambda x: x[1],
reverse=True)])
file_io.write_string_to_file(
os.path.join(args.output_dir, CATEGORICAL_ANALYSIS_FILE % name),
labels)
After Change
// Write the vocab files. Each label is on its own line.
for name, unique_labels in six.iteritems(categorical_results):
labels = "\n".join(list(unique_labels))
file_io.write_string_to_file(
os.path.join(args.output_dir, CATEGORICAL_ANALYSIS_FILE % name),
labels)
In pattern: SUPERPATTERN
Frequency: 5
Non-data size: 4
Instances Project Name: googledatalab/pydatalab
Commit Name: 2137c84c95286a1c888140cf425c27ff087271bb
Time: 2017-04-21
Author: brandondutra@google.com
File Name: solutionbox/structured_data/mltoolbox/_structured_data/preprocess/local_preprocess.py
Class Name:
Method Name: run_numerical_categorical_analysis
Project Name: CamDavidsonPilon/lifelines
Commit Name: 52f0b3557df5bafee7830e4ac2e04ca7f1a82c37
Time: 2020-07-24
Author: cam.davidson.pilon@gmail.com
File Name: lifelines/fitters/__init__.py
Class Name: ParametricRegressionFitter
Method Name: _create_design_info_and_matrices
Project Name: PyThaiNLP/pythainlp
Commit Name: 02bc05643816935e205611ee95c90fcf057b9cef
Time: 2020-02-09
Author: wannaphong@yahoo.com
File Name: pythainlp/tokenize/etcc.py
Class Name:
Method Name:
Project Name: chartbeat-labs/textacy
Commit Name: 465e3da40350f30c2ef965b72531fb33666fa388
Time: 2019-03-20
Author: burtdewilde@gmail.com
File Name: tests/test_extract.py
Class Name:
Method Name: test_subject_verb_object_triples
Project Name: pytorch/pytorch
Commit Name: 64255294ba92089e2acabde78293e057a1c5d144
Time: 2021-03-08
Author: chenlai@fb.com
File Name: .circleci/cimodel/data/simple/macos_definitions.py
Class Name: MacOsJob
Method Name: gen_tree