4a1b752726028f02bd04fc7b766b048a859e7f97,deepchem/models/tests/test_api.py,TestModelAPI,test_singletask_sklearn_rf_ECFP_regression_sharded_API,#TestModelAPI#,113
Before Change
task_type = "regression"
task_types = {task: task_type for task in tasks}
input_file = "../../../datasets/pdbbind_core_df.pkl.gz"
train_dataset , test_dataset, _, transformers = self._featurize_train_test_split(
splittype, featurizers, input_transformers, output_transformers,
input_file, tasks, shard_size=50)
// We set shard size above to force the creation of multiple shards of the data.
After Change
tasks = ["label"]
task_type = "regression"
task_types = {task: task_type for task in tasks}
input_file = os.path.join(
self.current_dir, "../../../datasets/pdbbind_core_df.pkl.gz")
featurizer = DataFeaturizer(tasks=tasks,
smiles_field=self.smiles_field,
featurizers=featurizers,
verbosity="low")
dataset = featurizer.featurize(input_file, self.data_dir)
splitter = ScaffoldSplitter()
train_dataset, test_dataset = splitter.train_test_split(
dataset, self.train_dir, self.test_dir)
//train_dataset, test_dataset, _, transformers = self._featurize_train_test_split(
// splittype, featurizers, input_transformers, output_transformers,
// input_file, tasks, shard_size=50)
input_transformers = []
In pattern: SUPERPATTERN
Frequency: 4
Non-data size: 18
Instances Project Name: deepchem/deepchem
Commit Name: 4a1b752726028f02bd04fc7b766b048a859e7f97
Time: 2016-05-29
Author: bharath.ramsundar@gmail.com
File Name: deepchem/models/tests/test_api.py
Class Name: TestModelAPI
Method Name: test_singletask_sklearn_rf_ECFP_regression_sharded_API
Project Name: deepchem/deepchem
Commit Name: 4a1b752726028f02bd04fc7b766b048a859e7f97
Time: 2016-05-29
Author: bharath.ramsundar@gmail.com
File Name: deepchem/models/tests/test_api.py
Class Name: TestModelAPI
Method Name: test_singletask_sklearn_rf_RDKIT_descriptor_regression_API
Project Name: deepchem/deepchem
Commit Name: 4a1b752726028f02bd04fc7b766b048a859e7f97
Time: 2016-05-29
Author: bharath.ramsundar@gmail.com
File Name: deepchem/models/tests/test_api.py
Class Name: TestModelAPI
Method Name: test_singletask_tf_mlp_ECFP_classification_API
Project Name: deepchem/deepchem
Commit Name: ee2bc2a8daaba5717e49917831ddf8229d1ebe70
Time: 2016-05-30
Author: bharath.ramsundar@gmail.com
File Name: deepchem/models/tests/test_api.py
Class Name: TestModelAPI
Method Name: test_singletask_sklearn_rf_ECFP_regression_API