f8df6021a1343d511d4c9b4c108ec5b683ce5487,modAL/batch.py,,ranked_batch,#Any#Any#Any#Any#,103

Before Change



    // Add uncertainty scores to our unlabeled data, and keep a copy of our unlabeled data.
    unlabeled_uncertainty = np.concatenate((unlabeled, np.expand_dims(uncertainty_scores, axis=1)), axis=1)
    unlabeled_uncertainty_copy = np.copy(unlabeled_uncertainty)

    // Define our record container and the maximum number of records to sample.
    instance_index_ranking = []
    ceiling = np.minimum(unlabeled.shape[0], n_instances)

    // TODO (dataframing) is there a better way to do this? Inherently sequential.
    for _ in range(ceiling):

        // Select the instance from our unlabeled copy that scores highest.
        raw_instance = select_instance(X_training=labeled, X_uncertainty=unlabeled_uncertainty_copy)
        instance = np.expand_dims(raw_instance, axis=1)

        // Find our record's index in both the original unlabeled and our uncertainty copy.
        instance_index_original = np.where(np.all(unlabeled == raw_instance, axis=1))[0][0]
        instance_index_copy = np.where(np.all(unlabeled_uncertainty_copy[:, :-1] == instance.T, axis=1))[0][0]

        // Add the instance we've considered for labeling to our labeled set. Although we don't
        // know its label, we want further iterations to consider the newly-added instance so
        // that we don't query the same instance redundantly.

After Change


    unlabeled_uncertainty = np.concatenate((unlabeled, expanded_uncertainty_scores), axis=1)

    // Define our null row, which will be filtered during the select_instance call.
    null_row = np.ones(shape=(unlabeled_uncertainty.shape[1],)) * np.nan

    // Define our record container and the maximum number of records to sample.
    instance_index_ranking = []
    ceiling = np.minimum(unlabeled.shape[0], n_instances)

    for _ in range(ceiling):

        // Receive the instance and corresponding index from our unlabeled copy that scores highest.
        instance_index, instance = select_instance(
            X_training=labeled, X_uncertainty=unlabeled_uncertainty
        )

        // Prepare our most informative instance for concatenation.
        expanded_instance = np.expand_dims(instance, axis=0)

        // Add the instance we've considered for labeling to our labeled set. Although we don't
        // know its label, we want further iterations to consider the newly-added instance so
        // that we don't query the same instance redundantly.
        labeled = np.concatenate((labeled, expanded_instance), axis=0)

        // We "remove" our instance from the unlabeled set by setting that row to an array
        // of np.nan and filtering within select_instance.
        unlabeled_uncertainty[instance_index] = null_row

        // Finally, append our instance's index to the bottom of our ranking.
        instance_index_ranking.append(instance_index)

In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 7

Instances

Link

Project Name: modAL-python/modAL

Commit Name: f8df6021a1343d511d4c9b4c108ec5b683ce5487

Time: 2018-08-14

Author: dannyofig@gmail.com

File Name: modAL/batch.py

Class Name:

Method Name: ranked_batch

Link

Project Name: arraiy/torchgeometry

Commit Name: 50839f8ed95147c71f9f045495ed45380a2ce513

Time: 2019-11-19

Author: priba@cvc.uab.cat

File Name: test/color/test_hls.py

Class Name: TestRgbToHls

Method Name: test_nan_rgb_to_hls

Link

Project Name: nilearn/nilearn

Commit Name: d5af4c37893a7ead45a966eb89a3e4018a97e556

Time: 2015-10-06

Author: sb238920@is223297.intra.cea.fr

File Name: nilearn/connectivity/connectivity_matrices.py

Class Name:

Method Name: sym_to_vec