dd2eaf6c174fdd757514bc06d1063e5f9c6bb4a0,torchnlp/samplers/bucket_batch_sampler.py,BucketBatchSampler,__iter__,#BucketBatchSampler#,90
Before Change
yield batch
if self.biggest_batches_first is None:
return get_batches()
else:
batches = list(get_batches())
biggest_batches = heapq.nlargest(
5,
range(len(batches)),
key=lambda i: sum([self.biggest_batches_first(self.data[j]) for j in batches[i]]))
front = [batches[i] for i in biggest_batches]
// Remove ``biggest_batches`` from data
for i in sorted(biggest_batches, reverse=True):
batches.pop(i)
// Move them to the front
batches[0:0] = front
return iter(batches)
def __len__(self):
if self.drop_last:
return len(self.data) // self.batch_size
else:
After Change
sorted_sampler = SortedSampler(bucket, self.sort_key)
for batch in SubsetRandomSampler(
list(BatchSampler(sorted_sampler, self.batch_size, self.drop_last))):
yield [bucket[i] for i in batch]
def __len__(self):
if self.drop_last:
return len(self.sampler) // self.batch_size
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 3
Instances Project Name: PetrochukM/PyTorch-NLP
Commit Name: dd2eaf6c174fdd757514bc06d1063e5f9c6bb4a0
Time: 2019-10-20
Author: petrochukm@gmail.com
File Name: torchnlp/samplers/bucket_batch_sampler.py
Class Name: BucketBatchSampler
Method Name: __iter__
Project Name: dgasmith/opt_einsum
Commit Name: 589950b1125c4561b3ec7480cc1f71bfb85249a8
Time: 2018-08-20
Author: fritzo@uber.com
File Name: opt_einsum/backends/shared.py
Class Name:
Method Name: handle_sharing
Project Name: biocore/scikit-bio
Commit Name: e17cfdf50ab43846175416f0d8f9032a4d4a6f6e
Time: 2014-03-24
Author: mcdonadt@colorado.edu
File Name: skbio/core/tree.py
Class Name: TreeNode
Method Name: tips