2573c649518391ada6214cfc72d20421dfac4072,src/preprocess.py,,get_embeddings,#Any#Any#Any#,194
Before Change
assert word in word2vec
except AssertionError as error:
log.debug(error)
pdb.set_trace()
embeddings[idx] = word2vec[word]
embeddings[vocab.get_token_index("@@PADDING@@")] = 0.
embeddings = torch.FloatTensor(embeddings)
log.info("\tFinished loading embeddings")
After Change
word_v_size, unk_idx = vocab.get_vocab_size("tokens"), vocab.get_token_index(vocab._oov_token)
embeddings = np.random.randn(word_v_size, d_word)  # np.zeros((word_v_size, d_word))
with open(vec_file) as vec_fh:
for line in vec_fh:
word, vec = line.split(" ", 1)
idx = vocab.get_token_index(word)
if idx != unk_idx:
idx = vocab.get_token_index(word)
embeddings[idx] = np.array(list(map(float, vec.split())))
embeddings[vocab.get_token_index("@@PADDING@@")] = 0.
embeddings = torch.FloatTensor(embeddings)
log.info("\tFinished loading embeddings")
return embeddings
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 4
Instances
Project Name: jsalt18-sentence-repl/jiant
Commit Name: 2573c649518391ada6214cfc72d20421dfac4072
Time: 2018-03-16
Author: wang.alex.c@gmail.com
File Name: src/preprocess.py
Class Name:
Method Name: get_embeddings
Project Name: kbardool/keras-frcnn
Commit Name: 6ecffe54690da84be104cbb2ec8a709f6b2a7fd3
Time: 2017-02-03
Author: yannhenon@gmail.com
File Name: data_augment.py
Class Name:
Method Name: augment
Project Name: NifTK/NiftyNet
Commit Name: e9fb47f90dacd64ee9bfe7aafca59b5ff75e739f
Time: 2017-08-13
Author: wenqi.li@ucl.ac.uk
File Name: niftynet/engine/input_buffer.py
Class Name: InputBatchQueueRunner
Method Name: _push