7247571ab448f9ccf6b392a26df0b8b40b1085eb,2018-asr-attention/librispeech/full-setup-attention/tools/collect-train-text.py,,,#,4
Before Change
zip_files = ["%s/%s" % (zip_dir, fn) for fn in zip_files]
assert all([os.path])
for fn in sorted(glob("train-*/*/*/*.trans.txt")):
for l in open(fn).read().splitlines():
seq_name, txt = l.split(" ", 1)
print(txt)
After Change
# Print every training transcription found in the LibriSpeech training archives.
# `zip_dir` (the directory holding the archives) is expected to be defined by
# the surrounding code, which is not part of this excerpt.
zip_files = ["train-clean-100.zip", "train-clean-360.zip", "train-other-500.zip"]
zip_files = ["%s/%s" % (zip_dir, fn) for fn in zip_files]
# Fail early if any archive is missing, before opening anything.
assert all([os.path.exists(fn) for fn in zip_files])
zip_files = [ZipFile(fn) for fn in zip_files]
for zip_file in zip_files:
    # Sanity checks: the archive is non-empty and rooted at "LibriSpeech/".
    assert zip_file.filelist
    assert zip_file.filelist[0].filename.startswith("LibriSpeech/")
    for info in zip_file.filelist:
        assert isinstance(info, ZipInfo)
        path = info.filename.split("/")
        assert path[0] == "LibriSpeech", "does not expect %r (%r)" % (info, info.filename)
        # Only entries below a "train-*" sub-directory are of interest.
        if path[1].startswith("train-"):
            subdir = path[1]  # e.g. "train-clean-100"
            if path[-1].endswith(".trans.txt"):
                # Each line is split at the first space into a sequence name
                # and the transcription text; only the text is printed.
                for l in zip_file.read(info).decode("utf8").splitlines():
                    seq_name, txt = l.split(" ", 1)
                    print(txt)
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 6
Instances
Project Name: rwth-i6/returnn-experiments
Commit Name: 7247571ab448f9ccf6b392a26df0b8b40b1085eb
Time: 2018-05-16
Author: zeyer@i6.informatik.rwth-aachen.de
File Name: 2018-asr-attention/librispeech/full-setup-attention/tools/collect-train-text.py
Class Name:
Method Name:
Project Name: kubeflow/kubeflow
Commit Name: d5caf230ff50260c1a6565db35edeeddd5d407e6
Time: 2018-02-08
Author: mitake.hitoshi@gmail.com
File Name: build/boilerplate/boilerplate.py
Class Name:
Method Name: get_refs
Project Name: biotite-dev/biotite
Commit Name: f259c920b941a573451c1a1fe81c407689c5768a
Time: 2018-02-08
Author: patrick.kunzm@gmail.com
File Name: setup.py
Class Name:
Method Name: get_extensions