6a0b1657c0b5619c8360f40e735253fa39e4e55a,tensorflow_datasets/summarization/gigaword.py,Gigaword,_split_generators,#Gigaword#Any#,83

Before Change


        _DOCUMENT: os.path.join(gigaword_path, "Giga/input.txt"),
        _SUMMARY: os.path.join(gigaword_path, "Giga/task1_ref0.txt")
    }
    return [
        tfds.core.SplitGenerator(
            name=tfds.Split.TRAIN,
            gen_kwargs={"path": train_path},
        ),
        tfds.core.SplitGenerator(
            name=tfds.Split.TEST,
            gen_kwargs={"path": test_path},
        ),
    ]

  def _generate_examples(self, path=None):
    Yields examples.
    with tf.io.gfile.GFile(path[_DOCUMENT]) as f_d, tf.io.gfile.GFile(

After Change


    Returns SplitGenerators.
    dl_path = dl_manager.download_and_extract(_URL)
    pattern = os.path.join(dl_path, "org_data", "%s.%s.txt")
    return [
        tfds.core.SplitGenerator(
            name=tfds.Split.TRAIN,
            gen_kwargs={
                "src_path": pattern % ("train", "src"),
                "tgt_path": pattern % ("train", "tgt")
            },
        ),
        tfds.core.SplitGenerator(
            name=tfds.Split.VALIDATION,
            gen_kwargs={
                "src_path": pattern % ("dev", "src"),
                "tgt_path": pattern % ("dev", "tgt")
            },
        ),
        tfds.core.SplitGenerator(
            name=tfds.Split.TEST,
            gen_kwargs={
                "src_path": pattern % ("test", "src"),
                "tgt_path": pattern % ("test", "tgt")
            },
        ),
    ]

  def _generate_examples(self, src_path=None, tgt_path=None):
    Yields examples.
    with tf.io.gfile.GFile(src_path) as f_d, tf.io.gfile.GFile(tgt_path) as f_s:
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 7

Instances


Project Name: tensorflow/datasets
Commit Name: 6a0b1657c0b5619c8360f40e735253fa39e4e55a
Time: 2019-10-24
Author: yaozhaoyz@google.com
File Name: tensorflow_datasets/summarization/gigaword.py
Class Name: Gigaword
Method Name: _split_generators


Project Name: tensorflow/datasets
Commit Name: 6a0b1657c0b5619c8360f40e735253fa39e4e55a
Time: 2019-10-24
Author: yaozhaoyz@google.com
File Name: tensorflow_datasets/summarization/gigaword.py
Class Name: Gigaword
Method Name: _split_generators


Project Name: tensorflow/datasets
Commit Name: ecf2583ed663faa52da43a058189c799392e6502
Time: 2019-04-01
Author: navinmohan81@gmail.com
File Name: tensorflow_datasets/image/scene_parse_150.py
Class Name: SceneParse150
Method Name: _split_generators


Project Name: tensorflow/datasets
Commit Name: 37b144737c6d068368328fbd4e102a20df98b865
Time: 2019-06-06
Author: pierrot@google.com
File Name: tensorflow_datasets/testing/test_utils.py
Class Name: DummyDatasetSharedGenerator
Method Name: _split_generators