1fe319ef49168c2c7c8d10a7c426c1414521d164,cnvlib/tabio/genepred.py,,read_refflat,#Any#Any#Any#,80

Before Change


                               dtype={c: str for c in cols_shared})
    except (pd.parser.CParserError, csv.Error) as err:
        raise ValueError("Unexpected dataframe contents:\n%s\n%s" %
                            (line, next(infile)))

    # Calculate values for output columns
    if exons:

After Change


        cols_rest = ["_start_tx", "_end_tx",  # Transcription
                     "_start_cds", "_end_cds",  # Coding region
                     "_exon_count", "exon_starts", "exon_ends"]
        converters = {"exon_starts": _split_commas, "exon_ends": _split_commas}
    elif cds:
        # Use CDS instead of transcription region
        cols_rest = ["_start_tx", "_end_tx",
                     "start", "end",
                     "_exon_count", "_exon_starts", "_exon_ends"]
    else:
        cols_rest = ["start", "end",
                     "_start_cds", "_end_cds",
                     "_exon_count", "_exon_starts", "_exon_ends"]
    colnames = cols_shared + cols_rest
    usecols = [c for c in colnames if not c.startswith("_")]
    # Parse the file contents
    dframe = pd.read_table(infile,  header=None, na_filter=False,
                           names=colnames, usecols=usecols,
                           dtype={c: str for c in cols_shared},
                           converters=converters)

    # Calculate values for output columns
    if exons:
        dframe = pd.DataFrame.from_records(_split_exons(dframe),
                                           columns=cols_shared + ["start", "end"])
        dframe["start"] = dframe["start"].astype("int")
        dframe["end"] = dframe["end"].astype("int")

    return (dframe.assign(start=dframe.start - 1)
            .sort_values(["chromosome", "start", "end"])
            .reset_index(drop=True))
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 3

Instances


Project Name: etal/cnvkit
Commit Name: 1fe319ef49168c2c7c8d10a7c426c1414521d164
Time: 2016-10-28
Author: eric.talevich@gmail.com
File Name: cnvlib/tabio/genepred.py
Class Name:
Method Name: read_refflat


Project Name: HyperGAN/HyperGAN
Commit Name: fb5a8a3e0a73eea528ac398c04ba20a96ef575e1
Time: 2020-02-17
Author: martyn@255bits.com
File Name: examples/experimental/next-frame.py
Class Name: VideoFrameSampler
Method Name: seed


Project Name: facebookresearch/pytext
Commit Name: bc6e778bc0523f463ae17ffe6f32ce2c3ff4e7b4
Time: 2019-03-12
Author: snl@fb.com
File Name: pytext/data/test/tensorizers_test.py
Class Name: TensorizersTest
Method Name: test_create_byte_tensors