5651a0d052bcfd160b187828aa3d8d90652929fe,spacy/tests/doc/test_span_merge.py,,test_span_np_merges,#Any#,69

Before Change


    tokens = en_tokenizer(text)
    doc = get_doc(tokens.vocab, words=[t.text for t in tokens], heads=heads)

    ents = [(e[0].idx, e[-1].idx + len(e[-1]), e.label_, e.lemma_) for e in doc.ents]
    for start, end, label, lemma in ents:
        merged = doc.merge(start, end, tag=label, lemma=lemma, ent_type=label)
        assert merged is not None, (start, end, label, lemma)

    text = "One test with entities like New York City so the ents list is not void"
    heads = [1, 11, -1, -1, -1, 1, 1, -3, 4, 2, 1, 1, 0, -1, -2]

After Change


    tokens = en_tokenizer(text)
    doc = get_doc(tokens.vocab, words=[t.text for t in tokens], heads=heads)
    assert doc[4].head.i == 1
    with doc.retokenize() as retokenizer:
        attrs = {"tag": "NP", "lemma": "tool", "ent_type": "O"}
        retokenizer.merge(doc[2:5], attrs=attrs)
    assert doc[2].head.i == 1

    text = "displaCy is a lightweight and modern dependency parse tree visualization tool built with CSS3 and JavaScript."
    heads = [1, 0, 8, 3, -1, -2, 4, 3, 1, 1, -9, -1, -1, -1, -1, -2, -15]

In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 8

Instances

Link

Project Name: explosion/spaCy

Commit Name: 5651a0d052bcfd160b187828aa3d8d90652929fe

Time: 2019-02-15

Author: ines@ines.io

File Name: spacy/tests/doc/test_span_merge.py

Class Name:

Method Name: test_span_np_merges

Link

Project Name: explosion/spaCy

Commit Name: 5651a0d052bcfd160b187828aa3d8d90652929fe

Time: 2019-02-15

Author: ines@ines.io

File Name: spacy/pipeline/functions.py

Class Name:

Method Name: merge_entities

Link

Project Name: explosion/spaCy

Commit Name: 5651a0d052bcfd160b187828aa3d8d90652929fe

Time: 2019-02-15

Author: ines@ines.io

File Name: spacy/displacy/__init__.py

Class Name:

Method Name: parse_deps