0de3c091c75e36ffb4c12a2048110df37cafb644,src/fonduer/candidates/mentions.py,Ngrams,apply,#Ngrams#Any#,58

Before Change


                            seen.add(ts1)
                            yield ts1
                        ts2 = TemporarySpan(
                            char_start=start + m.end(1), char_end=end, sentence=context
                        )
                        if ts2 not in seen and ts2.get_span():
                            seen.add(ts2)

After Change


                ):
                    text = context.text[start - offsets[0] : end - offsets[0] + 1]
                    # Check splits individually
                    for split_token in self.split_tokens:
                        for word in re.split(split_token, text):
                            ts = TemporarySpan(
                                char_start=text.index(word),
                                char_end=text.index(word) + len(word) - 1,
                                sentence=context,
                            )
                            if ts not in seen and ts.get_span():
                                seen.add(ts)
                                yield ts
                    # And check splits together
                    for word in re.split("|".join(self.split_tokens), text):
                        ts = TemporarySpan(
                            char_start=text.index(word),
                            char_end=text.index(word) + len(word) - 1,
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 4

Instances


Project Name: HazyResearch/fonduer
Commit Name: 0de3c091c75e36ffb4c12a2048110df37cafb644
Time: 2018-09-20
Author: lwhsiao@stanford.edu
File Name: src/fonduer/candidates/mentions.py
Class Name: Ngrams
Method Name: apply


Project Name: nipunsadvilkar/pySBD
Commit Name: 0e364f4b0f70679ca984c0ba5629c569135804a4
Time: 2020-07-26
Author: nipunsadvilkar@gmail.com
File Name: pysbd/segmenter.py
Class Name: Segmenter
Method Name: sentences_with_char_spans


Project Name: graphbrain/graphbrain
Commit Name: e3518ea890e8ec8a8e065b3cd89c14879c68dc63
Time: 2020-08-20
Author: telmo@telmomenezes.net
File Name: graphbrain/agents/system.py
Class Name: System
Method Name: run