22a7e3b66d306446852063a0a5320a30667c57dd,tmtoolkit/preprocess/_tmpreproc.py,TMPreproc,remove_tokens_by_doc_frequency,#TMPreproc#Any#Any#Any#,1300
Before Change
if blacklist:
self._invalidate_workers_tokens()
logger.debug("will remove the following %d tokens: %s" % (len(blacklist), blacklist))
self._send_task_to_workers("filter_tokens",
search_tokens=blacklist,
match_type="exact",
ignore_case=False,
After Change
df_threshold=df_threshold, absolute=absolute, return_mask=True)
if sum(sum(dmsk) for dmsk in mask) > 0:
self.remove_tokens_by_mask(dict(zip(self._workers_tokens.keys(), mask)) )
return self
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 3
Instances Project Name: WZBSocialScienceCenter/tmtoolkit
Commit Name: 22a7e3b66d306446852063a0a5320a30667c57dd
Time: 2019-11-12
Author: markus.konrad@wzb.eu
File Name: tmtoolkit/preprocess/_tmpreproc.py
Class Name: TMPreproc
Method Name: remove_tokens_by_doc_frequency
Project Name: streamlit/streamlit
Commit Name: cf2e5c02c448c6f25136a4cd1b89e7f0ba1a3d37
Time: 2018-07-06
Author: adrien.g.treuille@gmail.com
File Name: lib/streamlit/config.py
Class Name:
Method Name: get_s3_option
Project Name: streamlit/streamlit
Commit Name: c786913462decebc4157ac3e8d2ec08303021adc
Time: 2018-07-02
Author: adrien.g.treuille@gmail.com
File Name: lib/streamlit/config.py
Class Name:
Method Name: get_s3_option