Source code for sourced.ml.core.extractors.identifiers
from sourced.ml.core.algorithms.token_parser import NoopTokenParser
from sourced.ml.core.algorithms.uast_ids_to_bag import UastIds2Bag
from sourced.ml.core.extractors.bags_extractor import BagsExtractor
from sourced.ml.core.extractors.helpers import register_extractor
@register_extractor
class IdentifiersBagExtractor(BagsExtractor):
    """Bags extractor that builds its bags through a ``UastIds2Bag`` instance.

    The class is passed through the ``register_extractor`` decorator and
    merges the base ``BagsExtractor.OPTS`` into its own ``OPTS`` mapping.
    """

    # NOTE(review): no assignment to ``OPTS`` is visible before this call in
    # this view of the file; presumably the class-level ``OPTS = {...}``
    # definition (and possibly other class attributes) was lost when the
    # source was extracted -- confirm against the upstream module.
    OPTS.update(BagsExtractor.OPTS)

    def __init__(self, docfreq_threshold=None, split_stem=True, **kwargs):
        """Initialize the base extractor and the identifier-to-bag converter.

        :param docfreq_threshold: Forwarded unchanged as the first positional \
                                  argument of ``BagsExtractor.__init__``.
        :param split_stem: When falsy, a ``NoopTokenParser`` is handed to \
                           ``UastIds2Bag``; when truthy, ``None`` is passed \
                           instead (presumably selecting that class's default \
                           token parser -- TODO confirm).
        :param kwargs: Extra keyword arguments forwarded to \
                       ``BagsExtractor.__init__``.
        """
        super().__init__(docfreq_threshold, **kwargs)
        # Only build the no-op parser when it is actually requested.
        token_parser = None if split_stem else NoopTokenParser()
        self.id2bag = UastIds2Bag(None, token_parser)