Spaces:
Build error
Build error
#!/usr/bin/env python3 | |
# Copyright 2017-present, Facebook, Inc. | |
# All rights reserved. | |
# | |
# This source code is licensed under the license found in the | |
# LICENSE file in the root directory of this source tree. | |
import os | |
# Package-wide default settings. The CoreNLP classpath default is taken from
# the CLASSPATH environment variable (None when that variable is unset).
DEFAULTS = {'corenlp_classpath': os.environ.get('CLASSPATH')}
def set_default(key, value):
    """Store ``value`` under ``key`` in the module-level ``DEFAULTS`` dict."""
    # The dict is mutated in place (never rebound), so no ``global``
    # declaration is required.
    DEFAULTS.update({key: value})
from .corenlp_tokenizer import CoreNLPTokenizer | |
from .regexp_tokenizer import RegexpTokenizer | |
from .simple_tokenizer import SimpleTokenizer | |
# Spacy is optional | |
try: | |
from .spacy_tokenizer import SpacyTokenizer | |
except ImportError: | |
pass | |
def get_class(name):
    """Return the tokenizer class registered under ``name``.

    Args:
        name: One of 'spacy', 'corenlp', 'regexp' or 'simple'.

    Returns:
        The matching tokenizer class (the class itself, not an instance).

    Raises:
        ImportError: If 'spacy' is requested but ``SpacyTokenizer`` was never
            bound because its optional import failed at module load.
        RuntimeError: If ``name`` is not one of the known tokenizer names.
    """
    if name == 'spacy':
        # SpacyTokenizer only exists when the optional import succeeded;
        # convert the otherwise confusing NameError into an actionable error.
        try:
            return SpacyTokenizer
        except NameError:
            raise ImportError(
                'Tokenizer "spacy" was requested but SpacyTokenizer could '
                'not be imported'
            ) from None
    if name == 'corenlp':
        return CoreNLPTokenizer
    if name == 'regexp':
        return RegexpTokenizer
    if name == 'simple':
        return SimpleTokenizer

    raise RuntimeError('Invalid tokenizer: %s' % name)
def get_annotators_for_args(args):
    """Build the set of annotator names enabled by the flags on ``args``.

    ``args`` must expose ``use_pos``, ``use_lemma`` and ``use_ner``; each
    truthy flag contributes 'pos', 'lemma' or 'ner' respectively.
    """
    flag_to_annotator = (
        ('use_pos', 'pos'),
        ('use_lemma', 'lemma'),
        ('use_ner', 'ner'),
    )
    return {
        annotator
        for flag, annotator in flag_to_annotator
        if getattr(args, flag)
    }
def get_annotators_for_model(model):
    """Return the annotator set derived from the flags in ``model.args``."""
    model_args = model.args
    return get_annotators_for_args(model_args)