|
|
|
@ -24,16 +24,19 @@ XML_ID_PREFIX = 's'
|
|
|
|
|
|
|
|
|
|
# Root directory of external resources; assigned by initialise() from
# argument_map['resource_dir'] and used there to locate the 'classla' models.
resource_directory = None
|
|
|
|
|
# Scratch directory for intermediate files; assigned by initialise() from
# argument_map['temp_dir'], which also deletes and recreates it.
tmp_directory = None
|
|
|
|
|
# Shared classla pipeline for language code 'sl'; built once by initialise().
nlp = None
|
|
|
|
|
|
|
|
|
|
def __get_tmp_file_name(file_name):
    """Return the path of ``file_name`` inside the module's temporary directory.

    The path is the module-level ``tmp_directory`` and ``file_name`` joined
    with a forward slash.
    """
    path_parts = (tmp_directory, file_name)
    return '/'.join(path_parts)
|
|
|
|
|
|
|
|
|
|
def initialise(**argument_map):
    """Set up the module-level directories and the shared classla pipeline.

    Keyword arguments:
        temp_dir: directory for intermediate files. Any existing directory
            at this path is removed and an empty one is created.
        resource_dir: directory containing the ``classla`` models folder.

    Raises:
        KeyError: if ``temp_dir`` or ``resource_dir`` is not supplied.
    """
    # One declaration covers every module-level name rebound below.
    global tmp_directory, resource_directory, nlp

    tmp_directory = argument_map['temp_dir']
    resource_directory = argument_map['resource_dir']

    # Start from an empty temp directory; a missing directory is not an error.
    shutil.rmtree(tmp_directory, ignore_errors=True)
    os.makedirs(tmp_directory, exist_ok=True)

    # Build the pipeline once here so later calls can reuse it.
    NLP_CONFIG_MAP['models_dir'] = resource_directory + '/classla'
    nlp = classla.Pipeline('sl', **NLP_CONFIG_MAP)
|
|
|
|
|
|
|
|
|
|
def import_string_file(file_name):
    """Copy ``file_name`` into the temporary directory as the string list file.

    The destination name is ``STRING_LIST_FILE_NAME`` inside the module's
    temporary directory.
    """
    destination = __get_tmp_file_name(STRING_LIST_FILE_NAME)
    shutil.copyfile(file_name, destination)
|
|
|
|
@ -54,8 +57,6 @@ def do_parse():
|
|
|
|
|
doc = Document(text=None)
|
|
|
|
|
conll_file = CoNLLFile(filename=input_file_name)
|
|
|
|
|
doc.conll_file = conll_file
|
|
|
|
|
NLP_CONFIG_MAP['models_dir'] = resource_directory + '/classla'
|
|
|
|
|
nlp = classla.Pipeline('sl', **NLP_CONFIG_MAP)
|
|
|
|
|
result = nlp(doc)
|
|
|
|
|
result.conll_file.write_conll(output_file_name)
|
|
|
|
|
|
|
|
|
|