|
|
|
@ -1,20 +1,10 @@
|
|
|
|
|
# scripts
# Each constant below holds a bare script file name (no directory component).
# NOTE(review): how these names are resolved to full paths is not visible in
# this part of the file — confirm against the code that consumes them.
|
|
|
|
|
MWE_EXTRACTION_SCRIPT_NAME = 'wani.py'
|
|
|
|
|
STRUCTURE_ASSIGNMENT_SCRIPT_NAME = 'assign_structures.py'
|
|
|
|
|
STRUCTURE_CREATION_SCRIPT_NAME = 'create_structures.py'
|
|
|
|
|
DICTIONARY_MERGE_SCRIPT_NAME = 'merge_dictionaries.py'
|
|
|
|
|
|
|
|
|
|
# resources
# Each constant below is a relative path starting with '../resources/'.
# NOTE(review): the directory these paths are resolved against is not defined
# here — presumably the directory containing this module; confirm.
# The base names (dict.xml, structures.xsd, monolingual_dictionaries.xsd) are
# the same strings used as the FILE_MAP values for the 'dict',
# 'structure-schema' and 'dictionary-schema' keys.
|
|
|
|
|
TRANSLATION_FILE_NAME = '../resources/dict.xml'
|
|
|
|
|
STRUCTURE_SCHEMA_FILE_NAME = '../resources/structures.xsd'
|
|
|
|
|
DICTIONARY_SCHEMA_FILE_NAME = '../resources/monolingual_dictionaries.xsd'
|
|
|
|
|
|
|
|
|
|
# temporary outputs
|
|
|
|
|
FILE_MAP = {'strings-list': 'strings.txt',
|
|
|
|
|
'obeliks-tokenised': 'obeliks_raw.conllu',
|
|
|
|
|
'obeliks-tweaked': 'obeliks_tweaked.conllu',
|
|
|
|
|
'classla-parsed': 'classla_raw.conllu',
|
|
|
|
|
'classla-translated': 'classla_translated.conllu',
|
|
|
|
|
'dict': 'dict.xml',
|
|
|
|
|
'structure-schema': 'structures.xsd',
|
|
|
|
|
'tei-initial': 'tei_initial.xml',
|
|
|
|
|
'tei-single': 'tei_single.xml',
|
|
|
|
|
'tei-single-ids': 'tei_single_with_ids.xml',
|
|
|
|
@ -27,7 +17,8 @@ FILE_MAP = {'strings-list': 'strings.txt',
|
|
|
|
|
'structures-new': 'structures_new.xml',
|
|
|
|
|
'dictionary-single': 'dictionary_single.xml',
|
|
|
|
|
'dictionary-multiple': 'dictionary_multiple.xml',
|
|
|
|
|
'dictionary': 'dictionary.xml'
|
|
|
|
|
'dictionary': 'dictionary.xml',
|
|
|
|
|
'dictionary-schema': 'monolingual_dictionaries.xsd'
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
NLP_CONFIG_MAP = {
|
|
|
|
|