From 3923888172a6d4ec17a5ab288f5e4bd2ed2b59fb Mon Sep 17 00:00:00 2001 From: voje Date: Fri, 19 Apr 2019 07:45:50 +0200 Subject: [PATCH] bug fix: adding _ to adjective headwords --- src/backend_flask/preprocess.py | 3 +++ src/pkg/cjvt-corpusparser | 2 +- src/pkg/valency/valency/Frame.py | 3 ++- 3 files changed, 6 insertions(+), 2 deletions(-) diff --git a/src/backend_flask/preprocess.py b/src/backend_flask/preprocess.py index 4f26474..4057411 100644 --- a/src/backend_flask/preprocess.py +++ b/src/backend_flask/preprocess.py @@ -1,3 +1,6 @@ +# Deprecated: headword creation moved to be part of corpusparser, +# index creation moved to app.py as a preprocessing (with exit) step + CORPORA = ["kres", "ssj"] if __name__ == "__main__": diff --git a/src/pkg/cjvt-corpusparser b/src/pkg/cjvt-corpusparser index af4f604..c6b8426 160000 --- a/src/pkg/cjvt-corpusparser +++ b/src/pkg/cjvt-corpusparser @@ -1 +1 @@ -Subproject commit af4f6045bb06d05f932a720f1802062bbdeebeb7 +Subproject commit c6b8426fb30f11f64bccb7f8bf0f1dd367f1a6f2 diff --git a/src/pkg/valency/valency/Frame.py b/src/pkg/valency/valency/Frame.py index 26e099b..dc1148e 100644 --- a/src/pkg/valency/valency/Frame.py +++ b/src/pkg/valency/valency/Frame.py @@ -1,4 +1,5 @@ import logging +from corpusparser import enriched_lemma log = logging.getLogger(__name__) @@ -20,7 +21,7 @@ def frames_from_db_entry(dbent): srldict[key] += [srl] for hwtid, srlarr in srldict.items(): frames += [Frame( - hw_lemma=token_dict[hwtid]["lemma"], + hw_lemma=enriched_lemma(token_dict[hwtid]), tids=[_full_tid(hwtid)], slots=[ Slot(