From 46f3c82f7a5adae37ad7a53751f2a04564ec0954 Mon Sep 17 00:00:00 2001 From: voje Date: Tue, 29 Jan 2019 08:53:23 +0100 Subject: [PATCH] replicated Nikola's results --- tools/srl-20131216/scripts/learn_mod.sh | 38 ++++++++++++++++++++ tools/srl-20131216/scripts/parse_srl_only.sh | 6 ++-- 2 files changed, 41 insertions(+), 3 deletions(-) create mode 100644 tools/srl-20131216/scripts/learn_mod.sh diff --git a/tools/srl-20131216/scripts/learn_mod.sh b/tools/srl-20131216/scripts/learn_mod.sh new file mode 100644 index 0000000..d706ad7 --- /dev/null +++ b/tools/srl-20131216/scripts/learn_mod.sh @@ -0,0 +1,38 @@ +#!/bin/sh + +## There are three sets of options that need, may need to, and could be changed. +## (1) deals with input and output. You have to set these (in particular, you need to provide a training corpus) +## (2) deals with the jvm parameters and may need to be changed +## (3) deals with the behaviour of the system + +## For further information on switches, see the source code, or run +## java -cp srl.jar se.lth.cs.srl.Learn --help + +################################################## +## (1) The following needs to be set appropriately +################################################## +CORPUS=./../../data/sl.train.mate +Lang="ger" +MODEL="srl-$Lang.model" + +################################################## +## (2) These ones may need to be changed +################################################## +JAVA="java" #Edit this if you want to use a specific java binary. +MEM="4g" #Memory for the JVM, might need to be increased for large corpora. +CP="srl.jar:lib/liblinear-1.51-with-deps.jar" +JVM_ARGS="-cp $CP -Xmx$MEM" + +################################################## +## (3) The following changes the behaviour of the system +################################################## +#LLBINARY="-llbinary /home/anders/liblinear-1.6/train" #Path to locally compiled liblinear. Uncomment this and correct the path if you have it. 
This will make training models faster (30-40%). The models come out slightly different from the Java version, though, due to floating-point arithmetic. +#RERANKER="-reranker" #Uncomment this if you want to train a reranker too. This takes about 8 times longer than the simple pipeline. + + +#Execute +CMD="$JAVA $JVM_ARGS se.lth.cs.srl.Learn $Lang $CORPUS $MODEL $RERANKER $LLBINARY" +echo "Executing: $CMD" + +$CMD + diff --git a/tools/srl-20131216/scripts/parse_srl_only.sh b/tools/srl-20131216/scripts/parse_srl_only.sh index e880049..1147217 100644 --- a/tools/srl-20131216/scripts/parse_srl_only.sh +++ b/tools/srl-20131216/scripts/parse_srl_only.sh @@ -11,9 +11,9 @@ ################################################## ## (1) The following needs to be set appropriately ################################################## -INPUT=~/corpora/conll09/spa/CoNLL2009-ST-evaluation-Spanish-SRLonly.txt -Lang="spa" -MODEL="./srl-spa.model" +INPUT=./../../data/sl.test.mate +Lang="ger" +MODEL="./srl-ger.model" OUTPUT="${Lang}-eval.out" ##################################################