IssueID #959: tweaked valency schema details

This commit is contained in:
Cyprian Laskowski 2020-02-25 17:02:59 +01:00
parent 1eb865b088
commit 9f1b0580f7
2 changed files with 28 additions and 26 deletions

View File

@ -9,21 +9,23 @@
<lexeme lexical_unit_lexeme_id="317">aktivirati</lexeme>
</lexicalUnit>
<!-- Grammar block: one category plus named grammarFeature values. -->
<grammar>
<!-- Text and attribute values are in Slovenian, but we need some way to switch them to English. -->
<category>glagol</category>
<grammarFeature name="Aspect">biaspectual</grammarFeature>
<grammarFeature name="vid">dvovidski</grammarFeature>
<!-- from Sloleks -->
</grammar>
<!-- Frequency measures; each measure names its corpus in @source. -->
<measureList>
<!-- Values for @source should in principle match the agreements with Tomaž on corpus names, etc. -->
<measure type="frequency" source="Gigafida 2.0">11410</measure>
<!-- from Gigafida -->
<measure type="frequency" source="ssj500k 2.2">5</measure>
<!-- from ssj500k -->
</measureList>
<!-- Classification labels; @type names the classification (Levin_class, Žele_class).
     NOTE(review): feature_id / featureId presumably identify the class within that classification; confirm. -->
<labelList>
<label type="Levin_class" feature_id="55">"begin" verbs</label>
<label type="Levin_class" featureId="55.1">"begin" verbs</label>
<!-- from the Levin classes list http://www-personal.umich.edu/~jlawler/levin.verbs -->
<label type="Žele_class" feature_id="56">glagol ravnanja</label>
<!-- Žele: valency dictionary -->
<label type="Žele_class" featureId="56">glagol ravnanja</label>
<!-- Žele: valency dictionary https://fran.si/209/vezljivostni-slovar/4410086/aktivirati?FilteredDictionaryIds=209&View=1&Query=aktivirati -->
</labelList>
</head>
<body>
@ -31,18 +33,18 @@
<!-- Statistics for the semantic role PAT: a pattern-level and a sentence-level ratio measure.
     NOTE(review): the comments below say "percentage", but values such as 0.37 and 0.19 look like
     fractions rather than percents; confirm the intended unit. -->
<statisticsContainer>
<semanticRole>PAT</semanticRole>
<measureList>
<measure type="valency_pattern_ratio" ratio_base="148">50</measure>
<measure type="valency_pattern_ratio">0.37</measure>
<!-- percentage of patterns in which PAT occurs -->
<measure type="valency_sentence_ratio">100</measure>
<measure type="valency_sentence_ratio">0.19</measure>
<!-- percentage of sentences (in any pattern) in which PAT occurs -->
</measureList>
</statisticsContainer>
<!-- Statistics for the semantic role AIM: a pattern-level and a sentence-level ratio measure.
     NOTE(review): the comments below say "percentage", but values such as 0.81 and 0.1 look like
     fractions rather than percents; confirm the intended unit. -->
<statisticsContainer>
<semanticRole>AIM</semanticRole>
<measureList>
<measure type="valency_pattern_ratio" ratio_base="1">1</measure>
<measure type="valency_pattern_ratio">0.81</measure>
<!-- percentage of patterns in which AIM occurs -->
<measure type="valency_sentence_ratio">100</measure>
<measure type="valency_sentence_ratio">0.1</measure>
<!-- percentage of sentences (in any pattern) in which AIM occurs -->
</measureList>
</statisticsContainer>
@ -69,7 +71,7 @@
<semanticRole>AIM</semanticRole>
<!-- Syntactic structures listed for the semantic role given just before this list.
     Structure 36 carries the component text "za" at index 3.
     NOTE(review): the same component appears under two attribute spellings
     (structure_component_index and num); confirm which one the schema expects. -->
<syntacticStructureList>
<syntacticStructure id="36">
<comp structure_component_index="3">za</comp>
<comp num="3">za</comp>
</syntacticStructure>
</syntacticStructureList>
</semanticRoleContainer>
@ -80,13 +82,12 @@
<corpusExample corpus_id="1" modified="false">
Glede vabe ušata res ni izbirčna
<tree role="AIM">
<comp syntactic_structure_id="36" structure_component_index="3">za</comp>
uspešen
<comp syntactic_structure_id="36" structure_component_index="4">ribolov</comp>
<comp structure_id="36" num="3">za</comp>
<comp structure_id="36" num="4">ribolov</comp>
</tree>
pa
<tree role="PAT">
<comp syntactic_structure_id="8" structure_component_index="4">jo</comp>
<comp structure_id="8" num="4">jo</comp>
</tree>
moramo
<comp role="headword">aktivirati</comp>,
@ -97,13 +98,13 @@
<corpusExample modified="false">
Glede vabe ušata res ni izbirčna
<tree role="AIM">
<comp syntactic_structure_id="36" structure_component_index="3">za</comp>
<comp structure_id="36" num="3">za</comp>
uspešen
<comp syntactic_structure_id="36" structure_component_index="4">ribolov</comp>
<comp structure_id="36" num="4">ribolov</comp>
</tree>
pa
<tree role="PAT">
<comp syntactic_structure_id="8" structure_component_index="4">jo</comp>
<comp structure_id="8" num="4">jo</comp>
</tree>
moramo
<comp role="headword">aktivirati</comp>,
@ -131,7 +132,7 @@
<!-- Syntactic structures 8 and 33. Structure 8 lists no components;
     structure 33 carries the component text "z/s" at index 2.
     NOTE(review): the same component appears under two attribute spellings
     (structure_component_index and num); confirm which one the schema expects. -->
<syntacticStructureList>
<syntacticStructure id="8"/>
<syntacticStructure id="33">
<comp structure_component_index="2">z/s</comp>
<comp num="2">z/s</comp>
</syntacticStructure>
</syntacticStructureList>
</semanticRoleContainer>
@ -140,14 +141,14 @@
<!-- Syntactic structures marked system="JOS": 19 (no components), 36 ("na" and "pred" at index 3),
     33 ("z/s" at index 2) and 34 ("preko" at index 3).
     NOTE(review): each component appears under two attribute spellings
     (structure_component_index and num); confirm which one the schema expects. -->
<syntacticStructureList system="JOS">
<syntacticStructure id="19"/>
<syntacticStructure id="36">
<comp structure_component_index="3">na</comp>
<comp structure_component_index="3">pred</comp>
<comp num="3">na</comp>
<comp num="3">pred</comp>
</syntacticStructure>
<syntacticStructure id="33">
<comp structure_component_index="2">z/s</comp>
<comp num="2">z/s</comp>
</syntacticStructure>
<syntacticStructure id="34">
<comp structure_component_index="3">preko</comp>
<comp num="3">preko</comp>
</syntacticStructure>
</syntacticStructureList>
</semanticRoleContainer>
@ -157,14 +158,14 @@
<exampleContainer>
<corpusExample modified="false">
<tree role="ACT">
<comp syntactic_structure_id="9" structure_component_index="1">Poljubljanje</comp>
<comp structure_id="9" num="1">Poljubljanje</comp>
</tree>
<tree role="MANN">
<comp syntactic_structure_id="19" structure_component_index="1">hitro</comp>
<comp structure_id="19" num="1">hitro</comp>
</tree>
<comp role="headword">aktivira</comp>
<tree role="PAT">
<comp syntactic_structure_id="8" structure_component_index="4">hormon</comp>
<comp structure_id="8" num="4">hormon</comp>
sreče
</tree>
in krepi imunski sistem.

View File

@ -146,6 +146,7 @@
<!-- String content extended with three attributes, none of which declares a `use`:
     feature_id (xsd:int), featureId (xsd:string) and type (xsd:string).
     featureId is typed as a string, so it admits dotted values such as "55.1" that xsd:int would reject.
     NOTE(review): the enclosing type is not visible here; presumably this is the content model of
     the label element. Confirm, and decide whether both feature_id and featureId should remain declared. -->
<xsd:simpleContent>
<xsd:extension base="xsd:string">
<xsd:attribute name="feature_id" type="xsd:int"/>
<xsd:attribute name="featureId" type="xsd:string"/>
<xsd:attribute name="type" type="xsd:string"/>
</xsd:extension>
</xsd:simpleContent>
@ -186,8 +187,8 @@
<xsd:simpleContent>
<xsd:extension base="xsd:string">
<xsd:attribute name="lexical_unit_lexeme_id" type="xsd:int"/>
<xsd:attribute name="syntactic_structure_id" type="xsd:int"/>
<xsd:attribute name="structure_component_index" type="xsd:int"/>
<xsd:attribute name="structure_id" type="xsd:int"/>
<xsd:attribute name="num" type="xsd:int"/>
<xsd:attribute name="lexeme_id" type="xsd:int"/>
<xsd:attribute name="role">
<xsd:simpleType>