IssueID #1130: added support for collocation datasets
This commit is contained in:
parent
39b0f6e6b3
commit
41be10e153
|
@ -0,0 +1,84 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Sample collocation dictionary: a single entry for the lemma "absorbirati"
  with two senses. Each sense lists syntactic structures (all named
  "gbz_pp_sbz2" here and distinguished by their "pp" attribute), and every
  structure holds example containers with three-component collocations:
  headword, other, collocate.

  The encoding is declared explicitly because the collocates contain
  non-ASCII characters.

  NOTE(review): the sloleks ids look like placeholder values. "brez" appears
  with two different ids, "iz" reuses one of them, and the collocates
  "zahteve", "prebavila" and "želodca" all share a single id. Confirm the
  ids before relying on this file as reference data.
-->
<dictionary>
  <entry>
    <head>
      <headword>
        <lemma>absorbirati</lemma>
      </headword>
      <lexicalUnit id="294" type="single">
        <lexeme>absorbirati</lexeme>
      </lexicalUnit>
      <grammar>
        <category>glagol</category>
      </grammar>
      <measureList>
        <measure type="frequency" source="Gigafida 1.0">3295</measure>
      </measureList>
    </head>
    <body>
      <senseList>
        <!-- Sense 1: structures with pp="brez" and pp="iz". -->
        <sense id="1">
          <syntacticStructureList>
            <syntacticStructure id="34" name="gbz_pp_sbz2" pp="brez">
              <exampleContainerList>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="1" frequency="5" logDice="2.23">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_4485e634af6a4b16093fe3140632418a">brez</comp>
                    <comp num="3" role="collocate" sloleks="LE_b66fc194167f71cb086b3c0b80820711">težave</comp>
                  </multiwordExample>
                </exampleContainer>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="1" frequency="14" logDice="11.25">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_ba405c6d2b3a4b0cf9f6216af3812c6b">brez</comp>
                    <comp num="3" role="collocate" sloleks="LE_274a6fc240c9e3c4c2dc3e4804a0c11f">zahteve</comp>
                  </multiwordExample>
                </exampleContainer>
              </exampleContainerList>
            </syntacticStructure>
            <syntacticStructure id="34" name="gbz_pp_sbz2" pp="iz">
              <exampleContainerList>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="2" frequency="14" logDice="11.25">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_ba405c6d2b3a4b0cf9f6216af3812c6b">iz</comp>
                    <comp num="3" role="collocate" sloleks="LE_274a6fc240c9e3c4c2dc3e4804a0c11f">prebavila</comp>
                  </multiwordExample>
                </exampleContainer>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="2" frequency="14" logDice="11.25">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_ba405c6d2b3a4b0cf9f6216af3812c6b">iz</comp>
                    <comp num="3" role="collocate" sloleks="LE_274a6fc240c9e3c4c2dc3e4804a0c11f">želodca</comp>
                  </multiwordExample>
                </exampleContainer>
              </exampleContainerList>
            </syntacticStructure>
          </syntacticStructureList>
        </sense>
        <!-- Sense 2: a single structure with pp="brez". -->
        <sense id="2">
          <syntacticStructureList>
            <syntacticStructure id="34" name="gbz_pp_sbz2" pp="brez">
              <exampleContainerList>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="1" frequency="5" logDice="2.23">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_4485e634af6a4b16093fe3140632418a">brez</comp>
                    <comp num="3" role="collocate" sloleks="LE_b66fc194167f71cb086b3c0b80820711">težave</comp>
                  </multiwordExample>
                </exampleContainer>
                <exampleContainer>
                  <multiwordExample type="collocation" cluster="2" frequency="14" logDice="11.25">
                    <comp num="1" role="headword" sloleks="LE_a293f9ab871299f116dff2cc1421367a">absorbirati</comp>
                    <comp num="2" role="other" sloleks="LE_ba405c6d2b3a4b0cf9f6216af3812c6b">brez</comp>
                    <comp num="3" role="collocate" sloleks="LE_274a6fc240c9e3c4c2dc3e4804a0c11f">prebavila</comp>
                  </multiwordExample>
                </exampleContainer>
              </exampleContainerList>
            </syntacticStructure>
          </syntacticStructureList>
        </sense>
      </senseList>
    </body>
  </entry>
</dictionary>
|
52
resources/schema/collocation_dictionary.xsd
Normal file
52
resources/schema/collocation_dictionary.xsd
Normal file
|
@ -0,0 +1,52 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Schema for collocation dictionaries: a "dictionary" root holding any number
  of "entry" elements, each made of a "head" followed by a "body".

  The named types referenced below (statusType, headwordType,
  lexicalUnitType, grammarType, measureListType,
  syntacticStructureListType) are not declared in this file; presumably they
  are supplied by the included inventory.xsd. TODO confirm.
-->
<xsd:schema xmlns:xsd="http://www.w3.org/2001/XMLSchema">

  <!-- Declarations for the xml: namespace. -->
  <xsd:import namespace="http://www.w3.org/XML/1998/namespace" schemaLocation="http://www.w3.org/2001/xml.xsd" />
  <xsd:include schemaLocation="inventory.xsd"/>

  <xsd:element name="dictionary">
    <xsd:complexType>
      <xsd:sequence>
        <!-- A dictionary may be empty or hold an unbounded number of entries. -->
        <xsd:element name="entry" minOccurs="0" maxOccurs="unbounded">
          <xsd:complexType>
            <xsd:sequence>

              <!-- Entry head: only the headword is mandatory. -->
              <xsd:element name="head">
                <xsd:complexType>
                  <xsd:sequence>
                    <xsd:element name="status" type="statusType" minOccurs="0"/>
                    <xsd:element name="headword" type="headwordType"/>
                    <xsd:element name="lexicalUnit" type="lexicalUnitType" minOccurs="0"/>
                    <xsd:element name="grammar" type="grammarType" minOccurs="0"/>
                    <xsd:element name="measureList" type="measureListType" minOccurs="0"/>
                  </xsd:sequence>
                </xsd:complexType>
              </xsd:element>

              <!-- Entry body: a required senseList with zero or more senses. -->
              <xsd:element name="body">
                <xsd:complexType>
                  <xsd:sequence>
                    <xsd:element name="senseList">
                      <xsd:complexType>
                        <xsd:sequence>
                          <xsd:element name="sense" minOccurs="0" maxOccurs="unbounded">
                            <xsd:complexType>
                              <xsd:sequence>
                                <!-- Each sense carries exactly one syntacticStructureList. -->
                                <xsd:element name="syntacticStructureList" type="syntacticStructureListType"/>
                              </xsd:sequence>
                              <!-- Optional integer id of the sense. -->
                              <xsd:attribute name="id" type="xsd:int"/>
                            </xsd:complexType>
                          </xsd:element>
                        </xsd:sequence>
                      </xsd:complexType>
                    </xsd:element>
                  </xsd:sequence>
                </xsd:complexType>
              </xsd:element>

            </xsd:sequence>
          </xsd:complexType>
        </xsd:element>
      </xsd:sequence>
    </xsd:complexType>
  </xsd:element>

</xsd:schema>
|
|
@ -343,9 +343,14 @@
|
|||
|
||||
<!--
  Content model of a single syntactic structure. The body is either a run of
  "component" elements or a run of "exampleContainerList" elements; the two
  kinds cannot be mixed, and either run may be empty.

  "component" is declared only inside the choice. Declaring it a second time
  directly in the sequence ahead of the choice would make the content model
  ambiguous, because a validator could not tell which declaration a given
  "component" element matches.
-->
<xsd:complexType name="syntacticStructureType">
  <xsd:sequence>
    <xsd:choice>
      <xsd:element name="component" type="componentType" minOccurs="0" maxOccurs="unbounded"/>
      <xsd:element name="exampleContainerList" type="exampleContainerListType" minOccurs="0" maxOccurs="unbounded"/>
    </xsd:choice>
  </xsd:sequence>
  <!-- All three attributes are optional. -->
  <xsd:attribute name="id" type="xsd:int"/>
  <xsd:attribute name="name" type="xsd:string"/>
  <xsd:attribute name="pp" type="xsd:string"/>
</xsd:complexType>
|
||||
|
||||
<xsd:complexType name="syntacticStructureListType">
|
||||
|
|
Loading…
Reference in New Issue
Block a user