xml_schemas/examples/morphological_lexicon/PCR.xml

75 lines
2.8 KiB
XML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<lexicon>
  <!--
    Example lexicon entry for the headword "PCR".
    Cross-references inside this entry are expressed through numeric ids:
    the id lists on <lemma> (orthography, accentuation, pronunciation) name
    the <orthography>, <accentuation> and <pronunciation> elements found
    under <formRepresentations> further down.
  -->
  <entry>
    <head>
      <headword>
        <!--
          pronunciation_ids is a "|"-separated list (32, 33, 34 are the three
          <pronunciation> elements below). hyphenation_ids is empty, matching
          the empty <hyphenationList/> in the body.
        -->
        <lemma orthography_ids="342"
               dynamic_accentuation_ids="81"
               pronunciation_ids="32|33|34"
               hyphenation_ids=""
               tonemic_accentuation_ids="85">PCR</lemma>
      </headword>
      <lexicalUnit sloleksId="LE_c77074df05d2719216d477bd01d418ad" sloleksKey="S_PCR" type="single">
        <lexeme lexical_unit_lexeme_id="83224">PCR</lexeme>
      </lexicalUnit>
      <grammar>
        <!-- "samostalnik" is Slovene for "noun"; the UD tag on the word form below is NOUN. -->
        <category>samostalnik</category>
        <subcategory type="pronunciation">acronym</subcategory>
        <grammarFeature name="type">common</grammarFeature>
        <grammarFeature name="gender">masculine</grammarFeature>
      </grammar>
      <!-- Entry-level frequency; per-form frequencies are given on each <orthography>. -->
      <measureList>
        <measure type="frequency" source="Gigafida 2.0">285818</measure>
      </measureList>
      <relatedEntryList/>
    </head>
    <body>
      <wordFormList>
        <!-- The only word form listed here: nominative singular. -->
        <wordForm id="333330">
          <msd language="sl" system="JOS">Somei</msd>
          <!-- NOTE(review): "NOUN|..." looks like a truncated placeholder for the full UD feature string; confirm. -->
          <msd language="en" system="UD">NOUN|...</msd>
          <grammarFeatureList>
            <grammarFeature name="number">singular</grammarFeature>
            <grammarFeature name="case">nominative</grammarFeature>
          </grammarFeatureList>
          <formRepresentations>
            <orthographyList>
              <!-- id 342 is the orthography referenced by <lemma> and by both accentuations. -->
              <orthography id="342" morphologyPatterns="Sm.5.1.o">
                <form>PCR</form>
                <measureList>
                  <measure type="frequency" source="Gigafida 2.0">813</measure>
                  <measure type="frequency" source="GOS 1.0">432</measure>
                </measureList>
              </orthography>
            </orthographyList>
            <accentuationList type="dynamic">
              <accentuation id="81" orthography_id="342" accentuationPatterns="cjvt:no_accentuation"/>
            </accentuationList>
            <accentuationList type="tonemic">
              <accentuation id="85" orthography_id="342" accentuationPatterns="zrc:no_accentuation"/>
            </accentuationList>
            <!--
              Three alternative pronunciations, all tied to dynamic accentuation 81.
              Each carries the same transcription twice: once in IPA, once in SAMPA.
              NOTE(review): every pronunciation measure below uses source="XXX" and
              the value 7777, which look like placeholders; confirm before relying on them.
            -->
            <pronunciationList>
              <pronunciation id="32" dynamic_accentuation_id="81" type="slovene_spelling_short" status="preferred">
                <!--
                  The IPA form was garbled (stress marks with the "p" and "r" syllables
                  missing). It is restored here to mirror the SAMPA form on the next line,
                  writing SAMPA "@" as the schwa and SAMPA "r" as the tap used by the
                  other IPA forms in this entry.
                  NOTE(review): verify against the authoritative lexicon data.
                -->
                <form script="IPA">ˈpəˈtsəˈɾə</form>
                <form script="SAMPA">"p@"ts@"r@</form>
                <measureList>
                  <measure type="frequency" source="XXX">7777</measure>
                </measureList>
              </pronunciation>
              <pronunciation id="33" dynamic_accentuation_id="81" type="slovene_spelling_long">
                <!--
                  NOTE(review): the last syllable has a short vowel in the IPA form but a
                  long one ("E:") in the SAMPA form; one of the two is presumably wrong.
                  Left unchanged because the intended length cannot be determined here.
                -->
                <form script="IPA">ˈpeːˈʦeːˈɛɾ</form>
                <form script="SAMPA">"pe:"tse:"E:r</form>
                <measureList>
                  <measure type="frequency" source="XXX">7777</measure>
                </measureList>
              </pronunciation>
              <pronunciation id="34" dynamic_accentuation_id="81" type="english_spelling">
                <form script="IPA">ˈpiːˈsiːˈaːɾ</form>
                <form script="SAMPA">"pi:"si:"a:r</form>
                <measureList>
                  <measure type="frequency" source="XXX">7777</measure>
                </measureList>
              </pronunciation>
            </pronunciationList>
            <hyphenationList/>
          </formRepresentations>
        </wordForm>
      </wordFormList>
    </body>
  </entry>
</lexicon>