-
Notifications
You must be signed in to change notification settings - Fork 0
/
stats.xml
99 lines (99 loc) · 7.25 KB
/
stats.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
<?xml version="1.0" encoding="UTF-8"?>
<treebank>
<!-- "tokens" means surface tokens, e.g. Spanish "vámonos" counts as one token.
"words" means syntactic words, e.g. Spanish "vámonos" is split into two words, "vamos" and "nos".
"fused" is the number of tokens that are split into two or more syntactic words.
The words and fused elements can be omitted if no token is split into smaller syntactic words. -->
<size>
<total><sentences>20</sentences><tokens>170</tokens><words>170</words><fused>0</fused></total>
<train><sentences>0</sentences><tokens>0</tokens><words>0</words><fused>0</fused></train>
<dev><sentences>0</sentences><tokens>0</tokens><words>0</words><fused>0</fused></dev>
<test><sentences>20</sentences><tokens>170</tokens><words>170</words><fused>0</fused></test>
</size>
<lemmas unique="108" /><!-- ., ,, jis, Pīters, i, ?, tu, Mareja, byut, ni, voi, -, bet, es, jei -->
<forms unique="117" /><!-- ., ,, i, ?, jis, tu, Pītera, ir, ni, voi, Mareja, Pīters, bet, jei, ka -->
<fusions unique="0" /><!-- -->
<!-- Statistics of universal POS tags. The comments show the most frequent lemmas. -->
<tags unique="12">
<tag name="ADJ">5</tag><!-- foršs, lels, mozs, sorkons, tovejs -->
<tag name="ADP">3</tag><!-- deļ, iz, nu -->
<tag name="ADV">8</tag><!-- kai, kod, leidza, mudri, partū, puoruok, tod, vakar -->
<tag name="CCONJ">10</tag><!-- i, bet, ni, voi -->
<tag name="DET">6</tag><!-- itei, kaids, muns, sova, sovs, tei -->
<tag name="NOUN">27</tag><!-- mašyna, viestule, bronza, bruoļs, draudzine, dzeršona, dīna, golvyspiļsāta, jausma, kruosa -->
<tag name="PART">5</tag><!-- voi, koč, ni, tik -->
<tag name="PRON">20</tag><!-- jis, tu, es, jei, tys, jī, kas, kurs -->
<tag name="PROPN">15</tag><!-- Pīters, Mareja, Brauna, Džeina, Fraņceja, Igvasu, Parize, Sems, Smits -->
<tag name="PUNCT">33</tag><!-- ., ,, ?, -, ! -->
<tag name="SCONJ">3</tag><!-- ka, nakai -->
<tag name="VERB">35</tag><!-- byut, navarēt, tikt, apgrīzt, apsaskaut, atmest, attaiseit, atīt, ceņstīs, dabuot -->
</tags>
<!-- Statistics of features and values. The comments show the most frequent word forms. -->
<feats unique="37">
<feat name="Aspect" value="Perf" upos="VERB">1</feat><!-- pīguoduota -->
<feat name="Case" value="Acc" upos="NOUN,PRON">16</feat><!-- mašynu, bronzu, dzeršonu, kuo, lūgu, motus, peipiešonu, ritini, statini, sudobru -->
<feat name="Case" value="Dat" upos="DET,NOUN,PRON">8</feat><!-- Jai, Jim, Maņ, draudzinei, jam, sovai, sovam, veiram -->
<feat name="Case" value="Gen" upos="DET,NOUN,PRON,PROPN">11</feat><!-- Pītera, Braunys, Fraņcejis, Marejis, Smita, jausmys, juo, kaida, īmesļa -->
<feat name="Case" value="Loc" upos="ADJ,DET,NOUN,PROPN">6</feat><!-- Parizē, dīnā, golvyspiļsātā, kruosā, sorkonā, tamā -->
<feat name="Case" value="Nom" upos="ADJ,DET,NOUN,PRON,PROPN,VERB">31</feat><!-- jis, tu, Mareja, Pīters, jei, Džeina, Es, Itei, Meitine, Muns -->
<feat name="Case" value="Voc" upos="PROPN">1</feat><!-- Sem -->
<feat name="Definite" value="Def" upos="ADJ">1</feat><!-- tovejais -->
<feat name="Definite" value="Ind" upos="ADJ,VERB">5</feat><!-- foršuoks, lela, moza, pīguoduota, sorkonā -->
<feat name="Degree" value="Cmp" upos="ADJ">1</feat><!-- foršuoks -->
<feat name="Degree" value="Pos" upos="ADJ,ADV,VERB">6</feat><!-- lela, moza, mudri, pīguoduota, sorkonā, tovejais -->
<feat name="Evident" value="Fh" upos="VERB">26</feat><!-- ir, pīraksteja, Navarēja, apsaskuove, ceņtēs, dabuoja, dūmoj, gribi, izauga, leist -->
<feat name="Gender" value="Fem" upos="ADJ,DET,NOUN,PRON,PROPN,VERB">33</feat><!-- Mareja, jei, mašynu, Braunys, Džeina, Fraņcejis, Itei, Jai, Jis, Marejis -->
<feat name="Gender" value="Masc" upos="ADJ,DET,NOUN,PRON,PROPN">33</feat><!-- Pītera, jis, Pīters, Jim, Muns, Sem, Smita, bruoļs, foršuoks, jam -->
<feat name="Mood" value="Imp" upos="VERB">1</feat><!-- attaisi -->
<feat name="Mood" value="Ind" upos="VERB">26</feat><!-- ir, pīraksteja, Navarēja, apsaskuove, ceņtēs, dabuoja, dūmoj, gribi, izauga, leist -->
<feat name="Number" value="Plur" upos="NOUN,PRON">3</feat><!-- Jim, motus, sābri -->
<feat name="Number" value="Sing" upos="ADJ,DET,NOUN,PRON,PROPN,VERB">75</feat><!-- jis, tu, Pītera, Mareja, Pīters, jei, mašynu, Braunys, Džeina, Es -->
<feat name="Person" value="1" upos="PRON,VERB">3</feat><!-- Es, Maņ, navarieju -->
<feat name="Person" value="2" upos="PRON,VERB">9</feat><!-- tu, attaisi, dūmoj, gribi, variesi, verīs -->
<feat name="Person" value="3" upos="DET,PRON,VERB">35</feat><!-- jis, ir, jei, pīraksteja, Itei, Jai, Jim, Navarēja, apsaskuove, ceņtēs -->
<feat name="Polarity" value="Neg" upos="VERB">4</feat><!-- Navarēja, naizdareja, nav, navarieju -->
<feat name="Polarity" value="Pos" upos="VERB">31</feat><!-- ir, pīraksteja, apgrīzt, apsaskuove, atmest, attaisi, atīt, ceņtēs, dabuoja, dūmoj -->
<feat name="Poss" value="Yes" upos="DET">3</feat><!-- Muns, sovai, sovam -->
<feat name="PronType" value="Dem" upos="DET,PRON">4</feat><!-- Itei, tamā, tuo, tū -->
<feat name="PronType" value="Ind" upos="DET">1</feat><!-- kaida -->
<feat name="PronType" value="Prs" upos="DET,PRON">19</feat><!-- jis, tu, jei, Es, Jai, Jim, Maņ, Muns, jam, juo -->
<feat name="PronType" value="Rel" upos="PRON">2</feat><!-- kuo, kurs -->
<feat name="Reflex" value="Yes" upos="VERB">4</feat><!-- apsaskuove, ceņtēs, ruodīs, verīs -->
<feat name="Tense" value="Fut" upos="VERB">1</feat><!-- variesi -->
<feat name="Tense" value="Past" upos="VERB">17</feat><!-- pīraksteja, Navarēja, apsaskuove, ceņtēs, dabuoja, izauga, lyka, naizdareja, navarieju, nūkruosuoja -->
<feat name="Tense" value="Pres" upos="VERB">9</feat><!-- ir, dūmoj, gribi, leist, nav, ruodīs, verīs -->
<feat name="VerbForm" value="Fin" upos="VERB">27</feat><!-- ir, pīraksteja, Navarēja, apsaskuove, attaisi, ceņtēs, dabuoja, dūmoj, gribi, izauga -->
<feat name="VerbForm" value="Inf" upos="VERB">7</feat><!-- apgrīzt, atmest, atīt, izalaseit, nūmozguot, tikt, īt -->
<feat name="VerbForm" value="Part" upos="VERB">1</feat><!-- pīguoduota -->
<feat name="Voice" value="Act" upos="VERB">27</feat><!-- ir, pīraksteja, Navarēja, apsaskuove, attaisi, ceņtēs, dabuoja, dūmoj, gribi, izauga -->
<feat name="Voice" value="Pass" upos="VERB">1</feat><!-- pīguoduota -->
</feats>
<!-- Statistics of universal dependency relations. -->
<deps unique="25">
<dep name="acl">1</dep>
<dep name="advcl">1</dep>
<dep name="advmod">6</dep>
<dep name="amod">2</dep>
<dep name="appos">1</dep>
<dep name="case">5</dep>
<dep name="cc">10</dep>
<dep name="ccomp">2</dep>
<dep name="conj">10</dep>
<dep name="csubj">1</dep>
<dep name="det">7</dep>
<dep name="discourse">5</dep>
<dep name="fixed">1</dep>
<dep name="flat:name">2</dep>
<dep name="iobj">2</dep>
<dep name="mark">2</dep>
<dep name="nmod">2</dep>
<dep name="nsubj">21</dep>
<dep name="obj">12</dep>
<dep name="obl">10</dep>
<dep name="orphan">3</dep>
<dep name="punct">33</dep>
<dep name="root">20</dep>
<dep name="vocative">1</dep>
<dep name="xcomp">10</dep>
</deps>
</treebank>