-
Notifications
You must be signed in to change notification settings - Fork 0
/
Velez_assess_wordlist_vs_Lasla.rq
55 lines (53 loc) · 2.19 KB
/
Velez_assess_wordlist_vs_Lasla.rq
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
###############################################
# TITLE: Velez's Dictionary Assessment: wordlist vs. Lasla
# DESCRIPTION: For each part of speech, counts how many of the most frequent lemmas in the LASLA corpus (more than 260 occurrences, roughly the top 1000) are headwords in Velez's dictionary, next to the total number of such lemmas.
###############################################
PREFIX powla: <http://purl.org/powla/powla.owl#>
PREFIX xsd:<http://www.w3.org/2001/XMLSchema#>
PREFIX lila: <http://lila-erc.eu/ontologies/lila/>
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
PREFIX lime: <http://www.w3.org/ns/lemon/lime#>
PREFIX ontolex: <http://www.w3.org/ns/lemon/ontolex#>
# Result: one row per part-of-speech label with
#   ?VelezTotal - high-frequency LASLA lemmas that are canonical forms of
#                 entries in the Velez lexicon (0 when none are covered)
#   ?LaslaTotal - all high-frequency LASLA lemmas with that part of speech
# "High-frequency" means the lemma is attached to more than 260 distinct
# tokens of the LASLA corpus (the original note puts this at about 1012 lemmas).
SELECT ?partofspeech (COALESCE(?VelezCount, 0) AS ?VelezTotal) ?LaslaTotal
WHERE
{
  {
    # Baseline: number of high-frequency LASLA lemmas per part of speech.
    SELECT ?partofspeech (COUNT(?lemma) AS ?LaslaTotal)
    WHERE
    {
      {
        # One row per (lemma, part-of-speech label) that passes the threshold.
        SELECT ?lemma ?partofspeech
        WHERE
        {
          ?t a powla:Terminal ; lila:hasLemma ?lemma .
          ?t powla:hasLayer/powla:hasDocument/^powla:hasSubDocument <http://lila-erc.eu/data/corpora/Lasla/id/corpus> .
          ?lemma lila:hasPOS ?UPOS .
          ?UPOS rdfs:label ?partofspeech .
        }
        GROUP BY ?lemma ?partofspeech
        # Count distinct tokens so that any join fan-out cannot inflate the
        # frequency and let a lemma pass the threshold by accident.
        HAVING (COUNT(DISTINCT ?t) > 260)
      }
    }
    GROUP BY ?partofspeech
  }
  # OPTIONAL (rather than UNION) puts both totals on the same row and keeps
  # parts of speech for which the dictionary covers no frequent lemma.
  OPTIONAL
  {
    # Same frequency test, restricted to lemmas that are canonical forms of
    # Velez lexicon entries.
    SELECT ?partofspeech (COUNT(?V_lemma) AS ?VelezCount)
    WHERE
    {
      {
        SELECT ?V_lemma ?partofspeech
        WHERE
        {
          ?t a powla:Terminal ; lila:hasLemma ?V_lemma .
          ?t powla:hasLayer/powla:hasDocument/^powla:hasSubDocument <http://lila-erc.eu/data/corpora/Lasla/id/corpus> .
          ?V_lemma lila:hasPOS ?UPOS .
          ?UPOS rdfs:label ?partofspeech .
          <http://lila-erc.eu/data/lexicalResources/LatinPortuguese/Velez/Lexicon> lime:entry ?lexentry .
          ?lexentry ontolex:canonicalForm ?V_lemma .
        }
        GROUP BY ?V_lemma ?partofspeech
        # Several dictionary entries may share one lemma; DISTINCT keeps each
        # token counted once no matter how many entries match.
        HAVING (COUNT(DISTINCT ?t) > 260)
      }
    }
    GROUP BY ?partofspeech
  }
}
ORDER BY ?partofspeech