Help
Difference between revisions of "SPARQL"
Line 10: | Line 10: | ||
'''Javascript:'''<br> | '''Javascript:'''<br> | ||
At least 3 methods exists ([https://jsfiddle.net/hugolpz/tsg9ewa7/4/ code snippet]), example: | At least 3 methods exists ([https://jsfiddle.net/hugolpz/tsg9ewa7/4/ code snippet]), example: | ||
− | {| | + | {| style="width:100%" |
|- | |- | ||
! Query || Result's basic unit | ! Query || Result's basic unit | ||
Line 42: | Line 42: | ||
== ✅ Is Language level ([[Q5]]) → list possible values == | == ✅ Is Language level ([[Q5]]) → list possible values == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 67: | Line 67: | ||
== ✅ Is Sex or Gender([[Q7]]) → list possible values == | == ✅ Is Sex or Gender([[Q7]]) → list possible values == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 93: | Line 93: | ||
== ✅🇶 Is Speaker ([[Q3]]) → list all speakers == | == ✅🇶 Is Speaker ([[Q3]]) → list all speakers == | ||
<!-- Q: add grouping per language ?--> | <!-- Q: add grouping per language ?--> | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 119: | Line 119: | ||
== ✅ Speaker name(s) → Speaker Qid(s) == | == ✅ Speaker name(s) → Speaker Qid(s) == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 146: | Line 146: | ||
== ✅🇶 Speaker Qid ([[Q42]]) → Speaker data == | == ✅🇶 Speaker Qid ([[Q42]]) → Speaker data == | ||
<!-- Q: alternative words for "predicate" and "object". "property" and "value" ?--> | <!-- Q: alternative words for "predicate" and "object". "property" and "value" ?--> | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 173: | Line 173: | ||
== ✅🇶 Speaker Qid ([[Q42]]) → Speaker data → Speaker languages ([[Property:P4|P4]]) == | == ✅🇶 Speaker Qid ([[Q42]]) → Speaker data → Speaker languages ([[Property:P4|P4]]) == | ||
<!-- Q: Add languages iso P:13 --> | <!-- Q: Add languages iso P:13 --> | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 198: | Line 198: | ||
== ✅ Speaker Qid + language → list of all associated audios == | == ✅ Speaker Qid + language → list of all associated audios == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 241: | Line 241: | ||
=== Sub-queries === | === Sub-queries === | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 261: | Line 261: | ||
|} | |} | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 283: | Line 283: | ||
== Isolang → Language LL Qid == | == Isolang → Language LL Qid == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 300: | Line 300: | ||
== ✅ Isolang → Language WD Qid == | == ✅ Isolang → Language WD Qid == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 322: | Line 322: | ||
== ✅ Language WD Qid → Language data == | == ✅ Language WD Qid → Language data == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 342: | Line 342: | ||
== ✅ Language LL Qid ([[Q209]]) → Language data == | == ✅ Language LL Qid ([[Q209]]) → Language data == | ||
'''Case:'' Get for language Q209 'Breton' all its data. | '''Case:'' Get for language Q209 'Breton' all its data. | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 361: | Line 361: | ||
== ✅ Language LL Qid ([[Q209]]) → core Language data == | == ✅ Language LL Qid ([[Q209]]) → core Language data == | ||
'''Case:'' Get for language Q209 'Breton' all its CORE data. | '''Case:'' Get for language Q209 'Breton' all its CORE data. | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 381: | Line 381: | ||
== ✅ Language LL Qid ([[Q209]]) → Number of records == | == ✅ Language LL Qid ([[Q209]]) → Number of records == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 402: | Line 402: | ||
== ✅ Language LL Qid ([[Q209]]) → Number of speakers == | == ✅ Language LL Qid ([[Q209]]) → Number of speakers == | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| | ||
Line 424: | Line 424: | ||
== ✅ Language ([[Q209]]) + speaker ([[Q584098]]) + word (ni) → Audio's Qid == | == ✅ Language ([[Q209]]) + speaker ([[Q584098]]) + word (ni) → Audio's Qid == | ||
'''Case:''' Search in Breton language, with speaker 'ThonyVezbe', | '''Case:''' Search in Breton language, with speaker 'ThonyVezbe', | ||
− | {| | + | {| style="width:100%" |
|- style="vertical-align:top;" | |- style="vertical-align:top;" | ||
|style="padding: 0 3em;width:60%"| | |style="padding: 0 3em;width:60%"| |
Revision as of 21:08, 6 December 2021
Base
Fetch SPARQL data
Data can be fetched using various coding languages such as Python, Javascript, R and others. On the Wikidata Query Service page, after running your SPARQL query, click "Code" : a pop up window appears with various implementations.
Javascript:
At least 3 methods exists (code snippet), example:
Query | Result's basic unit |
---|---|
var endpoint = 'https://lingualibre.org/sparql';
var sparql = 'SELECT ?item WHERE { ?item prop:P2 entity:Q5 } LIMIT 10';
$.getJSON(endpoint,
{ query: sparql, format: 'json' },
function(data){ console.log('JQuery: ',data)}
);
|
{ … },
{
"item": {
"type": "uri",
"value": "https://lingualibre.org/entity/Q12"
},
"itemLabel": {
"xml:lang": "en",
"type": "literal",
"value": "beginner"
}
},
{ … }
|
✅ Is Language level (language level (Q5)) → list possible values
SELECT ?item ?itemLabel
WHERE {
?item prop:P2 entity:Q5 # Condition 1, P2 'instance of' is Q5 'language level'.
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
✅ Is Sex or Gender(sex or gender (Q7)) → list possible values
SELECT ?item ?itemLabel
WHERE {
?item prop:P2 entity:Q7 # Condition 1, P2 'instance of' is Q7 'sex or gender'.
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
✅🇶 Is Speaker (speaker (Q3)) → list all speakers
SELECT ?speaker ?speakerLabel
WHERE {
?speaker prop:P2 entity:Q3 . # Condition 1, P2 'instance of' is Q3 'speaker'.
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
✅ Speaker name(s) → Speaker Qid(s)
SELECT ?speakerName ?speakerId
WHERE {
VALUES ?speakerName { "Yug" "VIGNERON" } # One or multiple values
BIND ( STRLANG(?speakerName, "en") AS ?speakerLabel )
# P2: instance of; Q3: speaker.
?speakerId prop:P2 entity:Q3 ; rdfs:label ?speakerLabel .
}
|
|
✅🇶 Speaker Qid (0x010C (Q42)) → Speaker data
# Get Q42 (User:0x010C)'s data
SELECT ?predicate ?predicate ?object ?objectLabel
WHERE {
entity:Q42 ?predicate ?object .
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
✅🇶 Speaker Qid (0x010C (Q42)) → Speaker data → Speaker languages (P4)
SELECT ?languages ?languagesLabel
WHERE {
entity:Q42 prop:P4 ?languages .
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
✅ Speaker Qid + language → list of all associated audios
SELECT ?audio ?audioLabel
WHERE {
?audio prop:P5 entity:Q42 . # Condition 1, P5 Speaker is Q42 User:0x010C
?audio prop:P4 entity:Q21 . # Condition 2, P4 language is Q21 French
# Labels
SERVICE wikibase:label {
bd:serviceParam wikibase:language "[AUTO_LANGUAGE],en" .
}
}
|
|
❌ Is Language (speaker (Q3)) → list all languages with number of unique words and speakers
Too large to run (not even on Lingualibre Query).
SELECT ?language (COUNT(?audio) AS ?nbAudio) (COUNT(?speaker) AS ?nbSpeaker) WHERE {
?language prop:P2 entity:Q4 .
?audio prop:P4 ?language .
?speaker prop:P4 ?language .
}
GROUP BY ?language
To do: do smaller sub-queries. For now, works only for one counter and one language at a time:
Sub-queries
SELECT ?language (COUNT(?audio) AS ?nbAudio) WHERE {
VALUES ?language { entity:Q21 }
?audio prop:P4 ?language .
}
GROUP BY ?language
|
|
SELECT ?language (COUNT(DISTINCT ?speaker) AS ?nbSpeaker) WHERE {
VALUES ?language { entity:Q21 }
?speaker prop:P4 ?language .
}
GROUP BY ?language
|
|
Isolang → Language LL Qid
SELECT * WHERE {
?lang prop:P13 ?code .
}
|
|
✅ Isolang → Language WD Qid
SELECT ?langIso ?langId
WHERE {
VALUES ?langIso { "ban" "bre" } # One or multiple values
# P2 'instance of'; Q4 'language'; P13 'ISO 639-3 code'
?langId prop:P2 entity:Q4 ; prop:P13 ?langIso .
}
|
|
✅ Language WD Qid → Language data
SELECT * WHERE {
?lang prop:P12 "Q12107" . # P12 'Wikidata id' is Wikidata's "Q12107"
?lang ?predicate ?object . #
}
|
|
✅ Language LL Qid (Breton (Q209)) → Language data
'Case: Get for language Q209 'Breton' all its data.
SELECT * WHERE {
# Given Q209 'Breton language', get all properties and values
entity:Q209 ?predicate ?object .
}
|
|
✅ Language LL Qid (Breton (Q209)) → core Language data
'Case: Get for language Q209 'Breton' all its CORE data.
SELECT * WHERE {
# Given Q209 'Breton language', get all properties and values
entity:Q209 ?predicate ?object .
?predicate rdf:type owl:DatatypeProperty .
}
|
|
✅ Language LL Qid (Breton (Q209)) → Number of records
SELECT ?language (COUNT(?audio) AS ?nbAudio) WHERE {
VALUES ?language { entity:Q209 }
?audio prop:P4 ?language .
}
GROUP BY ?language
|
|
✅ Language LL Qid (Breton (Q209)) → Number of speakers
SELECT ?language (COUNT(?speaker) AS ?nbSpeaker) WHERE {
VALUES ?language { entity:Q209 }
?speaker prop:P4 ?language .
}
GROUP BY ?language
|
|
✅ Language (Breton (Q209)) + speaker (ThonyVezbe (Q584098)) + word (ni) → Audio's Qid
Case: Search in Breton language, with speaker 'ThonyVezbe',
SELECT ?audio
WHERE {
?audio prop:P4 entity:Q209 . # P4 'language' is Q209 'Breton'
?audio prop:P5 entity:Q584098 . # P5 'speaker' is Q584098 'ThonyVezbe'
?audio rdfs:label ?word . #word
FILTER ( STR(?word) = "ni" ) # word = 'ni'
}
|
|
Audio Qid → Audio data
✅ Langue + speaker + word → Audio's Commons url
Tools
- Special:ApiSandbox – API queries generator for Lingualibre wikipage and wikibase contents.