Examples of queries to assess scope of Wikidata coverage.
Find people in Wikidata who have IPNI author IDs (the set of botanical taxonomists who have published plant names)
# Every item with an IPNI author ID (P586); the ORCID iD (P496) and the
# Wikispecies article about the item are added when they exist.
SELECT *
WHERE {
  ?item wdt:P586 ?IPNI_author_ID .

  # Optional: items without an ORCID iD are still returned, with ?orcid unbound.
  OPTIONAL { ?item wdt:P496 ?orcid . }

  # Optional: a page about the item that belongs to species.wikimedia.org.
  OPTIONAL {
    ?article schema:about ?item .
    ?article schema:isPartOf <https://species.wikimedia.org/> .
  }
}
Try it 46725 rows 2019-09-27
Find IPNI authors who also have an ORCID id
# Items that carry both an IPNI author ID (P586) and an ORCID iD (P496).
# Both patterns are required, so items missing either one are excluded.
SELECT *
WHERE {
  ?item wdt:P586 ?IPNI_author_ID ;
        wdt:P496 ?orcid .
}
Try it 400 rows 2019-09-27
IPNI authors that also have Wikispecies articles
# Items with an IPNI author ID (P586) that also have an article on
# species.wikimedia.org describing them.
SELECT *
WHERE {
  ?item wdt:P586 ?IPNI_author_ID .

  # Sitelink: the article is about the item and is part of Wikispecies.
  ?article schema:about ?item .
  ?article schema:isPartOf <https://species.wikimedia.org/> .
}
Try it 12223 rows 2019-09-27
Find people with ZooBank author ids (set of zoological authors who have published names)
# Every item that has a ZooBank author ID (P2006).
SELECT *
WHERE {
  ?item wdt:P2006 ?zoobank .
}
15658 rows 2019-09-27 (same as Wikispecies)
Zoobank authors that also have Wikispecies articles
# Items with a ZooBank author ID (P2006) that also have an article on
# species.wikimedia.org describing them.
SELECT *
WHERE {
  ?item wdt:P2006 ?zoobank .

  # Sitelink: the article is about the item and is part of Wikispecies.
  ?article schema:about ?item .
  ?article schema:isPartOf <https://species.wikimedia.org/> .
}
Try it 15658 rows 2019-09-27
ZooBank authors with ORCID ids in Wikidata
# Items that carry both a ZooBank author ID (P2006) and an ORCID iD (P496).
# Both patterns are required, so items missing either one are excluded.
SELECT *
WHERE {
  ?item wdt:P2006 ?zoobank ;
        wdt:P496 ?orcid .
}
Try it 1138 rows 2019-09-27
# Number of ZooBank authors per country of citizenship.
# Output columns:
#   ?citizenship        - the citizenship value (P27) as an item
#   ?citizenship_label  - its English label
#   ?count              - number of distinct people with that citizenship
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
SELECT
  ?citizenship ?citizenship_label (COUNT(DISTINCT ?item) AS ?count)
WHERE
{
  # get people
  ?item wdt:P2006 ?zoobank .

  # get citizenship
  # The person's own label is deliberately not joined: it is never projected,
  # and requiring an English one would drop people who lack it from the counts.
  ?item wdt:P27 ?citizenship .
  ?citizenship rdfs:label ?citizenship_label .
  FILTER (lang(?citizenship_label) = 'en')
}
# COUNT(DISTINCT ?item) counts people rather than solution rows, so a person
# with more than one ZooBank ID is not counted several times.
# GROUP BY already yields one row per group, so SELECT DISTINCT is unnecessary.
GROUP BY ?citizenship ?citizenship_label
ORDER BY DESC(?count) ?citizenship_label
# Number of ZooBank authors per gender.
# Output columns:
#   ?gender        - the gender value (P21) as an item
#   ?gender_label  - its English label
#   ?count         - number of distinct people with that gender value
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
SELECT
  ?gender ?gender_label (COUNT(DISTINCT ?item) AS ?count)
WHERE
{
  # get people
  ?item wdt:P2006 ?zoobank .

  # get gender
  # The person's own label is deliberately not joined: it is never projected,
  # and requiring an English one would drop people who lack it from the counts.
  ?item wdt:P21 ?gender .
  ?gender rdfs:label ?gender_label .
  FILTER (lang(?gender_label) = 'en')
}
# COUNT(DISTINCT ?item) counts people rather than solution rows, so a person
# with more than one ZooBank ID is not counted several times.
# GROUP BY already yields one row per group, so SELECT DISTINCT is unnecessary.
GROUP BY ?gender ?gender_label
ORDER BY DESC(?count) ?gender_label
Note that a major problem is that birth dates are often imprecise: a date of “20th C” is translated to 1 January 2000, which is of no use.
# Birth year of each ZooBank author, oldest first.
# Output columns: ?item, ?name (English label), ?year (year of birth).
#
# Only dates recorded with at least year precision are returned. Coarser dates
# (decade, century, ...) are stored as a single nominal timestamp, so taking
# YEAR() of them gives a misleading value.
# Relies on the p:, psv: and wikibase: prefixes being predefined by the
# endpoint, in the same way the query already relies on wdt:.
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
SELECT DISTINCT
  ?item ?name
  (YEAR(?birth) AS ?year)
WHERE
{
  # get people
  ?item wdt:P2006 ?zoobank .
  ?item rdfs:label ?name .
  FILTER (lang(?name) = 'en')

  # Walk the full birth-date statement instead of the truthy wdt: shortcut so
  # the precision is available. Restricting to BestRank selects the same
  # statements that wdt:P569 would.
  ?item p:P569 ?birth_statement .
  ?birth_statement a wikibase:BestRank ;
                   psv:P569 ?birth_value .
  ?birth_value wikibase:timeValue ?birth ;
               wikibase:timePrecision ?precision .

  # Precision codes: 7 = century, 8 = decade, 9 = year, 10 = month, 11 = day.
  FILTER (?precision >= 9)
}
ORDER BY ?year
# Every item with a P6264 value (bound to ?harvard_id), plus the Wikispecies
# article about the item when one exists.
SELECT *
WHERE {
  ?item wdt:P6264 ?harvard_id .

  # Optional: items without a Wikispecies page are kept, with ?article unbound.
  OPTIONAL {
    ?article schema:about ?item .
    ?article schema:isPartOf <https://species.wikimedia.org/> .
  }
}
# Every item whose P106 value is wd:Q2083925.
# NOTE(review): P106 is presumably "occupation"; confirm which occupation
# Q2083925 denotes.
SELECT *
WHERE {
  ?item wdt:P106 wd:Q2083925 .
}
Only 388 results!