forked from zbw/sparql-queries
-
Notifications
You must be signed in to change notification settings - Fork 0
/
search_corp_by_pm20_names.rq
101 lines (100 loc) · 3.24 KB
/
search_corp_by_pm20_names.rq
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
# Search for organizations from PM20, looking up all available
# labels, with additional data for identification
#
# Uses diverse literal properties, brings the best match on top
# of the list
#
PREFIX gndo: <https://d-nb.info/standards/elementset/gnd#>
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
PREFIX skos: <http://www.w3.org/2004/02/skos/core#>
PREFIX text: <http://jena.apache.org/text#>
PREFIX wd: <http://www.wikidata.org/entity/>
PREFIX xsd: <http://www.w3.org/2001/XMLSchema#>
PREFIX schema: <http://schema.org/>
PREFIX wdt: <http://www.wikidata.org/prop/direct/>
PREFIX xs: <http://www.w3.org/2001/XMLSchema#>
#
select distinct ?pm20 (str(?prefLabel) as ?pm20Label) ?wd ?wdLabel
?time ?description ?addpm20 ('add' as ?addpm20Label)
# debug information
# ?score ?literal ?labels
where {
# lookup additional information about pm20 folder
service <https://zbw.eu/beta/sparql/pm20/query> {
select ?pm20 ?prefLabel (group_concat(?altLabel) as ?altLabels)
where {
values ( ?pm20 ) {
( <http://purl.org/pressemappe20/folder/co/018039> )
}
?pm20 skos:prefLabel ?prefLabel ;
skos:altLabel ?alt .
# truncate combined alt labels
bind(coalesce(strbefore(?alt, ' <'), strbefore(?alt, ' -- '), ?alt) as ?altLabel)
}
group by ?pm20 ?prefLabel
}
# create one string of all labels
bind(concat(?prefLabel, ' ', ?altLabels) as ?labels)
#
# search text and limit number of results
(?wd ?score ?literal) text:query ( ?labels 100 ) .
#
# filter out wikimedia categories, disambig pages, first-family names, templates
optional {
?wd wdt:P31 ?class .
}
# exclude certain classes
filter(!bound(?class) || ?class not in (
wd:Q4167410, # disambiguation page
wd:Q11266439, # template
wd:Q4167836, # category
wd:Q202444, # given name
wd:Q101352, # family name
wd:Q7725634, # literary work
wd:Q732577, # publication
wd:Q571, # book
wd:Q23927052, # conference paper
wd:Q5633421, # scientific journal
wd:Q13442814, # scientific article
wd:Q7366, # song
wd:Q134556, # single
wd:Q16551537, # album
wd:Q11424 # film
))
#
# try to get a label
optional {
?wd rdfs:label ?wdLabelDe .
filter(lang(?wdLabelDe) = 'de')
}
optional {
?wd rdfs:label ?wdLabelEn .
filter(lang(?wdLabelEn) = 'en')
}
bind(strafter(str(?wd), str(wd:)) as ?wdId)
bind(coalesce(str(?wdLabelDe), str(?wdLabelEn), ?wdId) as ?wdLabel)
#
# try to get a description
optional {
?wd schema:description ?descDe .
filter(lang(?descDe) = 'de')
}
optional {
?wd schema:description ?descEn .
filter(lang(?descEn) = 'en')
}
bind(coalesce(str(?descDe), str(?descEn), '') as ?description)
#
# additional information to display
optional {
?wd wdt:P571 ?established .
}
optional {
?wd wdt:P576 ?terminated .
}
bind(concat(if(bound(?established), str(year(?established)), ''), ' - ', if(bound(?terminated), str(year(?terminated)), '')) as ?time)
#
# Quickstatements link
bind(strafter(str(?pm20), 'http://purl.org/pressemappe20/folder/co/') as ?id)
bind(uri(concat('https://tools.wmflabs.org/quickstatements/#v1=', ?wdId, '|P4293|"co%2F', ?id, '"')) as ?addpm20)
}