1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
|
# -*- coding: utf-8 -*-
import os
import shutil
import tempfile
from test.data import context1, likes, pizza, tarek
import pytest
from rdflib import URIRef, plugin
from rdflib.graph import DATASET_DEFAULT_GRAPH_ID, Dataset, Graph
from rdflib.namespace import Namespace
from rdflib.store import Store
# Will also run SPARQLUpdateStore tests against local SPARQL1.1 endpoint if
# available. This assumes SPARQL1.1 query/update endpoints running locally at
# http://localhost:3030/db/
#
# Testing SPARQLUpdateStore Dataset behavior needs a different endpoint behavior
# than our ConjunctiveGraph tests in test_sparqlupdatestore.py!
#
# For the tests here to run, you can for example start fuseki with:
# ./fuseki-server --mem --update /db
# THIS WILL DELETE ALL DATA IN THE /db dataset
# Base URL of the optional local SPARQL 1.1 server and the dataset path on it.
HOST = "http://localhost:3030"
DB = "/db/"

# Names of the additional store plugins the tests below are parametrized over.
pluginstores = []

for s in plugin.plugins(None, Store):
    if s.name in ("Memory", "Auditable", "Concurrent", "SPARQLStore"):
        continue  # these are tested by default

    if not s.getClass().graph_aware:
        continue

    if s.name == "SPARQLUpdateStore":
        from urllib.request import urlopen

        try:
            # Probe the server with an explicit check rather than ``assert``
            # (which is stripped under ``python -O``), and let the context
            # manager close the HTTP response once it has been read.
            with urlopen(HOST) as response:
                if not response.read():
                    continue
        except Exception:
            # Deliberately broad: any failure to reach the server simply
            # means the endpoint is unavailable, so the store is left out.
            continue

    pluginstores.append(s.name)
def _clear_sparql_store(graph):
    """Send ``CLEAR ALL`` to the store behind *graph*.

    An exception whose message contains the "SPARQLStore does not support
    BNodes! " marker is ignored; any other exception propagates unchanged,
    keeping its original type and traceback.
    """
    try:
        graph.store.update("CLEAR ALL")
    except Exception as e:
        if "SPARQLStore does not support BNodes! " not in str(e):
            raise


@pytest.fixture(
    scope="function",
    params=pluginstores,
)
def get_dataset(request):
    """Yield ``(store_name, dataset)`` for each store listed in ``pluginstores``.

    The dataset is opened before the test runs. After the test, the
    SPARQLUpdateStore is cleared and closed; every other store is closed,
    destroyed and its on-disk location removed.

    The test is skipped when the store's dependencies cannot be imported or
    when the store is not graph aware.
    """
    store = request.param

    try:
        graph = Dataset(store=store)
    except ImportError:
        pytest.skip("Dependencies for store '%s' not available!" % store)

    if not graph.store.graph_aware:
        # A generator fixture must yield exactly once; skip rather than
        # returning before the yield.
        pytest.skip("Store '%s' is not graph aware!" % store)

    if store in ["SQLiteLSM", "LevelDB"]:
        path = os.path.join(tempfile.gettempdir(), f"test_{store.lower()}")
        # Start from a clean slate; a missing directory is not an error.
        shutil.rmtree(path, ignore_errors=True)
    elif store == "SPARQLUpdateStore":
        root = HOST + DB
        # (query endpoint, update endpoint)
        path = root + "sparql", root + "update"
    else:
        path = tempfile.mkdtemp()

    # The remote endpoint already exists, so only local stores are created.
    graph.open(path, create=store != "SPARQLUpdateStore")

    if store == "SPARQLUpdateStore":
        _clear_sparql_store(graph)

    yield store, graph

    if store == "SPARQLUpdateStore":
        _clear_sparql_store(graph)
        graph.close()
    else:
        graph.close()
        graph.destroy(path)
        if os.path.isdir(path):
            shutil.rmtree(path)
        else:
            # The store may have been a single file, or already be gone.
            try:
                os.remove(path)
            except OSError:
                pass
def test_graph_aware(get_dataset):
    """Walk a named graph through creation, one triple, emptying and removal."""
    store, dataset = get_dataset
    if not dataset.store.graph_aware:
        return

    def context_ids():
        # Identifiers of every context the dataset currently reports.
        return {ctx.identifier for ctx in dataset.contexts()}

    with_named_graph = {context1, DATASET_DEFAULT_GRAPH_ID}
    # Some SPARQL endpoint backends (e.g. TDB) do not consider
    # empty named graphs
    reports_empty_graphs = store != "SPARQLUpdateStore"

    named = dataset.graph(context1)

    if reports_empty_graphs:
        # the freshly added graph is listed
        assert context_ids() == with_named_graph

    # and it starts out empty
    assert len(named) == 0

    named.add((tarek, likes, pizza))

    # the graph is still listed
    assert context_ids() == with_named_graph

    # and now holds exactly one triple
    assert len(named) == 1

    named.remove((tarek, likes, pizza))

    # the graph is empty again
    assert len(named) == 0

    if reports_empty_graphs:
        # the graph is still listed even though it is empty
        assert context_ids() == with_named_graph

    dataset.remove_graph(context1)

    # only the default graph remains
    assert context_ids() == {DATASET_DEFAULT_GRAPH_ID}
def test_default_graph(get_dataset):
    """Check that the default graph takes triples and survives its own removal."""
    # Sometimes the default graph is read-only (e.g. TDB in union mode)
    store, dataset = get_dataset
    if store == "SPARQLUpdateStore":
        reminder = (
            "Please make sure updating the default graph "
            "is supported by your SPARQL endpoint"
        )
        print(reminder)

    triple = (tarek, likes, pizza)
    dataset.add(triple)
    assert len(dataset) == 1

    # the default graph is the only context
    assert list(dataset.contexts()) == [dataset.default_context]

    # removing the default graph drops its triples but not the graph itself
    dataset.remove_graph(DATASET_DEFAULT_GRAPH_ID)
    assert len(dataset) == 0

    # the default graph is still there
    assert set(dataset.contexts()) == {dataset.default_context}
def test_not_union(get_dataset):
    """Check that a triple added to a named graph is not seen via the dataset."""
    store, dataset = get_dataset

    # Union depends on the SPARQL endpoint configuration
    if store == "SPARQLUpdateStore":
        reminder = (
            "Please make sure your SPARQL endpoint has not configured "
            "its default graph as the union of the named graphs"
        )
        print(reminder)

    named = dataset.graph(context1)
    named.add((tarek, likes, pizza))

    # querying the dataset itself finds nothing ...
    objects_via_dataset = list(dataset.objects(tarek, None))
    assert objects_via_dataset == []

    # ... while the named graph holds the object
    objects_via_named = list(named.objects(tarek, None))
    assert objects_via_named == [pizza]
def test_iter(get_dataset):
    """PR 1382: adds __iter__ to Dataset"""
    _, d = get_dataset

    uri_a = URIRef("https://example.com/a")
    uri_b = URIRef("https://example.com/b")
    uri_c = URIRef("https://example.com/c")
    uri_d = URIRef("https://example.com/d")
    subgraph1 = URIRef("https://example.com/subgraph1")
    g2 = URIRef("https://example.com/g2")

    d.graph(subgraph1)
    d.add((uri_a, uri_b, uri_c, subgraph1))
    d.add((uri_a, uri_b, uri_c, subgraph1))  # pointless addition: duplicates above

    d.graph(g2)
    d.add((uri_a, uri_b, uri_c, g2))
    d.add((uri_a, uri_b, uri_d, subgraph1))

    # traditional iterator
    i_trad = sum(1 for _ in d.quads((None, None, None)))

    # new Dataset.__iter__ iterator
    i_new = sum(1 for _ in d)

    assert i_new == i_trad  # both should be 3
EGSCHEMA = Namespace("example:")


def test_subgraph_without_identifier() -> None:
    """
    Graphs with no identifier assigned are identified by Skolem IRIs with a
    prefix that is bound to `genid`.

    TODO: This is somewhat questionable and arbitrary behaviour and should be
    reviewed at some point.
    """
    dataset = Dataset()
    nman = dataset.namespace_manager
    genid_prefix = URIRef("https://rdflib.github.io/.well-known/genid/rdflib/")

    def genid_binding():
        # The (prefix, namespace) pair bound to "genid", or None when there
        # is no such binding.
        for binding in set(nman.namespaces()):
            if binding[0] == "genid":
                return binding
        return None

    # Nothing is bound to "genid" on a fresh dataset.
    assert genid_binding() is None

    subgraph: Graph = dataset.graph()
    triple = (EGSCHEMA["subject"], EGSCHEMA["predicate"], EGSCHEMA["object"])
    subgraph.add(triple)

    # After the anonymous subgraph is created and used, the prefix is bound
    # and the subgraph's identifier lives under it.
    assert genid_binding() == ("genid", genid_prefix)
    assert str(subgraph.identifier).startswith(genid_prefix)
|