-
Notifications
You must be signed in to change notification settings - Fork 13
/
Copy pathsparql_query.py
48 lines (41 loc) · 1.93 KB
/
sparql_query.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
from typing import List
import jsonasobj
import requests
from SPARQLWrapper import JSON
from rdflib import URIRef
from pyshex.user_agent import UserAgent, SPARQLWrapperWithAgent
class SPARQLQuery:
def __init__(self, sparql_endpoint: str, sparql_file_uri_or_text: str,
print_query: bool=False, print_results: bool=False, user_agent: str = UserAgent) -> None:
""" Set up the query to run
:param sparql_endpoint: URL of sparql endpoint
:param sparql_file_uri_or_text: URI, filename or SPARQL text
:param print_query: Print the sparql results query
:param print_results: Print query results
"""
self.print_results = print_results
if '\n' in sparql_file_uri_or_text or '\r' in sparql_file_uri_or_text or ' ' in sparql_file_uri_or_text:
self.query = sparql_file_uri_or_text
elif ':/' in sparql_file_uri_or_text:
req = requests.get(sparql_file_uri_or_text, headers={'User-Agent': user_agent})
if not req.ok:
raise ValueError(f"Unable to read {sparql_file_uri_or_text}")
self.query = req.text
else:
with open(sparql_file_uri_or_text) as f:
self.query = f.read()
if print_query:
print("SPARQL:")
print(self.query)
self.endpoint = SPARQLWrapperWithAgent(sparql_endpoint)
self.endpoint.setQuery(self.query)
self.endpoint.setReturnFormat(JSON)
def focus_nodes(self) -> List[URIRef]:
result = self.endpoint.query()
processed_results = jsonasobj.load(result.response)
if self.print_results:
print('\t' + ('\n\t'.join([row.item.value for row in processed_results.results.bindings[:10]])))
if len(processed_results.results.bindings) > 10:
print('\n\t ...')
print('\n')
return [URIRef(row.item.value) for row in processed_results.results.bindings]