
Hack around Fuseki service request error

Arkadiusz Ryś 2 years ago
parent
commit
8a5f37fde0

+ 4 - 0
README.rst

@@ -1,6 +1,10 @@
+##########
 SpEndPoint
 ##########
 
+Creates a SPARQL endpoint supporting custom services.
+Default access at `http://127.0.0.1:8000/gui`.
+
 Installation
 ------------
 

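A hedged usage sketch, not part of the commit: the GET handler added to spendpoint/endpoint.py below accepts the query as a `query` parameter and inspects the Accept header, so the endpoint the README describes can be exercised with any HTTP client. Host and port follow the README default; the query itself and the client library are illustrative.

    import requests

    # Any SPARQL query works; this one just lists a few triples.
    query = "SELECT ?s ?p ?o WHERE { ?s ?p ?o } LIMIT 10"

    response = requests.get(
        "http://127.0.0.1:8000/",                # default host/port per the README
        params={"query": query},                 # matches the handler's Query(None) parameter
        headers={"accept": "application/json"},  # selects the JSON serialisation branch
    )
    print(response.json())
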
+ 1 - 1
requirements.txt

@@ -1,5 +1,5 @@
 # SpEndPoint
-arklog            ~= 0.5.0
+arklog            ~= 0.5.1
 rdflib            ~= 6.2.0
 fastapi           ~= 0.92
 starlette         ~= 0.25.0

+ 44 - 36
spendpoint/endpoint.py

@@ -2,11 +2,11 @@
 
 import logging
 import re
-from typing import Any, Callable, Dict, List, Optional, Union
-from urllib import parse
-
+import arklog
 import pkg_resources
 import rdflib
+from typing import Any, Callable, Dict, List, Optional, Union
+from urllib import parse
 from fastapi import FastAPI, Query, Request, Response
 from fastapi.responses import JSONResponse
 from rdflib import ConjunctiveGraph, Dataset, Graph, Literal, URIRef
@@ -16,6 +16,8 @@ from rdflib.plugins.sparql.evalutils import _eval
 from rdflib.plugins.sparql.parserutils import CompValue
 from rdflib.plugins.sparql.sparql import QueryContext, SPARQLError
 
+arklog.set_config_logging()
+
 
 class SparqlEndpoint(FastAPI):
     """SPARQL endpoint for services and storage of heterogeneous data."""
@@ -40,24 +42,31 @@ class SparqlEndpoint(FastAPI):
         """"""
         return mime.split(",")[0] in ("text/turtle",)
 
-
-    def __init__(
-        self,
-        *args: Any,
-        title: str,
-        description: str,
-        version: str,
-        functions: Dict[str, Callable[..., Any]],
-        graph: Union[Graph, ConjunctiveGraph, Dataset] = ConjunctiveGraph(),
-        **kwargs: Any,
-    ):
+    async def requested_result_type(self, request: Request, operation: str) -> str:
+        logging.debug("Getting mime type.")
+        output_mime_type = request.headers["accept"]
+        # TODO Ugly hack, fix later (Fuseki sends options)
+        output_mime_type = output_mime_type.split(",")[0]
+        if isinstance(output_mime_type, list):
+            return output_mime_type[0]
+
+        # TODO Use match or dict for this
+        if not output_mime_type:
+            logging.warning("No mime type provided. Setting mimetype to 'application/xml'.")
+            return "application/xml"
+        if operation == "Construct Query" and (self.is_json_mime_type(output_mime_type) or self.is_csv_mime_type(output_mime_type)):
+            return "text/turtle"
+        if operation == "Construct Query" and output_mime_type == "application/xml":
+            return "application/rdf+xml"
+        return output_mime_type
+
+    def __init__(self, *args: Any, title: str, description: str, version: str, functions: Dict[str, Callable[..., Any]], graph: Union[Graph, ConjunctiveGraph, Dataset] = ConjunctiveGraph(), **kwargs: Any):
         """"""
         self.graph = graph
         self.functions = functions
         self.title = title
         self.description = description
         self.version = version
-
         super().__init__(*args, title=title, description=description, version=version, **kwargs)
         rdflib.plugins.sparql.CUSTOM_EVALS["evalCustomFunctions"] = self.eval_custom_functions
         api_responses: Optional[Dict[Union[int, str], Dict[str, Any]]] = {
@@ -95,7 +104,9 @@ class SparqlEndpoint(FastAPI):
 
         @self.get("/", name="SPARQL endpoint", description="", responses=api_responses)
         async def sparql_endpoint_get(request: Request, query: Optional[str] = Query(None)) -> Response:
+            logging.debug("Received GET request.")
             if not query:
+                logging.warning("No query provided in GET request!")
                 return JSONResponse({"error": "No query provided."})
 
             graph_ns = {}
@@ -121,30 +132,26 @@ class SparqlEndpoint(FastAPI):
                     content={"message": "Error executing the SPARQL query on the RDFLib Graph"},
                 )
 
-            # Format and return results depending on Accept mime type in request header
-            output_mime_type = request.headers["accept"]
-            if not output_mime_type:
-                output_mime_type = "application/xml"
-            # Handle mime type for construct queries
-            if query_operation == "Construct Query" and (self.is_json_mime_type(output_mime_type) or self.is_csv_mime_type(output_mime_type)):
-                output_mime_type = "text/turtle"
-                # TODO: support JSON-LD for construct query?
-                # g.serialize(format='json-ld', indent=4)
-            if query_operation == "Construct Query" and output_mime_type == "application/xml":
-                output_mime_type = "application/rdf+xml"
-
-            if self.is_csv_mime_type(output_mime_type):
-                return Response(query_results.serialize(format="csv"), media_type=output_mime_type)
-            elif self.is_json_mime_type(output_mime_type):
-                return Response(query_results.serialize(format="json"), media_type=output_mime_type)
-            elif self.is_xml_mime_type(output_mime_type):
-                return Response(query_results.serialize(format="xml"), media_type=output_mime_type)
-            elif self.is_turtle_mime_type(output_mime_type):
-                return Response(query_results.serialize(format="turtle"), media_type=output_mime_type)
-            return Response(query_results.serialize(format="xml"), media_type="application/sparql-results+xml")
+            logging.debug(f"{type(query_results)=}")
+            output_mime_type = await self.requested_result_type(request, query_operation)
+            logging.debug(f"Returning {output_mime_type}.")
+            try:
+                if self.is_csv_mime_type(output_mime_type):
+                    return Response(query_results.serialize(format="csv"), media_type=output_mime_type)
+                elif self.is_json_mime_type(output_mime_type):
+                    return Response(query_results.serialize(format="json"), media_type=output_mime_type)
+                elif self.is_xml_mime_type(output_mime_type):
+                    return Response(query_results.serialize(format="xml"), media_type=output_mime_type)
+                elif self.is_turtle_mime_type(output_mime_type):
+                    return Response(query_results.serialize(format="turtle"), media_type=output_mime_type)
+                return Response(query_results.serialize(format="xml"), media_type="application/sparql-results+xml")
+            except Exception as e:
+                logging.exception(e)
+                return JSONResponse(status_code=400, content={"message": "Error executing the SPARQL query on the RDFLib Graph"})
 
         @self.post("/", name="SPARQL endpoint", description="", responses=api_responses)
         async def sparql_endpoint_post(request: Request, query: Optional[str] = Query(None)) -> Response:
+            logging.debug("Received POST request.")
             if not query:
                 # Handle federated query services which provide the query in the body
                 query_body = await request.body()
@@ -168,6 +175,7 @@ class SparqlEndpoint(FastAPI):
             raise NotImplementedError()
 
         query_results = []
+        logging.debug("Custom evaluation.")
         for eval_part in evalPart(ctx, part.p):
             # Checks if the function is a URI (custom function)
             if hasattr(part.expr, "iri"):

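The heart of the Fuseki workaround is the requested_result_type method above: Fuseki sends a comma-separated list of mime types in its Accept header, and the hack keeps only the first entry. Note that after str.split the isinstance(..., list) branch can never trigger, since indexing the split result always yields a str; the "fix later" TODO presumably covers this. A more standards-aware follow-up would weigh q-values instead of trusting header order. A minimal sketch of such a helper, with an invented name and not part of this commit:

    def preferred_mime_type(accept_header: str, default: str = "application/xml") -> str:
        """Pick the highest q-value mime type from an Accept header."""
        if not accept_header:
            return default
        candidates = []
        for entry in accept_header.split(","):
            parts = entry.strip().split(";")
            mime = parts[0].strip()
            quality = 1.0  # an absent q-value means 1.0 per RFC 9110
            for param in parts[1:]:
                key, _, value = param.strip().partition("=")
                if key == "q":
                    try:
                        quality = float(value)
                    except ValueError:
                        quality = 0.0
            candidates.append((quality, mime))
        # Stable sort: among equal q-values the header order is preserved.
        candidates.sort(key=lambda pair: pair[0], reverse=True)
        return candidates[0][1]

    # The first entry no longer wins automatically once q-values are honoured.
    assert preferred_mime_type("text/turtle;q=0.8, application/xml") == "application/xml"
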
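The serialisation chain in sparql_endpoint_get and the "TODO Use match or dict for this" comment both point at the same refactor: a lookup table from mime type to rdflib serialisation format. A sketch under the assumption that the is_*_mime_type helpers match roughly these keys (their definitions are not shown in this diff):

    # Hypothetical mapping; keys mirror the branches in sparql_endpoint_get.
    SERIALIZE_FORMATS = {
        "text/csv": "csv",
        "application/sparql-results+json": "json",
        "application/json": "json",
        "application/sparql-results+xml": "xml",
        "application/xml": "xml",
        "text/turtle": "turtle",
    }

    def serialize_results(query_results, output_mime_type: str):
        # Fall back to SPARQL XML results, mirroring the handler's final return.
        fmt = SERIALIZE_FORMATS.get(output_mime_type, "xml")
        return query_results.serialize(format=fmt)
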
+ 0 - 145
spendpoint/wrapper.py

@@ -1,145 +0,0 @@
-# Copied from https://pypi.org/project/rdflib-endpoint/
-
-"""
-This example shows how a custom evaluation function can be added to
-handle certain SPARQL Algebra elements.
-
-A custom function is added that adds ``rdfs:subClassOf`` "inference" when
-asking for ``rdf:type`` triples.
-
-Here the custom eval function is added manually, normally you would use
-setuptools and entry_points to do it:
-i.e. in your setup.py::
-
-    entry_points = {
-        'rdf.plugins.sparqleval': [
-            'myfunc =     mypackage:MyFunction',
-            ],
-    }
-"""
-
-# EvalBGP https://rdflib.readthedocs.io/en/stable/_modules/rdflib/plugins/sparql/evaluate.html
-# Custom fct for rdf:type with auto infer super-classes: https://github.com/RDFLib/rdflib/blob/master/examples/custom_eval.py
-# BGP = Basic Graph Pattern
-# Docs rdflib custom fct: https://rdflib.readthedocs.io/en/stable/intro_to_sparql.html
-# StackOverflow: https://stackoverflow.com/questions/43976691/custom-sparql-functions-in-rdflib/66988421#66988421
-
-# Another project: https://github.com/bas-stringer/scry/blob/master/query_handler.py
-# https://www.w3.org/TR/sparql11-service-description/#example-turtle
-# Federated query: https://www.w3.org/TR/2013/REC-sparql11-federated-query-20130321/#defn_service
-# XML method: https://rdflib.readthedocs.io/en/stable/apidocs/rdflib.plugins.sparql.results.html#module-rdflib.plugins.sparql.results.xmlresults
-
-import rdflib
-from rdflib import Literal, URIRef
-from rdflib.plugins.sparql import parser
-from rdflib.plugins.sparql.algebra import pprintAlgebra, translateQuery
-from rdflib.plugins.sparql.evaluate import evalBGP
-
-# inferredSubClass = rdflib.RDFS.subClassOf * "*"  # any number of rdfs.subClassOf
-biolink = URIRef("https://w3id.org/biolink/vocab/")
-
-
-class Result:
-    pass
-
-
-def add_to_graph(ctx, drug, disease, score):
-    bnode = rdflib.BNode()
-    ctx.graph.add((bnode, rdflib.RDF.type, rdflib.RDF.Statement))
-    ctx.graph.add((bnode, rdflib.RDF.subject, drug))
-    ctx.graph.add((bnode, rdflib.RDF.predicate, biolink + "treats"))
-    ctx.graph.add((bnode, rdflib.RDF.object, disease))
-    ctx.graph.add((bnode, biolink + "category", biolink + "ChemicalToDiseaseOrPhenotypicFeatureAssociation"))
-    ctx.graph.add((bnode, biolink + "has_confidence_level", score))
-
-
-def get_triples(disease):
-    drug = URIRef("http://bio2rdf.org/drugbank:DB00001")
-    score = Literal("1.0")
-
-    r = Result()
-    r.drug = drug
-    r.disease = disease
-    r.score = score
-
-    results = []
-    results.append(r)
-    return results
-
-
-def custom_eval(ctx, part):
-    """ """
-    # print (part.name)
-
-    if part.name == "Project":
-        ctx.myvars = []
-
-    # search extend for variable binding
-    if part.name == "Extend" and hasattr(part, "expr") and not isinstance(part.expr, list):
-        ctx.myvars.append(part.expr)
-
-    # search for filter
-    if part.name == "Filter" and hasattr(part, "expr"):
-        if hasattr(part.expr, "expr"):
-            if part.expr.expr["op"] == "=":
-                part.expr.expr["expr"]
-                d = part.expr.expr["other"]
-                ctx.myvars.append(d)
-        else:
-            if part.expr["op"] == "=":
-                part.expr["expr"]
-                d = part.expr["other"]
-                ctx.myvars.append(d)
-
-    # search the BGP for the variable of interest
-    if part.name == "BGP":
-        triples = []
-        for t in part.triples:
-            if t[1] == rdflib.RDF.object:
-                disease = t[2]
-                # check first if the disease term is specified in the bgp triple
-                if isinstance(disease, rdflib.term.URIRef):
-                    ctx.myvars.append(disease)
-
-                # fetch instances
-                for d in ctx.myvars:
-                    results = get_triples(d)
-                    for r in results:
-                        add_to_graph(ctx, r.drug, r.disease, r.score)
-
-            triples.append(t)
-        return evalBGP(ctx, triples)
-    raise NotImplementedError()
-
-
-if __name__ == "__main__":
-    # add function directly, normally we would use setuptools and entry_points
-    rdflib.plugins.sparql.CUSTOM_EVALS["exampleEval"] = custom_eval
-
-    g = rdflib.Graph()
-
-    q = """PREFIX openpredict: <https://w3id.org/um/openpredict/>
-        PREFIX biolink: <https://w3id.org/biolink/vocab/>
-        PREFIX omim: <http://bio2rdf.org/omim:>
-        SELECT ?disease ?drug ?score
-        {
-            ?association a rdf:Statement ;
-                rdf:subject ?drug ;
-                rdf:predicate ?predicate ;
-                #rdf:object omim:246300 ;
-                rdf:object ?disease ;
-                biolink:category biolink:ChemicalToDiseaseOrPhenotypicFeatureAssociation ;
-                biolink:has_confidence_level ?score .
-            #?disease dcat:identifier "OMIM:246300" .
-            BIND(omim:1 AS ?disease)
-            #FILTER(?disease = omim:2 || ?disease = omim:3)
-            #VALUES ?disease { omim:5 omim:6 omim:7 }
-        }"""
-
-    pq = parser.parseQuery(q)
-    tq = translateQuery(pq)
-    pprintAlgebra(tq)
-
-    # Find all FOAF Agents
-    for x in g.query(q):
-        print(x)

+ 20 - 20
spendpoint/yasgui.html

@@ -2,27 +2,27 @@
 <html lang="en">
 
 <head>
-    <meta charset="utf-8">
-    <title>RDFLib endpoint</title>
-    <link href="https://unpkg.com/@triply/yasgui@4/build/yasgui.min.css" rel="stylesheet" type="text/css" />
-    <script src="https://unpkg.com/@triply/yasgui@4/build/yasgui.min.js"></script>
+  <meta charset="utf-8">
+  <title>RDFLib endpoint</title>
+  <link href="https://unpkg.com/@triply/yasgui@4/build/yasgui.min.css" rel="stylesheet" type="text/css"/>
+  <script src="https://unpkg.com/@triply/yasgui@4/build/yasgui.min.js"></script>
 </head>
 
 <body>
-    <div id="yasgui"></div>
-    <script>
-        Yasqe.defaults.value = `$EXAMPLE_QUERY`
-        const url = window.location.href.endsWith('/') ? window.location.href.slice(0, -1) : window.location.href;
-        const yasgui = new Yasgui(document.getElementById("yasgui"), {
-            requestConfig: { endpoint: url + "/" },
-            endpointCatalogueOptions: {
-                getData: function () {
-                    return [
-                        { endpoint: url + "/" },
-                    ];
-                },
-                keys: [],
-            },
-        });
-    </script>
+<div id="yasgui"></div>
+<script>
+  Yasqe.defaults.value = `$EXAMPLE_QUERY`
+  const url = window.location.href.endsWith('/') ? window.location.href.slice(0, -1) : window.location.href;
+  const yasgui = new Yasgui(document.getElementById("yasgui"), {
+    requestConfig: {endpoint: url + "/"},
+    endpointCatalogueOptions: {
+      getData: function () {
+        return [
+          {endpoint: url + "/"},
+        ];
+      },
+      keys: [],
+    },
+  });
+</script>
 </body>

+ 0 - 30
tests/test_query_endpoint.py

@@ -1,30 +0,0 @@
-import logging
-import arklog
-import pytest
-# arklog.set_config_logging()
-from SPARQLWrapper import SPARQLWrapper, JSON
-
-logging.basicConfig(encoding="utf-8", level=logging.DEBUG)
-
-# TODO Convert to test
-def query_0():
-    """"""
-    sparql = SPARQLWrapper("http://localhost:8000/")
-    sparql.setReturnFormat(JSON)
-    sparql.setQuery(
-        """
-        PREFIX dtf: <https://ontology.rys.app/dt/function/>
-        SELECT ?outlier ?outlier_value WHERE {
-            BIND(dtf:outlier("data.csv", "2") AS ?outlier)
-        }
-        """
-    )
-    ret = sparql.query().convert()
-    if not ret:
-        logging.info("No outliers!")
-    for r in ret["results"]["bindings"]:
-        logging.info(r)
-
-
-if __name__ == "__main__":
-    query_0()
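
For context on the custom-function path that remains in spendpoint/endpoint.py: the removed test above bound dtf:outlier("data.csv", "2") in a query, which is the kind of IRI-addressed callable the functions argument of SparqlEndpoint carries. A hedged registration sketch; keying the mapping by full IRI string is an assumption read off the Dict[str, Callable[..., Any]] annotation, and since the diff does not show how eval_custom_functions invokes these callables, both the signature and body below are guesses:

    from rdflib import Literal
    from spendpoint.endpoint import SparqlEndpoint

    def outlier(file_name: Literal, column: Literal) -> Literal:
        # Placeholder; the real outlier service is not shown in this commit.
        return Literal(f"checked {file_name}, column {column}")

    app = SparqlEndpoint(
        title="SpEndPoint",
        description="SPARQL endpoint supporting custom services.",
        version="0.1.0",
        functions={"https://ontology.rys.app/dt/function/outlier": outlier},
    )

Being a FastAPI subclass, the resulting app would be served in the usual way, e.g. with uvicorn.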