RDFLib · ashleysommer · Oct 8, 2020 · Oct 3, 2020 · Oct 3, 2020 · Oct 3, 2020
diff --git a/.travis.fuseki_install_optional.sh b/.travis.fuseki_install_optional.sh
@@ -2,7 +2,7 @@
 
 set -v
 
-uri="http://archive.apache.org/dist/jena/binaries/apache-jena-fuseki-2.4.0.tar.gz"
+uri="http://archive.apache.org/dist/jena/binaries/apache-jena-fuseki-3.9.0.tar.gz"
 
 if wget "$uri" &&
        tar -zxf *jena*fuseki*.tar.gz &&

diff --git a/.travis.yml b/.travis.yml
@@ -9,9 +9,9 @@ git:
   depth: 3
 
 python:
-    - 3.5
     - 3.6
     - 3.7
+    - 3.8
 
 jobs:
   include:
@@ -24,6 +24,7 @@ before_install:
 
 install:
     - pip install --default-timeout 60 -r requirements.txt
+    - pip install --default-timeout 60 -r requirements.dev.txt
     - pip install --default-timeout 60 coverage coveralls nose-timer && export HAS_COVERALLS=1
     - python setup.py install
 

diff --git a/CONTRIBUTORS b/CONTRIBUTORS
@@ -1,6 +1,7 @@
 Aaron Swartz
 Andrew Eland
 Andrew Kuchling
+Ashley Sommer
 Arve Knudsen
 Chimezie Ogbuji
 Daniel Krech
@@ -18,7 +19,9 @@ Kendall Clark
 Leandro López
 Lucio Torre
 Michel Pelletier
+Natanael Arndt
 Nacho Barrientos Arias
+Nicholas J. Car
 Niklas Lindström
 Phil Dawes
 Phillip Pearson

diff --git a/LICENSE b/LICENSE
@@ -1,6 +1,6 @@
 LICENSE AGREEMENT FOR RDFLIB 
 ------------------------------------------------
-Copyright (c) 2002-2017, RDFLib Team
+Copyright (c) 2002-2020, RDFLib Team
 See CONTRIBUTORS and http://github.com/RDFLib/rdflib
 All rights reserved.
 

diff --git a/README.md b/README.md
@@ -31,7 +31,7 @@ Please see the list for all packages/repositories here:
 ## Versions
 
  * `5.x.y` supports Python 2.7 and 3.4+ and is [mostly backwards compatible with 4.2.2](https://rdflib.readthedocs.io/en/stable/upgrade4to5.html). Only bug fixes will be applied.
- * `6.x.y` is the next major release which will support Python 3.5+. (Current master branch)
+ * `6.x.y` is the next major release which will support Python 3.6+. (Current master branch)
 
 
 ## Installation

diff --git a/docs/developers.rst b/docs/developers.rst
@@ -59,7 +59,7 @@ Compatibility
 
 RDFLib 5.x.y tries to be compatible with python versions 2.7, 3.4, 3.5, 3.6, 3.7.
 
-The current master branch (which will be released as 6.0.0) will only support Python 3.5 and newer.
+The current master branch (which will be released as 6.0.0) will only support Python 3.6 and newer.
 
 
 Releasing

diff --git a/examples/sparqlstore_example.py b/examples/sparqlstore_example.py
@@ -1,16 +1,15 @@
 """
-A simple example showing how to use the SPARQLStore
+Simple examples showing how to use the SPARQLStore
 """
 
-import locale
 from rdflib import Graph, URIRef, Namespace
 from rdflib.plugins.stores.sparqlstore import SPARQLStore
 
 if __name__ == "__main__":
 
     dbo = Namespace("http://dbpedia.org/ontology/")
 
-    # using a Graph with the Store type string set to "SPARQLStore"
+    # EXAMPLE 1: using a Graph with the Store type string set to "SPARQLStore"
     graph = Graph("SPARQLStore", identifier="http://dbpedia.org")
     graph.open("http://dbpedia.org/sparql")
 
@@ -22,13 +21,28 @@
         ).replace(",", ".")
     )
 
-    # using a SPARQLStore object directly
-    s = SPARQLStore(endpoint="http://dbpedia.org/sparql")
-    s.open(None)
-    pop = graph.value(
-        URIRef("http://dbpedia.org/resource/Brisbane"), dbo.populationTotal
-    )
-    print(
-        "According to DBPedia, Brisbane has a population of "
-        "{0:,}".format(int(pop), ",d")
-    )
+    # EXAMPLE 2: using a SPARQLStore object directly
+    st = SPARQLStore(query_endpoint="http://dbpedia.org/sparql")
+
+    for p in st.objects(URIRef("http://dbpedia.org/resource/Brisbane"), dbo.populationTotal):
+        print(
+            "According to DBPedia, Brisbane has a population of "
+            "{0:,}".format(int(p))  # format the value yielded by this loop, not the earlier `pop`
+        )
+
+    # EXAMPLE 3: doing RDFlib triple navigation using SPARQLStore as a Graph()
+    graph = Graph("SPARQLStore", identifier="http://dbpedia.org")
+    graph.open("http://dbpedia.org/sparql")
+    # we are asking DBPedia for 3 skos:Concept instances
+    count = 0
+    from rdflib.namespace import RDF, SKOS
+    for s in graph.subjects(predicate=RDF.type, object=SKOS.Concept):
+        count += 1
+        print(s)
+        if count >= 3:
+            break
+
+    # EXAMPLE 4: using a SPARQL endpoint that requires Basic HTTP authentication
+    # NOTE: this example won't run since the endpoint isn't live (or real)
+    s = SPARQLStore(query_endpoint="http://fake-sparql-endpoint.com/repository/x", auth=("my_username", "my_password"))
+    # do normal Graph things
diff --git a/rdflib/plugins/sparql/evaluate.py b/rdflib/plugins/sparql/evaluate.py
@@ -17,7 +17,9 @@
 import collections
 import itertools
 import re
-import requests
+from urllib.request import urlopen, Request
+from urllib.parse import urlencode
+import json as j
 from pyparsing import ParseException
 
 from rdflib import Variable, Graph, BNode, URIRef, Literal
@@ -313,13 +315,11 @@ def evalServiceQuery(ctx, part):
         }
         # GET is easier to cache so prefer that if the query is not to long
         if len(service_query) < 600:
-            response = requests.get(service_url, params=query_settings, headers=headers)
+            response = urlopen(Request(service_url + "?" + urlencode(query_settings), headers=headers))
         else:
-            response = requests.post(
-                service_url, params=query_settings, headers=headers
-            )
-        if response.status_code == 200:
-            json = response.json()
+            response = urlopen(Request(service_url, data=urlencode(query_settings).encode(), headers=headers))
+        if response.status == 200:
+            json = j.loads(response.read())
             variables = res["vars_"] = json["head"]["vars"]
             # or just return the bindings?
             res = json["results"]["bindings"]
@@ -329,7 +329,7 @@ def evalServiceQuery(ctx, part):
                         yield bound
         else:
             raise Exception(
-                "Service: %s responded with code: %s", service_url, response.status_code
+                "Service: %s responded with code: %s" % (service_url, response.status)
             )
 
 

diff --git a/rdflib/plugins/stores/sparqlconnector.py b/rdflib/plugins/stores/sparqlconnector.py
@@ -1,12 +1,13 @@
 import logging
-import threading
-import requests
-
-import os
+from urllib.request import urlopen, Request
+from urllib.parse import urlencode
+from urllib.error import HTTPError, URLError
+import base64
 
 from io import BytesIO
 
 from rdflib.query import Result
+from rdflib import BNode
 
 log = logging.getLogger(__name__)
 
@@ -26,7 +27,6 @@ class SPARQLConnectorException(Exception):
 
 
 class SPARQLConnector(object):
-
     """
     this class deals with nitty gritty details of talking to a SPARQL server
     """
@@ -37,29 +37,26 @@ def __init__(
         update_endpoint=None,
         returnFormat="xml",
         method="GET",
+        auth=None,
         **kwargs
     ):
         """
-        Any additional keyword arguments will be passed to requests, and can be used to setup timesouts, basic auth, etc.
+        auth, if present, must be a tuple of (username, password) used for Basic Authentication
+
+        Any additional keyword arguments will be passed to the request, and can be used to set up timeouts etc.
         """
 
         self.returnFormat = returnFormat
         self.query_endpoint = query_endpoint
         self.update_endpoint = update_endpoint
         self.kwargs = kwargs
         self.method = method
-
-        # it is recommended to have one session object per thread/process. This assures that is the case.
-        # https://github.com/kennethreitz/requests/issues/1871
-
-        self._session = threading.local()
-
-    @property
-    def session(self):
-        k = "session_%d" % os.getpid()
-        self._session.__dict__.setdefault(k, requests.Session())
-        log.debug("Session %s %s", os.getpid(), id(self._session.__dict__[k]))
-        return self._session.__dict__[k]
+        if auth is not None:
+            if not isinstance(auth, tuple) or len(auth) != 2:  # explicit check: asserts are stripped under -O
+                raise ValueError("auth must be a tuple (user, password)")
+            base64string = base64.b64encode(("%s:%s" % auth).encode("utf-8"))  # utf-8 so non-ASCII credentials work
+            self.kwargs.setdefault("headers", {})
+            self.kwargs["headers"].update({"Authorization": "Basic %s" % base64string.decode('utf-8')})
 
     @property
     def method(self):
@@ -72,19 +69,18 @@ def method(self, method):
 
         self._method = method
 
-    def query(self, query, default_graph=None):
-
+    def query(self, query, default_graph: str = None, named_graph: str = None):
         if not self.query_endpoint:
             raise SPARQLConnectorException("Query endpoint not set!")
 
         params = {"query": query}
-        if default_graph:
+        # this test ensures we don't have a useless (BNode) default graph URI, which calls to Graph().query() will add
+        if default_graph is not None and not isinstance(default_graph, BNode):
             params["default-graph-uri"] = default_graph
 
         headers = {"Accept": _response_mime_types[self.returnFormat]}
 
         args = dict(self.kwargs)
-        args.update(url=self.query_endpoint)
 
         # merge params/headers dicts
         args.setdefault("params", {})
@@ -94,47 +90,46 @@ def query(self, query, default_graph=None):
 
         if self.method == "GET":
             args["params"].update(params)
+            qsa = "?" + urlencode(args["params"])
+            try:
+                res = urlopen(Request(self.query_endpoint + qsa, headers=args["headers"]))
+            except Exception as e:
+                raise ValueError("You did something wrong formulating either the URI or your SPARQL query") from e
         elif self.method == "POST":
             args["headers"].update({"Content-Type": "application/sparql-query"})
-            args["data"] = params
+            try:
+                res = urlopen(Request(self.query_endpoint, data=query.encode(), headers=args["headers"]))
+            except HTTPError as e:
+                return e.code, str(e), None
         else:
             raise SPARQLConnectorException("Unknown method %s" % self.method)
-
-        res = self.session.request(self.method, **args)
-
-        res.raise_for_status()
-
         return Result.parse(
-            BytesIO(res.content), content_type=res.headers["Content-type"]
+            BytesIO(res.read()), content_type=res.headers["Content-Type"].split(";")[0]
         )
 
-    def update(self, update, default_graph=None):
+    def update(self, query, default_graph: str = None, named_graph: str = None):
         if not self.update_endpoint:
             raise SPARQLConnectorException("Query endpoint not set!")
 
         params = {}
 
-        if default_graph:
+        if default_graph is not None:
             params["using-graph-uri"] = default_graph
 
+        if named_graph is not None:
+            params["using-named-graph-uri"] = named_graph
+
         headers = {
             "Accept": _response_mime_types[self.returnFormat],
             "Content-Type": "application/sparql-update",
         }
 
-        args = dict(self.kwargs)
-
-        args.update(url=self.update_endpoint, data=update.encode("utf-8"))
+        args = dict(self.kwargs)  # other QSAs
 
-        # merge params/headers dicts
         args.setdefault("params", {})
         args["params"].update(params)
         args.setdefault("headers", {})
         args["headers"].update(headers)
 
-        res = self.session.post(**args)
-
-        res.raise_for_status()
-
-    def close(self):
-        self.session.close()
+        qsa = "?" + urlencode(args["params"])
+        res = urlopen(Request(self.update_endpoint + qsa, data=query.encode(), headers=args["headers"]))