diff env/lib/python3.7/site-packages/rdflib/plugins/parsers/hturtle.py @ 5:9b1c78e6ba9c draft default tip

"planemo upload commit 6c0a8142489327ece472c84e558c47da711a9142"
author shellac
date Mon, 01 Jun 2020 08:59:25 -0400
parents 79f47841a781
children
line wrap: on
line diff
--- a/env/lib/python3.7/site-packages/rdflib/plugins/parsers/hturtle.py	Thu May 14 16:47:39 2020 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,114 +0,0 @@
-# -*- coding: utf-8 -*-
-"""
-Extraction parser RDF embedded verbatim into HTML or XML files. This is based
-on:
-
-* The specification on embedding turtle into html:
-    http://www.w3.org/TR/turtle/#in-html
-
-For SVG (and currently SVG only) the method also extracts an embedded RDF/XML
-data, per SVG specification
-
-License: W3C Software License,
-http://www.w3.org/Consortium/Legal/copyright-software
-Author: Ivan Herman
-Copyright: W3C
-"""
-
-from rdflib.parser import Parser
-from .pyRdfa import pyRdfa, Options
-from .pyRdfa.state import ExecutionContext
-from .pyRdfa.embeddedRDF import handle_embeddedRDF
-from .structureddata import _get_orig_source, _check_error
-
-try:
-    import html5lib
-    assert html5lib
-    html5lib = True
-except ImportError:
-    import warnings
-    warnings.warn(
-        'html5lib not found! RDFa and Microdata parsers ' +
-        'will not be available.')
-    html5lib = False
-
-
-class HTurtle(pyRdfa):
-    """
-    Bastardizing the RDFa 1.1 parser to do a hturtle extractions
-    """
-    def __init__(self, options=None, base="", media_type=""):
-        pyRdfa.__init__(self, options=options, base=base,
-                        media_type=media_type, rdfa_version="1.1")
-
-    def graph_from_DOM(self, dom, graph, pgraph=None):
-        """
-        Stealing the parsing function from the original class, to do
-        turtle extraction only
-        """
-
-        def copyGraph(tog, fromg):
-            for t in fromg:
-                tog.add(t)
-            for k, ns in fromg.namespaces():
-                tog.bind(k, ns)
-
-        def _process_one_node(node, graph, state):
-            if handle_embeddedRDF(node, graph, state):
-                # we got an RDF content that has been extracted into Graph;
-                # the recursion should stop
-                return
-            else:
-                # recurse through all the child elements of the current node
-                for n in node.childNodes:
-                    if n.nodeType == node.ELEMENT_NODE:
-                        _process_one_node(n, graph, state)
-
-        topElement = dom.documentElement
-        state = ExecutionContext(topElement, graph, base=self.base,
-                                 options=self.options, rdfa_version="1.1")
-        _process_one_node(topElement, graph, state)
-        if pgraph is not None:
-            copyGraph(pgraph, self.options.processor_graph.graph)
-
-# This is the parser interface as it would look when called from the rest of
-# RDFLib
-
-
-class HTurtleParser(Parser):
-    def parse(self, source, graph, pgraph=None, media_type=""):
-        """
-        @param source: one of the input sources that the RDFLib package defined
-        @type source: InputSource class instance
-        @param graph: target graph for the triples; output graph, in RDFa spec.
-        parlance
-        @type graph: RDFLib Graph
-        @keyword media_type: explicit setting of the preferred media type
-        (a.k.a. content type) of the the RDFa source. None means the content
-        type of the HTTP result is used, or a guess is made based on the
-        suffix of a file
-        @type media_type: string
-        """
-        if html5lib is False:
-            raise ImportError(
-                'html5lib is not installed, cannot ' +
-                'use RDFa and Microdata parsers.')
-
-        (baseURI, orig_source) = _get_orig_source(source)
-        self._process(
-            graph, pgraph, baseURI, orig_source, media_type=media_type)
-
-    def _process(self, graph, baseURI, orig_source, media_type=""):
-        self.options = Options(output_processor_graph=None,
-                               embedded_rdf=True,
-                               vocab_expansion=False,
-                               vocab_cache=False)
-
-        if media_type is None:
-            media_type = ""
-        processor = HTurtle(
-            self.options, base=baseURI, media_type=media_type)
-        processor.graph_from_source(
-            orig_source, graph=graph, pgraph=None, rdfOutput=False)
-        # get possible error triples to raise exceptions
-        _check_error(graph)