forked from minhnh/rdf-utils
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
* handle lists of lists & expand_curie exception - add recursive functions to iterate over lists of lists - add method optionally mute exception for expand_curie - address minhnh#8 * add unittest for collection module - add test for parsing list of lists and URIs - add test for assertion for container with loops - update rdflib version requirement - handle URIRef type in list parsing - change variable names to better match function behaviour
- Loading branch information
Showing
7 changed files
with
169 additions
and
5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,3 +1,5 @@ | ||
# SPDX-License-Identifier: MPL-2.0 | ||
from importlib.metadata import version | ||
|
||
RDF_UTILS_VERSION = version("rdf-utils") | ||
|
||
__version__ = version("rdf-utils") |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,66 @@ | ||
# SPDX-License-Identifier: MPL-2.0 | ||
from typing import Any | ||
from rdflib import Graph, BNode, IdentifiedNode, Literal, URIRef | ||
from rdf_utils.uri import try_expand_curie | ||
|
||
|
||
def _load_list_re( | ||
graph: Graph, first_node: BNode, node_set: set[IdentifiedNode], parse_uri: bool, quiet: bool | ||
) -> list[Any]: | ||
"""Recursive internal function to extract list of lists from RDF list containers.""" | ||
list_data = [] | ||
for node in graph.items(list=first_node): | ||
if isinstance(node, URIRef): | ||
list_data.append(node) | ||
continue | ||
|
||
if isinstance(node, Literal): | ||
node_val = node.toPython() | ||
if not isinstance(node_val, str): | ||
list_data.append(node_val) | ||
continue | ||
|
||
if not parse_uri: | ||
list_data.append(node_val) | ||
continue | ||
|
||
# try to expand short-form URIs, | ||
# if doesn't work then just return URIRef of the string | ||
uri = try_expand_curie( | ||
ns_manager=graph.namespace_manager, curie_str=node_val, quiet=quiet | ||
) | ||
if uri is None: | ||
uri = URIRef(node_val) | ||
|
||
list_data.append(uri) | ||
continue | ||
|
||
assert isinstance( | ||
node, BNode | ||
), f"load_collections: node '{node}' not a Literal or BNode, type: {type(node)}" | ||
|
||
if node in node_set: | ||
raise RuntimeError(f"Loop detected in collection at node: {node}") | ||
node_set.add(node) | ||
|
||
# recursive call | ||
list_data.append(_load_list_re(graph, node, node_set, parse_uri, quiet)) | ||
|
||
return list_data | ||
|
||
|
||
def load_list_re( | ||
graph: Graph, first_node: BNode, parse_uri: bool = True, quiet: bool = True | ||
) -> list[Any]: | ||
"""!Recursively iterate over RDF list containers for extracting lists of lists. | ||
@param graph Graph object to extract the list(s) from | ||
@param first_node First element in the list | ||
@param parse_uri if True will try converting literals into URIRef | ||
@param quiet if True will not throw exceptions other than loop detection | ||
@exception RuntimeError Raised when a loop is detected | ||
@exception ValueError Raised when `quiet` is `False` and short URI cannot be expanded | ||
""" | ||
node_set = set() | ||
|
||
return _load_list_re(graph, first_node, node_set, parse_uri, quiet) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,68 @@ | ||
# SPDX-License-Identifier: MPL-2.0 | ||
import unittest | ||
from rdflib import RDF, BNode, Graph, URIRef | ||
from rdf_utils.collection import load_list_re | ||
from rdf_utils.uri import URL_SECORO_M, try_expand_curie | ||
|
||
|
||
CORRECT_LIST_MODEL = f""" | ||
{{ | ||
"@context": {{ | ||
"test": "{URL_SECORO_M}/tests/collection/", | ||
"TestNode": {{ "@id": "test:TestNode" }}, | ||
"test-cont": {{ "@id": "test:has-container", "@container": "@list", "@type": "@id" }} | ||
}}, | ||
"@graph": [ | ||
{{ "@id": "test:node1", "@type": "test:TestNode" }}, | ||
{{ "@id": "test:node2", "@type": "test:TestNode" }}, | ||
{{ "@id": "test:node3", "@type": "test:TestNode" }}, | ||
{{ | ||
"@id": "test:cont-node", "@type": "test:TestNode", | ||
"test-cont": [ | ||
["test:node1", "test:node2"], | ||
"test-node3" | ||
] | ||
}} | ||
] | ||
}} | ||
""" | ||
|
||
|
||
class CollectionTest(unittest.TestCase): | ||
def test_load_list_re(self): | ||
correct_g = Graph() | ||
correct_g.parse(data=CORRECT_LIST_MODEL, format="json-ld") | ||
|
||
cont_node_uri = try_expand_curie( | ||
ns_manager=correct_g.namespace_manager, curie_str="test:cont-node", quiet=False | ||
) | ||
assert cont_node_uri is not None | ||
cont_pred_uri = try_expand_curie( | ||
ns_manager=correct_g.namespace_manager, curie_str="test:has-container", quiet=False | ||
) | ||
assert cont_pred_uri is not None | ||
|
||
cont_bnode = correct_g.value(subject=cont_node_uri, predicate=cont_pred_uri) | ||
assert isinstance(cont_bnode, BNode) | ||
cont_list = load_list_re( | ||
graph=correct_g, first_node=cont_bnode, parse_uri=True, quiet=False | ||
) | ||
self.assertTrue(len(cont_list[0]) == 2) | ||
self.assertIsInstance(cont_list[1], URIRef) | ||
|
||
def test_loop_exception(self): | ||
loop_g = Graph() | ||
b1 = BNode() | ||
b2 = BNode() | ||
loop_g.add((b1, RDF.first, b2)) | ||
loop_g.add((b1, RDF.rest, RDF.nil)) | ||
loop_g.add((b2, RDF.first, b1)) | ||
loop_g.add((b2, RDF.rest, RDF.nil)) | ||
with self.assertRaises( | ||
RuntimeError, msg="test load_list_re: graph with loop should raise exception" | ||
): | ||
_ = load_list_re(graph=loop_g, first_node=b1) | ||
|
||
|
||
if __name__ == "__main__": | ||
unittest.main() |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters