From ea60c41e00b9cfab4ed2fd4299b3d393de3d7fba Mon Sep 17 00:00:00 2001 From: dachafra Date: Tue, 5 Dec 2023 13:16:44 +0100 Subject: [PATCH] supporting blank nodes with data reference --- VERSION | 2 +- src/yatter/constants.py | 3 + src/yatter/predicateobject.py | 12 +++- src/yatter/subject.py | 4 ++ src/yatter/termmap.py | 14 ++--- test/r2rml/YARRRMLTC-r2rml-0016/mapping.ttl | 57 +++++++++++++++++++ test/r2rml/YARRRMLTC-r2rml-0016/mapping.yml | 19 +++++++ .../test_yarrrmltc_r2rml_0016.py | 27 +++++++++ 8 files changed, 129 insertions(+), 9 deletions(-) create mode 100644 test/r2rml/YARRRMLTC-r2rml-0016/mapping.ttl create mode 100644 test/r2rml/YARRRMLTC-r2rml-0016/mapping.yml create mode 100644 test/r2rml/YARRRMLTC-r2rml-0016/test_yarrrmltc_r2rml_0016.py diff --git a/VERSION b/VERSION index 9084fa2..524cb55 100644 --- a/VERSION +++ b/VERSION @@ -1 +1 @@ -1.1.0 +1.1.1 diff --git a/src/yatter/constants.py b/src/yatter/constants.py index df7387a..08d2c9e 100644 --- a/src/yatter/constants.py +++ b/src/yatter/constants.py @@ -81,6 +81,7 @@ R2RML_TERMTYPE = 'rr:termType' R2RML_LANGUAGE = 'rr:language' R2RML_IRI = 'rr:IRI' +R2RML_BLANK_NODE = 'rr:BlankNode' R2RML_LITERAL = 'rr:Literal' R2RML_REFOBJECT_CLASS = 'rr:RefObjectMap' R2RML_PARENT_TRIPLESMAP = 'rr:parentTriplesMap' @@ -92,6 +93,7 @@ R2RML_TABLE_NAME = 'rr:tableName' R2RML_COLUMN = 'rr:column' + ############################################################################## ############################# D2RQ CONSTANTS ########################### ############################################################################## @@ -154,6 +156,7 @@ YARRRML_IRI = '~iri' YARRRML_LANG = '~lang' +YARRRML_BLANK = 'blank' YARRRML_QUOTED = 'quoted' YARRRML_NON_ASSERTED = 'quotedNonAsserted' diff --git a/src/yatter/predicateobject.py b/src/yatter/predicateobject.py index 4972923..d8fa5e8 100644 --- a/src/yatter/predicateobject.py +++ b/src/yatter/predicateobject.py @@ -156,11 +156,15 @@ def add_predicate_object(data, mapping, predicate_object, mapping_format=RML_URI for om in object_list: iri = False + blank = False if type(om) == list: object_value = om[0] if YARRRML_IRI in om[0]: - object_value = om[0].split(YARRRML_IRI)[0] + object_value = om[0].split("~")[0] iri = True + if YARRRML_BLANK in om[0]: + object_value = om[0].split("~")[0] + blank = True if mapping_format == STAR_URI: template += generate_rml_termmap(STAR_OBJECT, R2RML_OBJECT_CLASS, object_value, "\t\t\t", mapping_format) @@ -195,6 +199,9 @@ def add_predicate_object(data, mapping, predicate_object, mapping_format=RML_URI if iri: template = template[0:len(template) - 5] + "\t\t\t" + R2RML_TERMTYPE + " " \ + R2RML_IRI + "\n\t\t];\n" + if blank: + template = template[0:len(template) - 5] + "\t\t\t" + R2RML_TERMTYPE + " " \ + + R2RML_BLANK_NODE + "\n\t\t];\n" elif YARRRML_MAPPING in om or YARRRML_NON_ASSERTED in om or YARRRML_QUOTED in om: if YARRRML_MAPPING in om: template += ref_mapping(data, mapping, om, YARRRML_MAPPING, R2RML_PARENT_TRIPLESMAP, mapping_format) @@ -236,6 +243,9 @@ def add_predicate_object(data, mapping, predicate_object, mapping_format=RML_URI elif om.get(YARRRML_TYPE) == "literal": template = template[0:len(template) - 5] + "\t\t\t" + R2RML_TERMTYPE + " " \ + R2RML_LITERAL + "\n\t\t];\n" + elif om.get(YARRRML_TYPE) == YARRRML_BLANK: + template = template[0:len(template) - 5] + "\t\t\t" + R2RML_TERMTYPE + " " \ + + R2RML_BLANK_NODE + "\n\t\t];\n" if YARRRML_TARGETS in om: template = template[0:len(template) - 5] + "\t\t\t" + RML_LOGICAL_TARGET + " <"+ om.get(YARRRML_TARGETS) + ">\n\t\t];\n" diff --git a/src/yatter/subject.py b/src/yatter/subject.py index cb92703..d77691d 100644 --- a/src/yatter/subject.py +++ b/src/yatter/subject.py @@ -54,6 +54,10 @@ def add_subject(data, mapping, mapping_format): if YARRRML_TARGETS in individual_subject: subject_termmap = subject_termmap[0:-3]+"\t"+RML_LOGICAL_TARGET+" <"+individual_subject[YARRRML_TARGETS]+">\n\t];\n" + if YARRRML_TYPE in individual_subject: + if individual_subject.get(YARRRML_TYPE) == YARRRML_BLANK: + subject_termmap = subject_termmap[0:-3] + "\t" + R2RML_TERMTYPE + " " + R2RML_BLANK_NODE +"\n\t];\n" + rml_subjects.append(subject_termmap) if YARRRML_GRAPHS in data.get(YARRRML_MAPPINGS).get(mapping): diff --git a/src/yatter/termmap.py b/src/yatter/termmap.py index a522707..ee2334d 100644 --- a/src/yatter/termmap.py +++ b/src/yatter/termmap.py @@ -18,8 +18,8 @@ def get_termmap_type(text, mapping_format): ## Generates a TermMap (subject, predicate, object) based on the property, class and the text -def generate_rml_termmap(rml_property, rml_class, text, identation, mapping_format=RML_URI): - template = identation[0:-1] + rml_property + " [\n"+identation+"a " + rml_class + ";\n" + identation +def generate_rml_termmap(rml_property, rml_class, text, indentation, mapping_format=RML_URI): + template = indentation[0:-1] + rml_property + " [\n"+indentation+"a " + rml_class + ";\n" + indentation term_map = get_termmap_type(text, mapping_format) if term_map == R2RML_TEMPLATE: text = generate_rml_template(text) @@ -32,16 +32,16 @@ def generate_rml_termmap(rml_property, rml_class, text, identation, mapping_form if term_map == STAR_QUOTED: if 'quoted' in text: - template += term_map + " <" + text[YARRRML_QUOTED] + "_0>;\n" + identation[0:-1] + "];\n" + template += term_map + " <" + text[YARRRML_QUOTED] + "_0>;\n" + indentation[0:-1] + "];\n" else: - template += term_map + " <" + text[YARRRML_NON_ASSERTED] + "_0>;\n" + identation[0:-1] + "];\n" + template += term_map + " <" + text[YARRRML_NON_ASSERTED] + "_0>;\n" + indentation[0:-1] + "];\n" elif term_map != "rr:constant": - template += term_map + " \"" + text + "\";\n"+identation[0:-1]+"];\n" + template += term_map + " \"" + text + "\";\n"+indentation[0:-1]+"];\n" else: if text.startswith("http"): - template += term_map + " <" + text + ">;\n" + identation[0:-1] + "];\n" + template += term_map + " <" + text + ">;\n" + indentation[0:-1] + "];\n" else: - template += term_map + " " + text + ";\n"+identation[0:-1]+"];\n" + template += term_map + " " + text + ";\n"+indentation[0:-1]+"];\n" return template diff --git a/test/r2rml/YARRRMLTC-r2rml-0016/mapping.ttl b/test/r2rml/YARRRMLTC-r2rml-0016/mapping.ttl new file mode 100644 index 0000000..7c12163 --- /dev/null +++ b/test/r2rml/YARRRMLTC-r2rml-0016/mapping.ttl @@ -0,0 +1,57 @@ +@prefix foaf: . +@prefix rdfs: . +@prefix ex: . +@prefix rr: . +@prefix rml: . +@prefix rdf: . +@prefix xsd: . +@prefix ql: . +@prefix d2rq: . +@prefix schema: . +@prefix formats: . +@prefix comp: . +@prefix void: . +@prefix fnml: . +@prefix grel: . +@base . + + + a rr:TriplesMap; + + rr:logicalTable [ + a rr:LogicalTable; + rr:tableName "Student"; + rr:sqlVersion rr:SQL2008 + ]; + rr:subjectMap [ + a rr:SubjectMap; + rr:column "Name"; + rr:termType rr:BlankNode + ]; + rr:predicateObjectMap [ + rr:predicateMap [ + a rr:PredicateMap; + rr:constant rdf:type; + ]; + rr:objectMap [ + a rr:ObjectMap; + rr:constant foaf:Person; + ]; + rr:objectMap [ + a rr:ObjectMap; + rr:constant ex:Student; + ]; + ]; + rr:predicateObjectMap [ + rr:predicateMap [ + a rr:PredicateMap; + rr:constant foaf:Name; + ]; + rr:objectMap [ + a rr:ObjectMap; + rr:column "Name"; + rr:termType rr:BlankNode + ]; + ]. + + diff --git a/test/r2rml/YARRRMLTC-r2rml-0016/mapping.yml b/test/r2rml/YARRRMLTC-r2rml-0016/mapping.yml new file mode 100644 index 0000000..7f22a3a --- /dev/null +++ b/test/r2rml/YARRRMLTC-r2rml-0016/mapping.yml @@ -0,0 +1,19 @@ +prefixes: + foaf: http://xmlns.com/foaf/0.1/ + rdfs: http://www.w3.org/2000/01/rdf-schema# + ex: http://example.com/ + +mappings: + TriplesMap1: + sources: + - table: Student + s: + value: $(Name) + type: blank + po: + - p: rdf:type + o: [foaf:Person, ex:Student] + - p: foaf:Name + o: + value: $(Name) + type: blank \ No newline at end of file diff --git a/test/r2rml/YARRRMLTC-r2rml-0016/test_yarrrmltc_r2rml_0016.py b/test/r2rml/YARRRMLTC-r2rml-0016/test_yarrrmltc_r2rml_0016.py new file mode 100644 index 0000000..9558f55 --- /dev/null +++ b/test/r2rml/YARRRMLTC-r2rml-0016/test_yarrrmltc_r2rml_0016.py @@ -0,0 +1,27 @@ +__author__ = "Marino Gonzalez Garcia" +__credits__ = ["Marino Gonzalez Garcia"] + +__license__ = "Apache-2.0" +__maintainer__ = "David Chaves-Fraga" +__email__ = "david.chaves@upm.es" + + +import os +from ruamel.yaml import YAML +import yatter +from rdflib.graph import Graph +from rdflib import compare +R2RML_URI = 'http://www.w3.org/ns/r2rml#' + + +def test_r2rml_yarrrmltc0016(): + expected_mapping = Graph() + expected_mapping.parse(os.path.join(os.path.dirname(os.path.realpath(__file__)), 'mapping.ttl'), format="ttl") + + translated_mapping = Graph() + yaml = YAML(typ='safe', pure=True) + mapping_path = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'mapping.yml') + translated_mapping.parse(data=yatter.translate(yaml.load(open(mapping_path)), mapping_format=R2RML_URI), format="ttl") + translated_mapping.serialize(destination="mapping.rml.ttl",format="ttl") + + assert compare.isomorphic(expected_mapping, translated_mapping) \ No newline at end of file