Skip to content

Commit

Permalink
Merge branch 'master' into update-emmocheck2
Browse files Browse the repository at this point in the history
  • Loading branch information
jesper-friis authored Dec 12, 2024
2 parents 8fcc5d8 + de542a3 commit 5c642a9
Show file tree
Hide file tree
Showing 3 changed files with 130 additions and 2 deletions.
83 changes: 81 additions & 2 deletions ontopy/ontology.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@
import uuid
import tempfile
import types
import re
from pathlib import Path
from collections import defaultdict
from collections.abc import Iterable
Expand Down Expand Up @@ -50,7 +51,7 @@
)

if TYPE_CHECKING:
from typing import List, Sequence
from typing import Iterator, List, Sequence


# Default annotations to look up
Expand Down Expand Up @@ -1364,7 +1365,7 @@ def sync_reasoner(
)

if include_imported:
ontologies = self.get_imported_ontologies(recursive=True)
ontologies = [self] + self.get_imported_ontologies(recursive=True)
else:
ontologies = [self]

Expand All @@ -1381,6 +1382,8 @@ def sync_reasoner(
# Datatype instances that are known to crash the reasoner
datatypes = (
"http://www.w3.org/2002/07/owl#rational",
"http://www.w3.org/1999/02/22-rdf-syntax-ns#HTML",
"http://www.w3.org/1999/02/22-rdf-syntax-ns#JSON",
"http://www.w3.org/2001/XMLSchema#NCName",
"http://www.w3.org/2001/XMLSchema#NMTOKEN",
"http://www.w3.org/2001/XMLSchema#Name",
Expand Down Expand Up @@ -2107,6 +2110,82 @@ def difference(self, other: owlready2.Ontology) -> set:
s2 = set(other.get_unabbreviated_triples(blank="_:b"))
return s1.difference(s2)

def find(
self, text: str, domain="world", case_sensitive=False, regex=False
) -> "Iterator":
"""A simple alternative to the Owlready2 `search()` method.
This method searches through all literal strings in the given domain.
Args:
text: Free text string to search for.
domain: Domain to search. Should be one of:
- "ontology": Current ontology.
- "imported": Current and all imported ontologies.
- "world": The world.
case_sensitive: Whether the search is case sensitive.
regex: Whether to use regular expression search.
Returns:
Iterator over `(subject, predicate, literal_string)` triples,
converted to EMMOntoPy objects.
"""
# pylint: disable=too-many-locals,too-many-branches

if domain == "ontology":
ontologies = [self]
elif domain == "imported":
ontologies = [self] + self.get_imported_ontologies(recursive=True)
elif domain == "world":
ontologies = [self.world]
else:
raise ValueError(
"`domain` must be 'ontology', 'imported' or 'world'. "
f"Got: {domain}"
)

# Define our match function
if regex:
flags = 0 if case_sensitive else re.IGNORECASE
pattern = re.compile(f"{text}", flags=flags)

def matchfun(string):
"""Match function using regex."""
return re.match(pattern, string)

else:
if not case_sensitive:
text = text.lower()

def matchfun(string):
"""Match function without regex."""
if case_sensitive:
return text in string
return text in string.lower()

ontology_storid = self.world._abbreviate(
"http://www.w3.org/2002/07/owl#Ontology"
)
for onto in ontologies:
for s, p, o, _ in onto._get_data_triples_spod_spod(
None, None, None, None
):
predicate = self.world.get(self.world._unabbreviate(p))
if isinstance(o, str) and matchfun(o):
assert isinstance(
s, int
), "subject should be a storid" # nosec
if s >= 0:
subject = self.world.get(self.world._unabbreviate(s))
if s == ontology_storid:
yield self.world.get_ontology(
subject.iri
), predicate, o
yield subject, predicate, o
else:
yield BlankNode(self.world, s), predicate, o


class BlankNode:
"""Represents a blank node.
Expand Down
44 changes: 44 additions & 0 deletions tests/ontopy_tests/test_ontology.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,44 @@
"""Test Ontology class methods."""

from ontopy import get_ontology
from ontopy.testutils import ontodir

animal = get_ontology(ontodir / "mammal.ttl").load()


def test_find():
"""Test find() method."""
m1 = (animal.chasing, animal.prefLabel, "chasing")
m2 = (animal.Mouse, animal.prefLabel, "Mouse")
# for domain in "ontology", "imported", "world":
assert m1 not in animal.find("chas", domain="ontology")
assert m2 in animal.find("Mouse", domain="ontology")
assert m2 in animal.find("Mouse", domain="ontology", regex=True)
assert m2 in animal.find("Mouse", domain="ontology", case_sensitive=True)
assert m2 in animal.find(
"Mouse", domain="ontology", regex=True, case_sensitive=True
)
assert m2 not in animal.find(
"mouse", domain="ontology", case_sensitive=True
)
assert m2 in animal.find("mouse", domain="ontology", case_sensitive=False)

assert m1 in animal.find("chas", domain="imported", regex=True)
assert m1 in animal.find("chas", domain="imported", case_sensitive=True)
assert m1 in animal.find(
"chas", domain="imported", regex=True, case_sensitive=True
)

assert m1 in animal.find("Chas", domain="imported")
assert m1 in animal.find("Chas", domain="imported", regex=True)
assert m1 not in animal.find("Chas", domain="imported", case_sensitive=True)
assert m1 not in animal.find(
"Chas", domain="imported", regex=True, case_sensitive=True
)

assert m2 not in animal.imported_ontologies[0].find(
"mouse", domain="ontology"
)
assert m2 in animal.imported_ontologies[0].find(
"mouse", domain="world", regex=True
)
5 changes: 5 additions & 0 deletions tests/test_basic.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,11 @@
from ontopy.ontology import Ontology


# if True:
# from emmopy import get_emmo
# emmo = get_emmo()


@pytest.mark.filterwarnings("ignore:adding new IRI to ontology:UserWarning")
def test_basic(emmo: "Ontology") -> None:
from ontopy import get_ontology
Expand Down

0 comments on commit 5c642a9

Please sign in to comment.