EMMC-ASBL · jesper-friis · Nov 19, 2025 · Nov 19, 2025 · Nov 19, 2025 · Nov 19, 2025
diff --git a/pyproject.toml b/pyproject.toml
@@ -42,8 +42,11 @@ units = [
 mappings = [
     "tripper[units]",
 ]
+search = [
+    "sparql-builder @ git+https://github.com/PINK-project/SPARQL-builder@master",
+]
 datadoc = [
-    "tripper[mappings]",
+    "tripper[mappings]",  # todo: add requirement on the `search` extra
     "keyring>=22.0.0,<25.6.1",
     "PyLD>=2.0.0,<2.0.5; python_version<='3.13'",
     "PyYaml>=3.0.0,<6.0.3",  # todo: check lower version

diff --git a/tripper/search.py b/tripper/search.py
@@ -0,0 +1,113 @@
+"""Module providing a simple interface to SPARQL queries.
+
+This module is not imported by default, since it depends on the
+excellent `SPARQL-builder` package developed by 7P9 in the PINK project.
+"""
+
+from typing import TYPE_CHECKING
+
+from sparqlbuilder import select
+
+if TYPE_CHECKING:  # pragma: no cover
+    from typing import IO, Optional, Sequence, Tuple
+
+    from tripper.datadoc.context import ContextType
+    from tripper.datadoc.keywords import KeywordsType
+
+
+def make_query(
+    criteria: "Sequence[Tuple]" = (),
+    type: "Optional[str]" = None,
+    skipblanks: "bool" = True,
+    distinct: "bool" = True,
+    reduced: "bool" = False,
+    limit: "Optional[int]" = None,
+    offset: "int" = 0,
+    keywords: "Optional[KeywordsType]" = None,
+    context: "Optional[ContextType]" = None,
+    prefixes: "Optional[dict]" = None,
+) -> "str":
+    """Creates a SPARQL query to find resources in a knowledge base.
+
+    The returned query will return the IRIs of all resources that match the
+    criteria specified in the arguments.
+
+    Arguments:
+        criteria: A sequence of tuples describing a set of matching criteria
+            that all must be met.
+
+                (pred, obj, [spec])
+
+
+        type: Either a [resource type] (ex: "Dataset", "Distribution", ...)
+            or the IRI of a class to limit the search to.
+        skipblanks: Whether the query will skip matching blank nodes.
+        distinct: Whether the query will filter out duplicated matches.
+        reduced: A weaker version of `distinct` that may eliminate
+            some duplicates but is not required to eliminate all
+            duplicates. This can be more efficient than `distinct` in
+            some query engines. `distinct` and `reduced` are mutually
+            exclusive.
+        limit: Limit the number of returned IRIs to this number.
+        offset: The index of the first returned IRI. `offset` is often used
+            in combination with `limit` for pagination.
+        keywords: Keywords instance defining prefixes and keywords for
+            use in `criteria`.
+        context: Context instance defining prefixes and keywords for
+            use in `criteria`.  Extends what has been provided by `keywords`.
+        prefixes: Additional prefixes to use in criteria.
+
+    Returns:
+        A string with a SPARQL query that can be passed to the
+        `Triplestore.query()` method.
+
+    Examples:
+
+        Alternative ways to search for all datasets:
+
+        ```
+        >>> q = make_query(criteria=[("rdf:type", "dcat:Dataset")])
+        >>> q = make_query(type="dcat:Dataset")  # use `type` argument
+        >>> q = make_query(type="Dataset")  # refer to a pre-defined keyword
+        ```
+
+        Search for all datasets created by a given agent:
+
+        ```
+        >>> q = make_query(
+        ...     type="Dataset",
+        ...     criteria=[("creator", "kb:JohnDow")],
+        ... )
+        ```
+
+        alternatively:
+
+        ```
+        >>> q = make_query(
+        ...     criteria=[("rdf:type", "Dataset"), ("creator", "kb:JohnDow")],
+        ... )
+        ```
+
+        Match all datasets that have a creator, regardless of who:
+
+        ```
+        >>> q = make_query(
+        ...     type="Dataset",
+        ...     criteria=[("creator", None)],
+        ... )
+        ```
+
+        Use regular expressions to match all resources that have a label that
+        ends with "Atom":
+
+        ```
+        >>> q = make_query(
+        ...     criteria=[("rdfs:label", ".+Atom", "regex")],
+        ... )
+        ```
+
+
+    """
+
+
+# make_query(prefixes=ts.namespaces)