Skip to content

triplestore_extend

A module that adds additional functionality to triplestore

Tripper (Triplestore)

Class that provides additional methods for handling data in the triplestore, such as get_value, add_data and add_interpolation_source.

Source code in tripper/triplestore_extend.py
class Tripper(Triplestore):
    """
    Class that provides additional
    methods for handling data in the triplestore,
    such as get_value, add_data and add_interpolation_source.
    """

    def add_data(
        self,
        func: "Union[Callable, Literal]",
        iri: "Optional[Union[str, Sequence]]" = None,
        configurations: "Optional[dict]" = None,
        base_iri: "Optional[str]" = None,
        standard: str = "emmo",
        cost: "Optional[Union[float, Callable]]" = None,
    ) -> str:
        """Register a data source to the triplestore.

        Parameters:
            func: A callable that should return the value of the registered
                data source.  It is called with following protopype:

                    func(returns, configurations, triplestore)

                The returned value may in principle be of any type, but for
                values with unit, it is recommended to return a
                tripper.mappings.Value object.
                Alternatively, `func` may also be a literal value.
            iri: IRI of ontological concept or individual that the data
                returned by `func` should be mapped to.  If `func` is a
                callable and multiple values are returned, it may also be
                given as a sequenceof IRIs.
                If not given, it will default to a new blank node.
            configurations: Configurations passed on to `func`.
            base_iri: Base of the IRI representing the function in the
                knowledge base.  Defaults to the base IRI of the triplestore.
            standard: Name of ontological standard to use when describing the
                function.  Valid values are:
                - "emmo": Elementary Multiperspective Material Ontology (EMMO)
                - "fno": Function Ontology (FnO)
            cost: User-defined cost of following this mapping relation
                represented as a float.  It may be given either as a
                float or as a callable taking the same arguments as `func`
                returning the cost as a float.

        Returns:
            IRI of data source.
        """
        if iri is None:
            # pylint complains about uuid being unused if we make this an
            # f-string
            iri = "_bnode_" + str(uuid.uuid4())
        data_source = "_data_source_" + random_string(8)
        self.add((data_source, RDF.type, DataSource))

        if isinstance(func, Literal):
            self.add((data_source, hasDataValue, func))
            if cost is not None:
                self._add_cost(cost, data_source)
            if isinstance(iri, str):
                self.map(data_source, iri)
            else:
                raise TypeError("literal data can only have a single `iri`")

        elif callable(func):

            def fn():
                return func(iri, configurations, self)

            # Include data source IRI in documentation to ensure that the
            # function_id of `fn()` will differ for different data sources...
            fn.__doc__ = (
                f"Function for data source: {data_source}.\n\n{func.__doc__}"
            )
            fn.__name__ = func.__name__

            func_iri = self.add_function(
                fn,
                expects=(),
                returns=iri,
                base_iri=base_iri,
                standard=standard,
                cost=cost,
            )
            self.add((data_source, hasAccessFunction, func_iri))
        else:
            raise TypeError(
                f"`func` must be a callable or literal, got {type(func)}"
            )

        return data_source

    def get_value(
        self,
        iri,
        routeno=0,
        unit: "Optional[str]" = None,
        magnitude: bool = False,
        quantity: "Optional[Any]" = None,
        **kwargs,
    ) -> "Value":
        """Return the value of an individual.

        Parameters:
            iri: IRI of individual who's value we want to return.  IRI may
                either refer to a data source or an individual mapped to
                an ontological concept.
            routeno: Number identifying the mapping route to apply for
                retrieving the individual value in case IRI does not refer
                to a data source.
            unit: return the result in the given unit.
                Implies `magnitude=True`.
            magnitude: Whether to only return the magnitude of the evaluated
                value (with no unit).
            quantity: Quantity class to use for evaluation.  Defaults to pint.
            kwargs: Additional arguments passed on to `mapping_routes()`.

        Returns:
            The value of the individual.
        """
        from tripper.mappings import (  # pylint: disable=import-outside-toplevel
            Value,
            mapping_routes,
        )

        if self.has(iri, RDF.type, DataSource):
            # `iri` refer to a DataSource
            if self.has(iri, hasDataValue):  # literal value
                return Value(
                    value=parse_literal(
                        self.value(iri, hasDataValue)
                    ).to_python(),
                    unit=(
                        parse_literal(self.value(iri, hasUnit)).to_python()
                        if self.has(iri, hasUnit)
                        else None
                    ),
                    iri=self.value(iri, MAP.mapsTo),
                    cost=(
                        parse_literal(self.value(iri, hasCost)).to_python()
                        if self.has(iri, hasCost)
                        else 0.0
                    ),
                ).get_value(unit=unit, magnitude=magnitude, quantity=quantity)

            if self.has(iri, hasAccessFunction):  # callable
                func_iri = self.value(iri, hasAccessFunction)
                func = self.function_repo[func_iri]
                assert callable(func)  # nosec
                retval = func()
                if isinstance(retval, Value):
                    return retval.get_value(
                        unit=unit, magnitude=magnitude, quantity=quantity
                    )
                return retval

            raise TripperError(
                f"data source {iri} has neither a 'hasDataValue' or a "
                f"'hasAccessFunction' property"
            )

        # `iri` correspond to an individual mapped to an ontological concept.
        # In this case we check if there exists a mapping route.
        routes = mapping_routes(
            target=iri,
            sources=list(self.subjects(RDF.type, DataSource)),
            triplestore=self,
            **kwargs,
        )
        if isinstance(routes, Value):
            return routes.get_value(
                unit=unit, magnitude=magnitude, quantity=quantity
            )
        return routes.eval(
            routeno=routeno,
            unit=unit,
            magnitude=magnitude,
            quantity=quantity,
        )

    def add_interpolation_source(  # pylint: disable=too-many-arguments
        self,
        xcoord: str,
        ycoord: str,
        input_iri: str,
        output_iri: str,
        base_iri: "Optional[str]" = None,
        standard: str = "emmo",
        cost: "Optional[Union[float, Callable]]" = None,
        left: "Optional[float]" = None,
        right: "Optional[float]" = None,
        period: "Optional[float]" = None,
    ) -> str:
        """Add data source to triplestore, such that it can be used to
        transparently transform other data.

        No data will be fetch before it is actually needed.

        Parameters:
            xcoord: IRI of data source with x-coordinates `xp`.  Must be
                increasing if argument `period` is not specified. Otherwise,
                `xp` is internally sorted after normalising the periodic
                boundaries with ``xp = xp % period``.
            ycoord: IRI of data source with y-coordinates `yp`.  Must have
                the same length as `xp`.
            input_iri: IRI of ontological concept that interpolation input-
                data should be mapped to.
            output_iri: IRI of ontological concept that interpolation output-
                data should be mapped to.
            base_iri: Base of the IRI representing the transformation in the
                knowledge base.  Defaults to the base IRI of the triplestore.
            standard: Name of ontology to use when describing the
                transformation.  Valid values are:
                - "emmo": Elementary Multiperspective Material Ontology (EMMO)
                - "fno": Function Ontology (FnO)
            cost: User-defined cost of following this mapping relation
                represented as a float.  It may be given either as a
                float or as a callable taking the same arguments as `func`
                returning the cost as a float.
            left: Value to return for `x < xp[0]`, default is `fp[0]`.
            right: Value to return for `x > xp[-1]`, default is `fp[-1]`.
            period: A period for the x-coordinates. This parameter allows the
                proper interpolation of angular x-coordinates. Parameters
                `left` and `right` are ignored if `period` is specified.

        Returns:
            transformation_iri: IRI of the added transformation.

        """
        try:
            import numpy as np  # pylint: disable=import-outside-toplevel
        except ImportError as exc:
            raise RuntimeError(
                "Triplestore.add_interpolation_source() requires numpy.\n"
                "Install it with\n\n"
                "    pip install numpy"
            ) from exc

        def func(x):
            xp = self.get_value(xcoord)
            fp = self.get_value(ycoord)
            return np.interp(
                x,
                xp=xp,
                fp=fp,
                left=left,
                right=right,
                period=period,
            )

        return self.add_function(
            func,
            expects=input_iri,
            returns=output_iri,
            base_iri=base_iri,
            standard=standard,
            cost=cost,
        )

add_data(self, func, iri=None, configurations=None, base_iri=None, standard='emmo', cost=None)

Register a data source to the triplestore.

Parameters:

Name Type Description Default
func 'Union[Callable, Literal]'

A callable that should return the value of the registered data source. It is called with following protopype:

func(returns, configurations, triplestore)

The returned value may in principle be of any type, but for values with unit, it is recommended to return a tripper.mappings.Value object. Alternatively, func may also be a literal value.

required
iri 'Optional[Union[str, Sequence]]'

IRI of ontological concept or individual that the data returned by func should be mapped to. If func is a callable and multiple values are returned, it may also be given as a sequenceof IRIs. If not given, it will default to a new blank node.

None
configurations 'Optional[dict]'

Configurations passed on to func.

None
base_iri 'Optional[str]'

Base of the IRI representing the function in the knowledge base. Defaults to the base IRI of the triplestore.

None
standard str

Name of ontological standard to use when describing the function. Valid values are: - "emmo": Elementary Multiperspective Material Ontology (EMMO) - "fno": Function Ontology (FnO)

'emmo'
cost 'Optional[Union[float, Callable]]'

User-defined cost of following this mapping relation represented as a float. It may be given either as a float or as a callable taking the same arguments as func returning the cost as a float.

None

Returns:

Type Description
str

IRI of data source.

Source code in tripper/triplestore_extend.py
def add_data(
    self,
    func: "Union[Callable, Literal]",
    iri: "Optional[Union[str, Sequence]]" = None,
    configurations: "Optional[dict]" = None,
    base_iri: "Optional[str]" = None,
    standard: str = "emmo",
    cost: "Optional[Union[float, Callable]]" = None,
) -> str:
    """Register a data source to the triplestore.

    Parameters:
        func: A callable that should return the value of the registered
            data source.  It is called with following protopype:

                func(returns, configurations, triplestore)

            The returned value may in principle be of any type, but for
            values with unit, it is recommended to return a
            tripper.mappings.Value object.
            Alternatively, `func` may also be a literal value.
        iri: IRI of ontological concept or individual that the data
            returned by `func` should be mapped to.  If `func` is a
            callable and multiple values are returned, it may also be
            given as a sequenceof IRIs.
            If not given, it will default to a new blank node.
        configurations: Configurations passed on to `func`.
        base_iri: Base of the IRI representing the function in the
            knowledge base.  Defaults to the base IRI of the triplestore.
        standard: Name of ontological standard to use when describing the
            function.  Valid values are:
            - "emmo": Elementary Multiperspective Material Ontology (EMMO)
            - "fno": Function Ontology (FnO)
        cost: User-defined cost of following this mapping relation
            represented as a float.  It may be given either as a
            float or as a callable taking the same arguments as `func`
            returning the cost as a float.

    Returns:
        IRI of data source.
    """
    if iri is None:
        # pylint complains about uuid being unused if we make this an
        # f-string
        iri = "_bnode_" + str(uuid.uuid4())
    data_source = "_data_source_" + random_string(8)
    self.add((data_source, RDF.type, DataSource))

    if isinstance(func, Literal):
        self.add((data_source, hasDataValue, func))
        if cost is not None:
            self._add_cost(cost, data_source)
        if isinstance(iri, str):
            self.map(data_source, iri)
        else:
            raise TypeError("literal data can only have a single `iri`")

    elif callable(func):

        def fn():
            return func(iri, configurations, self)

        # Include data source IRI in documentation to ensure that the
        # function_id of `fn()` will differ for different data sources...
        fn.__doc__ = (
            f"Function for data source: {data_source}.\n\n{func.__doc__}"
        )
        fn.__name__ = func.__name__

        func_iri = self.add_function(
            fn,
            expects=(),
            returns=iri,
            base_iri=base_iri,
            standard=standard,
            cost=cost,
        )
        self.add((data_source, hasAccessFunction, func_iri))
    else:
        raise TypeError(
            f"`func` must be a callable or literal, got {type(func)}"
        )

    return data_source

add_interpolation_source(self, xcoord, ycoord, input_iri, output_iri, base_iri=None, standard='emmo', cost=None, left=None, right=None, period=None)

Add data source to triplestore, such that it can be used to transparently transform other data.

No data will be fetch before it is actually needed.

Parameters:

Name Type Description Default
xcoord str

IRI of data source with x-coordinates xp. Must be increasing if argument period is not specified. Otherwise, xp is internally sorted after normalising the periodic boundaries with xp = xp % period.

required
ycoord str

IRI of data source with y-coordinates yp. Must have the same length as xp.

required
input_iri str

IRI of ontological concept that interpolation input- data should be mapped to.

required
output_iri str

IRI of ontological concept that interpolation output- data should be mapped to.

required
base_iri 'Optional[str]'

Base of the IRI representing the transformation in the knowledge base. Defaults to the base IRI of the triplestore.

None
standard str

Name of ontology to use when describing the transformation. Valid values are: - "emmo": Elementary Multiperspective Material Ontology (EMMO) - "fno": Function Ontology (FnO)

'emmo'
cost 'Optional[Union[float, Callable]]'

User-defined cost of following this mapping relation represented as a float. It may be given either as a float or as a callable taking the same arguments as func returning the cost as a float.

None
left 'Optional[float]'

Value to return for x < xp[0], default is fp[0].

None
right 'Optional[float]'

Value to return for x > xp[-1], default is fp[-1].

None
period 'Optional[float]'

A period for the x-coordinates. This parameter allows the proper interpolation of angular x-coordinates. Parameters left and right are ignored if period is specified.

None

Returns:

Type Description
transformation_iri

IRI of the added transformation.

Source code in tripper/triplestore_extend.py
def add_interpolation_source(  # pylint: disable=too-many-arguments
    self,
    xcoord: str,
    ycoord: str,
    input_iri: str,
    output_iri: str,
    base_iri: "Optional[str]" = None,
    standard: str = "emmo",
    cost: "Optional[Union[float, Callable]]" = None,
    left: "Optional[float]" = None,
    right: "Optional[float]" = None,
    period: "Optional[float]" = None,
) -> str:
    """Add data source to triplestore, such that it can be used to
    transparently transform other data.

    No data will be fetch before it is actually needed.

    Parameters:
        xcoord: IRI of data source with x-coordinates `xp`.  Must be
            increasing if argument `period` is not specified. Otherwise,
            `xp` is internally sorted after normalising the periodic
            boundaries with ``xp = xp % period``.
        ycoord: IRI of data source with y-coordinates `yp`.  Must have
            the same length as `xp`.
        input_iri: IRI of ontological concept that interpolation input-
            data should be mapped to.
        output_iri: IRI of ontological concept that interpolation output-
            data should be mapped to.
        base_iri: Base of the IRI representing the transformation in the
            knowledge base.  Defaults to the base IRI of the triplestore.
        standard: Name of ontology to use when describing the
            transformation.  Valid values are:
            - "emmo": Elementary Multiperspective Material Ontology (EMMO)
            - "fno": Function Ontology (FnO)
        cost: User-defined cost of following this mapping relation
            represented as a float.  It may be given either as a
            float or as a callable taking the same arguments as `func`
            returning the cost as a float.
        left: Value to return for `x < xp[0]`, default is `fp[0]`.
        right: Value to return for `x > xp[-1]`, default is `fp[-1]`.
        period: A period for the x-coordinates. This parameter allows the
            proper interpolation of angular x-coordinates. Parameters
            `left` and `right` are ignored if `period` is specified.

    Returns:
        transformation_iri: IRI of the added transformation.

    """
    try:
        import numpy as np  # pylint: disable=import-outside-toplevel
    except ImportError as exc:
        raise RuntimeError(
            "Triplestore.add_interpolation_source() requires numpy.\n"
            "Install it with\n\n"
            "    pip install numpy"
        ) from exc

    def func(x):
        xp = self.get_value(xcoord)
        fp = self.get_value(ycoord)
        return np.interp(
            x,
            xp=xp,
            fp=fp,
            left=left,
            right=right,
            period=period,
        )

    return self.add_function(
        func,
        expects=input_iri,
        returns=output_iri,
        base_iri=base_iri,
        standard=standard,
        cost=cost,
    )

get_value(self, iri, routeno=0, unit=None, magnitude=False, quantity=None, **kwargs)

Return the value of an individual.

Parameters:

Name Type Description Default
iri

IRI of individual who's value we want to return. IRI may either refer to a data source or an individual mapped to an ontological concept.

required
routeno

Number identifying the mapping route to apply for retrieving the individual value in case IRI does not refer to a data source.

0
unit 'Optional[str]'

return the result in the given unit. Implies magnitude=True.

None
magnitude bool

Whether to only return the magnitude of the evaluated value (with no unit).

False
quantity 'Optional[Any]'

Quantity class to use for evaluation. Defaults to pint.

None
kwargs

Additional arguments passed on to mapping_routes().

{}

Returns:

Type Description
'Value'

The value of the individual.

Source code in tripper/triplestore_extend.py
def get_value(
    self,
    iri,
    routeno=0,
    unit: "Optional[str]" = None,
    magnitude: bool = False,
    quantity: "Optional[Any]" = None,
    **kwargs,
) -> "Value":
    """Return the value of an individual.

    Parameters:
        iri: IRI of individual who's value we want to return.  IRI may
            either refer to a data source or an individual mapped to
            an ontological concept.
        routeno: Number identifying the mapping route to apply for
            retrieving the individual value in case IRI does not refer
            to a data source.
        unit: return the result in the given unit.
            Implies `magnitude=True`.
        magnitude: Whether to only return the magnitude of the evaluated
            value (with no unit).
        quantity: Quantity class to use for evaluation.  Defaults to pint.
        kwargs: Additional arguments passed on to `mapping_routes()`.

    Returns:
        The value of the individual.
    """
    from tripper.mappings import (  # pylint: disable=import-outside-toplevel
        Value,
        mapping_routes,
    )

    if self.has(iri, RDF.type, DataSource):
        # `iri` refer to a DataSource
        if self.has(iri, hasDataValue):  # literal value
            return Value(
                value=parse_literal(
                    self.value(iri, hasDataValue)
                ).to_python(),
                unit=(
                    parse_literal(self.value(iri, hasUnit)).to_python()
                    if self.has(iri, hasUnit)
                    else None
                ),
                iri=self.value(iri, MAP.mapsTo),
                cost=(
                    parse_literal(self.value(iri, hasCost)).to_python()
                    if self.has(iri, hasCost)
                    else 0.0
                ),
            ).get_value(unit=unit, magnitude=magnitude, quantity=quantity)

        if self.has(iri, hasAccessFunction):  # callable
            func_iri = self.value(iri, hasAccessFunction)
            func = self.function_repo[func_iri]
            assert callable(func)  # nosec
            retval = func()
            if isinstance(retval, Value):
                return retval.get_value(
                    unit=unit, magnitude=magnitude, quantity=quantity
                )
            return retval

        raise TripperError(
            f"data source {iri} has neither a 'hasDataValue' or a "
            f"'hasAccessFunction' property"
        )

    # `iri` correspond to an individual mapped to an ontological concept.
    # In this case we check if there exists a mapping route.
    routes = mapping_routes(
        target=iri,
        sources=list(self.subjects(RDF.type, DataSource)),
        triplestore=self,
        **kwargs,
    )
    if isinstance(routes, Value):
        return routes.get_value(
            unit=unit, magnitude=magnitude, quantity=quantity
        )
    return routes.eval(
        routeno=routeno,
        unit=unit,
        magnitude=magnitude,
        quantity=quantity,
    )