# ''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''
# Copyright (c) 2025 Mira Geoscience Ltd. '
# '
# This file is part of geoh5py. '
# '
# geoh5py is free software: you can redistribute it and/or modify '
# it under the terms of the GNU Lesser General Public License as published by '
# the Free Software Foundation, either version 3 of the License, or '
# (at your option) any later version. '
# '
# geoh5py is distributed in the hope that it will be useful, '
# but WITHOUT ANY WARRANTY; without even the implied warranty of '
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the '
# GNU Lesser General Public License for more details. '
# '
# You should have received a copy of the GNU Lesser General Public License '
# along with geoh5py. If not, see <https://www.gnu.org/licenses/>. '
# ''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''''
from __future__ import annotations
import uuid
from abc import abstractmethod
from typing import Any
import numpy as np
from ..shared import Entity
from ..shared.utils import mask_by_extent
from .data_association_enum import DataAssociationEnum
from .data_type import DataType, ReferenceDataType
from .primitive_type_enum import PrimitiveTypeEnum
class Data(Entity):
    """
    Base class for Data entities.

    :param association: Relationship made between the parent object and values.
    :param modifiable: Entity can be modified.
    :param visible: Entity is visible. Only a single data can be visible at a time.
    :param values: Data values.
    """

    _attribute_map = Entity._attribute_map.copy()
    _attribute_map.update({"Association": "association", "Modifiable": "modifiable"})

    def __init__(
        self,
        association: DataAssociationEnum = DataAssociationEnum.OBJECT,
        modifiable: bool = True,
        visible: bool = False,
        values: Any | None = None,
        **kwargs,
    ):
        # The association is validated and stored ahead of the parent
        # constructor call; it has no setter and is read-only afterwards.
        self._association = self.validate_association(association)

        super().__init__(visible=visible, **kwargs)

        self.modifiable = modifiable
        self.values = values

    def copy(
        self,
        parent=None,
        *,
        clear_cache: bool = False,
        mask: np.ndarray | None = None,
        **kwargs,
    ) -> Data:
        """
        Function to copy data to a different parent entity.

        The mask is only applied when the data holds values and its
        association is VERTEX or CELL. Values are trimmed to the mask when the
        target parent has fewer elements than the current values; otherwise a
        full-size copy is made with the masked-out entries replaced by
        :obj:`~geoh5py.data.data.Data.nan_value`.

        :param parent: Target parent to copy the entity under. Copied to current
            :obj:`~geoh5py.shared.entity.Entity.parent` if None.
        :param clear_cache: Clear array attributes after copy.
        :param mask: Array of bool defining the values to keep.
        :param kwargs: Additional keyword arguments to pass to the copy constructor.

        :raises TypeError: If the mask is used and is not a numpy array.
        :raises ValueError: If the mask is used and is not a boolean array of
            the same shape as the values.

        :return entity: Registered Entity to the workspace.
        """
        if parent is None:
            parent = self.parent

        current = self.values
        maskable = self.association in (
            DataAssociationEnum.VERTEX,
            DataAssociationEnum.CELL,
        )

        if current is not None and mask is not None and maskable:
            if not isinstance(mask, np.ndarray):
                raise TypeError("Mask must be an array or None.")

            if mask.dtype != bool or mask.shape != current.shape:
                raise ValueError(
                    f"Mask must be a boolean array of shape {current.shape}, not {mask.shape}"
                )

            # Number of elements on the target parent for this association.
            n_values = (
                parent.n_cells
                if self.association is DataAssociationEnum.CELL
                else parent.n_vertices
            )

            if n_values < current.shape[0]:
                # Target is smaller than the source: trim values to the mask.
                values = current[mask]
            else:
                # Same-size target: keep the shape, blank out rejected entries.
                values = current.copy()
                values[~mask] = self.nan_value

            kwargs["values"] = values

        return parent.workspace.copy_to_parent(
            self,
            parent,
            clear_cache=clear_cache,
            **kwargs,
        )

    def copy_from_extent(
        self,
        extent: np.ndarray,
        parent=None,
        *,
        clear_cache: bool = False,
        inverse: bool = False,
        **kwargs,
    ) -> Entity | None:
        """
        Function to copy data based on a bounding box extent.

        :param extent: Bounding box extent requested for the input entity, as supplied for
            :func:`~geoh5py.shared.entity.Entity.mask_by_extent`.
        :param parent: Target parent to copy the entity under. Copied to current
            :obj:`~geoh5py.shared.entity.Entity.parent` if None.
        :param clear_cache: Clear array attributes after copy.
        :param inverse: Keep the inverse (clip) of the extent selection.
        :param kwargs: Additional keyword arguments to pass to the copy constructor.

        :return entity: Registered Entity to the workspace, or None when no
            mask could be computed from the extent.
        """
        indices = self.mask_by_extent(extent, inverse=inverse)

        if indices is None:
            return None

        return self.copy(
            parent=parent,
            clear_cache=clear_cache,
            mask=indices,
            **kwargs,
        )

    @classmethod
    def default_type_uid(cls) -> uuid.UUID | None:
        """
        Return the default type uid for the class.

        The base implementation returns None.
        """
        return None

    @property
    def formatted_values(self):
        """
        The data with the right format for Geoscience ANALYST.

        The base implementation returns the values unchanged.
        """
        return self.values

    @property
    def n_values(self) -> int | None:
        """
        Number of expected data values based on :obj:`~geoh5py.data.data.Data.association`

        Returns None when the association is not handled or the parent does
        not expose the matching count attribute.
        """
        association = self.association
        parent = self.parent

        if association in (
            DataAssociationEnum.VERTEX,
            DataAssociationEnum.DEPTH,
        ) and hasattr(parent, "n_vertices"):
            return parent.n_vertices

        if association is DataAssociationEnum.CELL and hasattr(parent, "n_cells"):
            return parent.n_cells

        if association is DataAssociationEnum.FACE and hasattr(parent, "n_faces"):
            return parent.n_faces

        if association is DataAssociationEnum.OBJECT:
            return 1

        return None

    @property
    def nan_value(self) -> None:
        """
        Value used to represent missing data in python.

        The base implementation returns None.
        """
        return None

    @property
    def association(self) -> DataAssociationEnum:
        """
        Relationship made between the
        :func:`~geoh5py.data.data.Data.values` and elements of the
        :obj:`~geoh5py.shared.entity.Entity.parent` object.
        """
        return self._association

    @property
    def entity_type(self):
        """
        Type of data.
        """
        return self._entity_type

    @entity_type.setter
    def entity_type(self, data_type: DataType | ReferenceDataType):
        self._entity_type = data_type

        # Propagate the change to the workspace only for entities on file.
        if self.on_file:
            self.workspace.update_attribute(self, "entity_type")

    @property
    def modifiable(self) -> bool:
        """
        Entity can be modified within ANALYST.
        """
        return self._modifiable

    @modifiable.setter
    def modifiable(self, value: bool):
        self._modifiable = value

        if self.on_file:
            self.workspace.update_attribute(self, "attributes")

    @classmethod
    @abstractmethod
    def primitive_type(cls) -> PrimitiveTypeEnum:
        """Abstract method to return the primitive type of the class."""

    def mask_by_extent(
        self, extent: np.ndarray, inverse: bool = False
    ) -> np.ndarray | None:
        """
        Sub-class extension of :func:`~geoh5py.shared.entity.Entity.mask_by_extent`.

        Uses the parent object's vertices or centroids coordinates.

        :param extent: Array or coordinate defining the lower and upper bounds of the extent.
        :param inverse: Keep the inverse (clip) of the extent selection.

        :return: Mask over the vertices or cells of the parent, or None when
            the association or the parent does not support masking.
        """
        parent = self.parent

        if self.association is DataAssociationEnum.VERTEX and hasattr(
            parent, "vertices"
        ):
            return mask_by_extent(parent.vertices, extent, inverse=inverse)

        if self.association is DataAssociationEnum.CELL:
            if hasattr(parent, "vertices") and hasattr(parent, "_cells"):
                indices = mask_by_extent(parent.vertices, extent, inverse=inverse)

                if indices is not None:
                    # A cell is kept only if all of its vertices are kept.
                    indices = np.all(indices[parent.cells], axis=1)

                return indices

            # NOTE(review): the centroid fallback is assumed to apply to
            # CELL association only - confirm against the upstream layout.
            if hasattr(parent, "centroids"):
                return mask_by_extent(parent.centroids, extent, inverse=inverse)

        return None

    def validate_entity_type(self, entity_type: DataType | None) -> DataType:
        """
        Validate the entity type.

        The type must be a DataType whose primitive type matches the one
        declared by the class. A type still named "Entity" is renamed after
        the data.

        :param entity_type: Entity type to validate.

        :raises TypeError: If the input is not a DataType of the expected
            primitive type.

        :return: The validated entity type.
        """
        expected = self.primitive_type()

        if (
            not isinstance(entity_type, DataType)
            or entity_type.primitive_type != expected
        ):
            # Report the primitive type actually expected by the sub-class
            # rather than a hard-coded one.
            raise TypeError(
                "Input 'entity_type' must be a DataType object of "
                f"primitive_type '{expected.name}'."
            )

        if entity_type.name == "Entity":
            entity_type.name = self.name

        return entity_type

    @staticmethod
    def validate_association(value: str | DataAssociationEnum) -> DataAssociationEnum:
        """
        Validate the association and convert it to a DataAssociationEnum.

        :param value: Association given as an enum member or as its
            case-insensitive name.

        :raises ValueError: If a string does not name a member of the enum.
        :raises TypeError: If the value is neither a string nor an enum member.

        :return: The matching DataAssociationEnum member.
        """
        if isinstance(value, str):
            key = value.upper()

            if key not in DataAssociationEnum.__members__:
                raise ValueError(
                    f"Association flag should be one of {DataAssociationEnum.__members__}"
                )

            value = DataAssociationEnum[key]

        if not isinstance(value, DataAssociationEnum):
            raise TypeError(f"Association must be of type {DataAssociationEnum}")

        return value

    @abstractmethod
    def validate_values(self, values: Any | None) -> Any:
        """
        Validate the values.

        To be deprecated along with the standalone Drillhole class in future version.

        :param values: Values to validate.
        """

    @property
    def values(self):
        """
        Data values

        Fetched from the workspace and validated on access while no values
        are held in memory.
        """
        if getattr(self, "_values", None) is None:
            values = self.workspace.fetch_values(self)
            self._values = self.validate_values(values)

        return self._values

    @values.setter
    def values(self, values: np.ndarray | None):
        self._values = self.validate_values(values)

        if self.on_file:
            self.workspace.update_attribute(self, "values")

    @property
    def visible(self) -> bool:
        """
        Whether the data is visible in camera (checked in ANALYST object tree).
        """
        return self._visible

    @visible.setter
    def visible(self, value: bool):
        self._visible = value

        # NOTE(review): siblings are only updated for entities on file -
        # confirm this nesting against the upstream layout.
        if self.on_file:
            self.workspace.update_attribute(self, "attributes")

            if value:
                # Only a single data can be visible at a time: hide the
                # siblings, but skip this entity so that it is not reset to
                # invisible by its own setter.
                for child in self.parent.children:
                    if child is self:
                        continue
                    child.visible = False

    def __call__(self):
        """
        Shorthand returning the data :obj:`~geoh5py.data.data.Data.values`.
        """
        return self.values