Source code for tecplot.data.array

from builtins import range, super

import ctypes
import logging
import textwrap

from ctypes import (
    addressof,
    byref,
    cast,
    c_double,
    c_float,
    c_int8,
    c_int16,
    c_int32,
    c_int64,
    c_void_p,
    POINTER,
)

from ..tecutil import _tecutil, _tecutil_connector
from ..constant import *
from ..exception import *
from .. import session, tecutil
from . import operate

log = logging.getLogger(__name__)



[docs]
class Array(c_void_p):
    """Low-level accessor for underlying data within a `Dataset <tecplot.data.Dataset>`.

    This object exposes a list-like interface to the underlying data array.
    Using it, values can be directly queried and modified. After any
    modification to the data, the Tecplot Engine will have to be notified of
    the change. This notification will happen automatically in most cases, but
    can be turned off using the `suspend context <tecplot.session.suspend>` for
    a significant performance increase on large data sets.

    Accessing values within an `Array` is done through the standard ``[]``
    syntax::

        >>> print(array[3])
        3.1415

    The numbers passed are interpreted just like Python's built-in
    :py:class:`slice` object::

        >>> # print the values at indices: 5, 7, 9
        >>> print(array[5:10:2])
        [1.0, 1.0, 1.0]

    Elements within an array can be manipulated in-place with the assignment
    operator::

        >>> array[3] = 5.0
        >>> print(array[3])
        5.0

    Element-by-element access is *not* guaranteed to be performant and users
    should avoid writing loops over indices in Python. Instead, whole arrays
    should be used. This will effectively push the loop down to the underlying
    native library and will be much faster in virtually all cases.

    Consider this array of 10k elements::

        >>> ds = frame.create_dataset('Dataset', ['x'])
        >>> zn = ds.add_ordered_zone('Zone', 10000)
        >>> array = zn.values('x')

    The following loop, which takes the sine of all values in the array will
    require several Python function calls per element which is a tremendous
    overhead::

        >>> import math
        >>> for i in range(len(ar)):
        ...     ar[i] = math.sin(ar[i])

    An immediate improvement on this can be made by looping over the elements
    in Python only when reading the values, but assigning them using the
    whole array. This will be several times faster for even modest arrays::

        >>> ar[:] = [math.sin(x) for x in ar]

    But there is still a large performance penalty for looping over elements
    directly in Python and PyTecplot supports two solutions for large arrays:
    `tecplot.data.operate.execute_equation` and `Array.as_numpy_array()`.
    Please refer to these for details. Continuing with the example above, we
    could accomplish the same thing with either of the following using
    `execute_equation()` (assuming the array is identified by the first zone,
    first variable)::

        >>> from tecplot.data.operate import execute_equation
        >>> execute_equation('V1 = SIN(V1)', zones=[dataset.zone(0)])

    or by using the `numpy` library::

        >>> import numpy as np
        >>> ar[:] = np.sin(ar[:])

    In both of these cases, the calculation of the sine and loop over elements
    is pushed to the low level library and is much faster. Note that only the
    `execute_equation()` solution does the calculation within Tecplot and does
    not require the data to copied out to Python so it will typically be the
    fastest option.

    .. note::

        When modifying data using this class, it may be necessary to update the
        range of any associated contouring with a call to
        `ContourLevels.reset()` or similar. This will ensure that the total
        range of the new values is presented in the plot.
    """

    def __init__(self, zone, variable):
        self.zone = zone
        self.variable = variable
        super().__init__(self._native_reference())

    @property
    def _cache(self):
        if _tecutil_connector.suspended:
            _tecutil_connector._delete_caches.append(self._delete_cache)
            return True
        else:
            return False

    def _delete_cache(self):
        attrs = """
            _rnr _wnr _rrp _wrp
            _location
            _len
            _data_type
        """.split()
        for attr in attrs:
            try:
                delattr(self, attr)
            except AttributeError:
                pass

    def _native_reference(self, writable=False):
        args = (
            self.zone.dataset.uid,
            self.zone.index + 1,
            self.variable.index + 1,
        )
        if writable:
            if self._cache:
                if not hasattr(self, '_wnr'):
                    with tecutil.lock():
                        self._wnr = _tecutil.DataValueGetWritableNativeRefByUniqueID(
                            *args
                        )
                return self._wnr
            else:
                with tecutil.lock():
                    return _tecutil.DataValueGetWritableNativeRefByUniqueID(*args)
        else:
            if self._cache:
                if not hasattr(self, '_rnr'):
                    with tecutil.lock():
                        self._rnr = _tecutil.DataValueGetReadableNativeRefByUniqueID(
                            *args
                        )
                return self._rnr
            else:
                with tecutil.lock():
                    return _tecutil.DataValueGetReadableNativeRefByUniqueID(*args)

    @tecutil.lock()
    def _raw_pointer(self, writable=False):
        if _tecutil_connector.connected:
            msg = 'raw pointer access only available in batch-mode'
            raise TecplotLogicError(msg)
        elif writable:
            ref = self._native_reference(writable=True)
            _tecutil.handle.tecUtilDataValueGetWritableRawPtrByRef.restype = POINTER(
                self.c_type
            )
            wrp = _tecutil.DataValueGetWritableRawPtrByRef(ref)
            if self._cache:
                if not hasattr(self, '_wrp'):
                    self._wrp = wrp
                return self._wrp
            else:
                return wrp
        else:
            _tecutil.handle.tecUtilDataValueGetReadableRawPtrByRef.restype = POINTER(
                self.c_type
            )
            rrp = _tecutil.DataValueGetReadableRawPtrByRef(self)
            if self._cache:
                if not hasattr(self, '_rrp'):
                    self._rrp = rrp
                return self._rrp
            else:
                return rrp

    def __eq__(self, other):
        self_addr = addressof(cast(self, POINTER(c_int64)).contents)
        other_addr = addressof(cast(other, POINTER(c_int64)).contents)
        return self_addr == other_addr

    def __ne__(self, other):
        return not (self == other)

    def __len__(self):
        """The number of values in this array.

        :rtype: `integer <int>`

        Example showing size of ordered data::

            >>> x = dataset.zone('Zone').values('X')
            >>> print(x.shape)
            (10, 10, 10)
            >>> print(len(x))
            1000
        """
        if self._cache:
            if not hasattr(self, '_len'):
                self._len = _tecutil.DataValueGetCountByRef(self)
            return self._len
        else:
            return _tecutil.DataValueGetCountByRef(self)

    def _value_location(self):
        with self.zone.dataset.frame.activated():
            return _tecutil.DataValueGetLocation(
                self.zone.index + 1, self.variable.index + 1
            )

    @property
    def location(self):
        """`ValueLocation`: Data points location with respect to the elements.

        Possible values are `ValueLocation.CellCentered` and
        `ValueLocation.Nodal`. Example usage::

            >>> print(dataset.zone(0).values('X').location)
            ValueLocation.Nodal
        """
        if self._cache:
            if not hasattr(self, '_location'):
                self._location = self._value_location()
            return self._location
        else:
            return self._value_location()

    @property
    def shape(self):
        """`tuple` of `floats <float>`: ``(i, j, k)`` shape for this array.

        This is defined by the parent zone and can be used to reshape arrays.
        The following example assumes 32-bit floating point array and copies
        the Tecplot-owned ``data`` into the `numpy`-owned ``array``::

            >>> import numpy as np
            >>> data = dataset.zone('Zone').values('X')
            >>> array = np.empty(data.shape, dtype=np.float32)
            >>> arr_ptr = array.ctypes.data_as(POINTER(data.c_type))
            >>> memmove(arr_ptr, data.copy(), sizeof(data.c_type) * len(data))

        The data array presented is normally one-dimensional. For ordered data,
        you may wish to reshape the array indexing according to the
        dimensionality given by the ``shape`` attribute:

        .. code-block:: python
            :emphasize-lines: 30

            import numpy as np
            import tecplot as tp

            frame = tp.active_frame()
            dataset = frame.create_dataset('Dataset', ['X'])
            zone = dataset.add_ordered_zone('Zone', shape=(3,3,3))

            '''
            the following will print:
            [ 0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.
              0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.  0.]
            '''
            x = np.array(zone.values('X')[:])
            print(x)

            '''
            the following will print:
            [[[ 0.  0.  0.]
              [ 0.  0.  0.]
              [ 0.  0.  0.]]

             [[ 0.  0.  0.]
              [ 0.  0.  0.]
              [ 0.  0.  0.]]

             [[ 0.  0.  0.]
              [ 0.  0.  0.]
              [ 0.  0.  0.]]]
            '''
            x.shape = zone.values('X').shape
            print(x)

        """
        if self.zone.zone_type is ZoneType.Ordered:
            array_shape = tuple(i for i in self.zone._shape if i > 1)
        else:
            array_shape = (self.zone.num_points,)
        if self.location is ValueLocation.CellCentered:
            array_shape = tuple(i - 1 for i in array_shape if i > 2)
        if not array_shape:
            array_shape = (1,)
        return array_shape

    @property
    def c_type(self):
        """`ctypes` compatible data type of this array.

        This is the `ctypes` equivalent of `Array.data_type` and will return
        one of the following:

            * `ctypes.c_float`
            * `ctypes.c_double`
            * `ctypes.c_int`
            * `ctypes.c_int16`
            * `ctypes.c_int8`

        and can be used to create a `ctypes` array to store a copy of the
        data:

        .. code-block:: python

            import tecplot as tp
            frame = tp.active_frame()
            dataset = frame.create_dataset('Dataset', ['x'])
            dataset.add_ordered_zone('Zone', (3,3,3))
            x = dataset.zone('Zone').values('x')
            # allocate array using Python's ctypes
            x_array = (x.c_type * len(x))()
            # copy values from Dataset into ctypes array
            x_array[:] = x[:]
        """
        _ctypes = {
            FieldDataType.Float: ctypes.c_float,
            FieldDataType.Double: ctypes.c_double,
            FieldDataType.Int32: ctypes.c_int32,
            FieldDataType.Int16: ctypes.c_int16,
            FieldDataType.Byte: ctypes.c_int8,
        }
        return _ctypes[self.data_type]

    @property
    def data_type(self):
        """`FieldDataType`: Indicating the underlying value type of this array.

        Example usage::

            >>> print(dataset.zone('Zone').values('X').data_type)
            FieldDataType.Float
        """
        return _tecutil.DataValueGetRefType(self)

    @tecutil.lock()
    def as_ctypes_array(self, offset=0, size=None, copy=True):
        """Present the underlying data array as a `ctypes.Array`.

        If the **copy** parameter is `False`, this method will attempt to return
        an array pointing to the actual data stored in the Tecplot Engine. This
        will fail in connected mode or if the loader does not support
        immediate loading of the entire array into memory. Care should be taken
        to ensure the validity of the pointers to the data.

        Parameters:
            offset (`int`, optional): Zero-based offset into the array. This
                will be the starting point of the resulting data. (default: 0)
            size (`int`, optional): Number of elements in the resulting array.
                The default (a value of `None`) is to go to the end of the
                data.
            copy (`bool`, optional): Copy the data out from the Tecplot Engine.
                If `False`, an attempt is made to point to the underlying raw
                data and an exception is thrown on error. (default: `True`)

        Returns:
            `ctypes.Array`

        Example usage::

            >>> x = dataset.zone('Zone').values('X').as_ctypes_array()
        """
        size = (len(self) - offset) if size is None else size
        CArray = self.c_type * size
        if copy:
            arr = CArray()
            _tecutil.DataValueArrayGetByRef(self, offset + 1, size, arr)
            return arr
        else:
            ptr = self._raw_pointer(True)
            if offset:
                vptr = ctypes.cast(ctypes.pointer(ptr), ctypes.POINTER(ctypes.c_void_p))
                vptr.contents.value += ctypes.sizeof(ptr._type_) * offset
            ptr_addr = ctypes.addressof(ptr.contents)
            arr = CArray.from_address(ptr_addr)
            return arr


[docs]
    def as_numpy_array(self, offset=0, size=None, copy=True):
        """Present the underlying data array as a `numpy.ndarray`.

        If the **copy** parameter is `False`, this method will attempt to return
        an array pointing to the actual data stored in the Tecplot Engine. This
        will fail in connected mode or if the loader does not support
        immediate loading of the entire array into memory. Care should be taken
        to ensure the validity of the pointers to the data.

        Parameters:
            offset (`int`, optional): Zero-based offset into the array. This
                will be the starting point of the resulting data. (default: 0)
            size (`int`, optional): Number of elements in the resulting array.
                The default (a value of `None`) is to go to the end of the
                data.
            copy (`bool`, optional): Copy the data out from the Tecplot Engine.
                If `False`, an attempt is made to point to the underlying raw
                data and an exception is thrown on error. (default: `True`)

        Returns:
            `numpy.ndarray`

        Example usage::

            >>> x = dataset.zone('Zone').values('X').as_numpy_array()
        """
        import numpy as np

        carr = self.as_ctypes_array(offset, size, copy)
        return np.ctypeslib.as_array(carr)



[docs]
    @tecutil.lock()
    def copy(self, offset=0, size=None):
        """Copy the whole or part of the array into a ctypes array.

        Parameters:
            offset (`int`, optional): Zero-based offset for starting
                index to copy. (default: 0)
            size (`int`, optional): Number of values to copy into the
                resulting array. A value of `None` will copy to the end of the
                array. (default: `None`)

        Here we will copy out chunks of the data, do some operation and set the
        values back into the dataset:

        .. code-block:: python

            import tecplot as tp

            tp.new_layout()
            frame = tp.active_frame()
            dataset = frame.create_dataset('Dataset', ['x'])
            dataset.add_ordered_zone('Zone', (2, 2, 2))
            x = dataset.zone('Zone').values('x')

            # loop over array copying out 4 values at a time
            for i, offset in enumerate(range(0, len(x), 4)):
                x_array = x.copy(offset, 4)
                x_array[:] = [i] * 4
                x[offset:offset + 4] = x_array

            # will print: [0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0]
            print(x[:])
        """
        try:
            return self.as_numpy_array(offset, size, copy=True)
        except ImportError:
            msg = textwrap.dedent(
                """\
                Falling back to using basic Python for data operations.
                If installed, PyTecplot will make use of Numpy where
                appropriate for significant performance gains.
            """
            )
            log.warning(msg)
            return self.as_ctypes_array(offset, size, copy=True)


    def _slice_range(self, s):
        start = s.start or 0
        if start < 0:
            start += len(self)
        stop = s.stop or len(self)
        if stop < 0:
            stop += len(self)
        step = s.step or 1
        return range(start, stop, step)

    def __getitem__(self, i):
        if not isinstance(i, slice):
            return _tecutil.DataValueGetByRef(self, i + 1)
        else:
            s = self._slice_range(i)
            if s.step > 1:
                # i is a non-contiguous slice
                return [_tecutil.DataValueGetByRef(self, ii + 1) for ii in s]
            else:
                # i is a contiguous slice
                return self.copy(s.start, s.stop - s.start)

    @tecutil.lock()
    def __setitem__(self, i, val):
        """
        Developers note:
            This method avoids using raw pointers which may not be available
            for different reasons -- backing data does not support it, limited
            memory resources or we are in connected mode for example.
        """
        if not isinstance(i, slice):
            # i is an index
            ref = self._native_reference(True)
            _tecutil.DataValueSetByRef(ref, i + 1, val)
            session.data_altered(self.zone, self.variable, i)
        elif isinstance(val, Array) and val == self:
            # self assignment no-op
            return
        else:
            if callable(getattr(val, 'ravel', None)):
                val = val.ravel()
            s = self._slice_range(i)
            if len(s) != len(val):
                msg = 'Array length mismatch {} != {}'
                raise TecplotIndexError(msg.format(len(s), len(val)))
            if s.step > 1:
                # i is a non-contiguous slice
                # the following works, but is slow!
                for a, b in enumerate(s):
                    self[b] = val[a]
            else:
                # i is a contiguous slice
                offset = s.start
                size = s.stop - s.start

                if isinstance(val, Array):
                    if (
                        offset == 0
                        and size in (None, len(self))
                        and val.zone.dataset == self.zone.dataset
                    ):
                        # copy whole array
                        if val.zone == self.zone:
                            eqn = 'V{0} = V{1}'.format(
                                self.variable.index + 1, val.variable.index + 1
                            )
                            operate.execute_equation(eqn, self.zone)
                        else:
                            src_zone_idx = self.zone.index
                            tgt_zone_idx = val.zone.index
                            var_idx = val.variable.index
                            if not _tecutil.DataValueCopy(
                                src_zone_idx + 1, tgt_zone_idx + 1, var_idx + 1
                            ):
                                raise TecplotSystemError()
                        return
                    else:
                        # either sub array or different datasets
                        val = val.as_ctypes_array(copy=True)

                ctype = self.c_type
                if isinstance(val, ctypes.Array) and val._type_ == ctype:
                    arr = val
                else:
                    # coerce val to a ctypes array, using numpy if available
                    try:
                        import numpy as np

                        nparr = np.asarray(val, dtype=ctype)
                        ptarr = nparr.ctypes.data_as(POINTER(ctype))
                        ptaddr = addressof(ptarr.contents)
                        arr = (ctype * size).from_address(ptaddr)
                    except ImportError:
                        msg = textwrap.dedent(
                            """\
                            Falling back to using basic Python for data
                            operations. If installed, PyTecplot will make use
                            of Numpy where appropriate for significant
                            performance gains.
                        """
                        )
                        log.warning(msg)
                        arr = (ctype * size)(*val)

                ref = self._native_reference(True)
                _tecutil.DataValueArraySetByRef(ref, offset + 1, size, arr)
                session.data_altered(self.zone, self.variable)

    def __iter__(self):
        self.current_index = -1
        self.current_length = len(self)
        return self

    def __next__(self):
        self.current_index += 1
        if self.current_index < self.current_length:
            return self.__getitem__(self.current_index)
        else:
            del self.current_index
            del self.current_length
            raise StopIteration


[docs]
    def minmax(self):
        """Limits of the values stored in this array.

        :rtype: `tuple` of `floats <float>`

        This always returns `floats <float>` regardless of the underlying data
        type::

            >>> print(dataset.zone('Zone').values('x').minmax())
            (0, 10)
        """
        return _tecutil.DataValueGetMinMaxByRef(self)



[docs]
    def min(self):
        """Lower bound of the values stored in this array.

        :rtype: `float`

        This always returns a `float` regardless of the underlying data type::

            >>> print(dataset.zone('Zone').values('x').min())
            0
        """
        return self.minmax()[0]



[docs]
    def max(self):
        """Upper bound of the values stored in this array.

        :rtype: `float`

        This always returns a `float` regardless of the underlying data type::

            >>> print(dataset.zone('Zone').values('x').max())
            10
        """
        return self.minmax()[1]


    @property
    def shared_zones(self):
        """`list` of `Zones <data_access>`: All zones sharing this array.

        Example usage::

            >>> dataset.zone('My Zone').copy(share_variables=True)
            >>> for z in dataset.zone('My Zone').values(0).shared_zones:
            ...     print(z.index)
            0
            1
        """
        with self.zone.dataset.frame.activated():
            indices = _tecutil.DataValueGetShareZoneSet(
                self.zone.index + 1, self.variable.index + 1
            )
            try:
                ret = [self.zone.dataset.zone(i) for i in indices]
            finally:
                indices.dealloc()
        return ret

    @property
    def passive(self):
        """`bool`: An unallocated zone-variable combination.

        Passive variables are placeholders where no data is defined for a zone
        variable combination. Passive variables will always return zero when
        queried:

        .. code-block:: python

            import tecplot as tp

            ds = tp.active_page().add_frame().create_dataset('D', ['x','y'])
            z = ds.add_ordered_zone('Z1', (3,))
            assert not z.values(0).passive
        """
        with self.zone.dataset.frame.activated():
            return _tecutil.DataValueIsPassive(
                self.zone.index + 1, self.variable.index + 1
            )