Source code for PVGeo.readers.binaries

__all__ = [
    'PackedBinariesReader',
    'MadagascarReader',
]

__displayname__ = 'Binary/Serialized File I/O'

import warnings

import numpy as np
import vtk

from .. import _helpers, interface
from ..base import ReaderBase



[docs]
class PackedBinariesReader(ReaderBase):
    """This reads in float or double data that is packed into a binary file
    format. It will treat the data as one long array and make a ``vtkTable``
    with one column of that data. The reader uses defaults to import as floats
    with native endianness. Use the Table to Uniform Grid or the Reshape Table
    filters to give more meaning to the data. We chose to use a ``vtkTable``
    object as the output of this reader because it gives us more flexibility in
    the filters we can apply to this data down the pipeline and keeps things
    simple when using filters in this repository.
    """

    __displayname__ = 'Packed Binaries Reader'
    __category__ = 'reader'
    extensions = 'H@ bin rsf rsf@ HH npz'
    description = 'PVGeo: Packed Binaries Reader'

    def __init__(self, **kwargs):
        ReaderBase.__init__(self, nOutputPorts=1, outputType='vtkTable', **kwargs)
        # Other Parameters
        self.__data_name = kwargs.get('dataname', 'Data')
        self.__dtypechar = kwargs.get('dtype', 'f')
        self.__endian = kwargs.get('endian', '')
        self.__dtype, self.__vtktype = interface.get_dtypes(
            dtype=self.__dtypechar, endian=self.__endian
        )
        # Data objects to hold the read data for access by the pipeline methods
        self.__data = []


[docs]
    def _read_raw_file(self, filename):
        """Internal helper to read the raw data from the file"""
        dtype = self.__dtype
        if dtype == np.dtype('>f'):
            # Checks if big-endian and fixes read
            dtype = np.dtype('f')
        try:
            arr = np.fromfile(filename, dtype=dtype)
        except (IOError, OSError) as fe:
            raise _helpers.PVGeoError(str(fe))
        return np.asarray(arr, dtype=self.__dtype)



[docs]
    def _get_file_contents(self, idx=None):
        """Internal helper to get all contents for all files"""
        if idx is not None:
            filenames = [self.get_file_names(idx=idx)]
        else:
            filenames = self.get_file_names()
        contents = []
        for f in filenames:
            contents.append(self._read_raw_file(f))
        if idx is not None:
            return contents[0]
        return contents



[docs]
    def _read_up_front(self):
        """Should not need to be overridden"""
        # Perform Read
        self.__data = self._get_file_contents()
        self.need_to_read(flag=False)
        return 1



[docs]
    def _get_raw_data(self, idx=0):
        """This will return the proper data for the given timestep"""
        return self.__data[idx]



[docs]
    def convert_array(self, arr):
        """Converts the numpy array to a vtkDataArray"""
        # Put raw data into vtk array
        data = interface.convert_array(
            arr, name=self.__data_name, deep=True, array_type=self.__vtktype
        )
        return data



[docs]
    def RequestData(self, request, inInfo, outInfo):
        """Used by pipeline to request data for current timestep"""
        # Get output:
        output = vtk.vtkTable.GetData(outInfo)
        if self.need_to_read():
            self._read_up_front()
        # Get requested time index
        i = _helpers.get_requested_time(self, outInfo)
        # Generate the data object
        arr = self._get_raw_data(idx=i)
        data = self.convert_array(arr)
        output.AddColumn(data)
        return 1


    #### Setters and Getters ####


[docs]
    def set_endian(self, endian):
        """Set the endianness of the data file.

        Args:
            endian (int or char): no preference = '' or 0, Little = 1 or `<` or Big = 2 `>`.
        """
        pos = ['', '<', '>']
        if isinstance(endian, int):
            endian = pos[endian]
        if endian != self.__endian:
            self.__endian = endian
            self.__dtype, self.__vtktype = interface.get_dtypes(
                dtype=self.__dtypechar, endian=self.__endian
            )
            self.Modified()



[docs]
    def get_endian(self):
        """Get the endianness of the data file."""
        return self.__endian



[docs]
    def set_data_type(self, dtype):
        """Set the data type of the binary file: `double='d'`, `float='f'`, `int='i'`"""
        pos = ['d', 'f', 'i']
        if isinstance(dtype, int):
            dtype = pos[dtype]
        if dtype != self.__dtype:
            self.__dtypechar = dtype
            self.__dtype, self.__vtktype = interface.get_dtypes(
                dtype=self.__dtypechar, endian=self.__endian
            )
            self.Modified()



[docs]
    def get_data_types(self):
        """Get the data type of the binary file"""
        return self.__dtype, self.__vtktype



[docs]
    def set_data_name(self, data_name):
        """The string name of the data array generated from the input file."""
        if data_name != self.__data_name:
            self.__data_name = data_name
            self.Modified(read_again=False)  # Don't re-read. Just request data again



[docs]
    def get_data_name(self):
        """Get name used for the data array"""
        return self.__data_name





[docs]
class MadagascarReader(PackedBinariesReader):
    """This reads in float or double data that is packed into a Madagascar
    binary file format with a leader header. The reader ignores all of the ascii
    header details by searching for the sequence of three special characters:
    EOL EOL EOT and it will treat the following binary packed data as one long
    array and make a ``vtkTable`` with one column of that data. The reader uses
    defaults to import as floats with native endianness. Use the Table to
    Uniform Grid or the Reshape Table filters to give more meaning to the data.
    We will later implement the ability to create a gridded volume from the
    header info. This reader is a quick fix for Samir. We chose to use a
    ``vtkTable`` object as the output of this reader because it gives us more
    flexibility in the filters we can apply to this data down the pipeline and
    keeps thing simple when using filters in this repository.
    `Details Here`_.

    .. _Details Here: http://www.ahay.org/wiki/RSF_Comprehensive_Description#Single-stream_RSF
    """

    __displayname__ = 'Madagascar SSRSF Reader'
    __category__ = 'reader'
    # extensions are inherited from PackedBinariesReader
    description = 'PVGeo: Madagascar Single Stream RSF Files'

    def __init__(self, **kwargs):
        PackedBinariesReader.__init__(self, **kwargs)


[docs]
    def _read_raw_file(self, filename):
        """Reads the raw data from the file for Madagascar SSRSF files"""
        dtype, vtktype = self.get_data_types()
        CTLSEQ = b'\014\014\004'  # The control sequence to separate header from data
        rpl = b''
        raw = []
        with open(filename, 'rb') as file:
            raw = file.read()
            idx = raw.find(CTLSEQ)
            if idx == -1:
                warnings.warn(
                    'This is not a single stream RSF format file. Treating entire file as packed binary data.'
                )
            else:
                raw = raw[idx:]  # deletes the header
                raw = raw.replace(CTLSEQ, rpl)  # removes the control sequence
        arr = np.frombuffer(raw, dtype=dtype)
        return arr