Source code for crunchflow.output.spatial

"""Tools for loading, analyzing, and visualizing spatial profile output from CrunchFlow.

This module provides the `SpatialProfile` class and associated utility functions
to work with CrunchFlow spatial output files (commonly `.tec`, `.out`, or `.dat` files).
These files contain gridded data written at specified output times during a simulation,
and typically include variables such as mineral saturation, aqueous species concentrations,
porosity, and permeability across 1D, 2D, or 3D model domains.

Key Features
------------
- Automatically detects file format and loads output variables and metadata.
- Supports plotting 2D images or contour maps for any output variable.
- Enables comparison of results across time steps using `plot_series`.
- Extracts outlines of zones sharing a common attribute (e.g., permeability zone boundaries).
- Compatible with `.tec`, `.out`, and `.dat` formats written by CrunchFlow.
"""

import os
import re
import textwrap

import matplotlib.pyplot as plt
import numpy as np
from mpl_toolkits.axes_grid1 import make_axes_locatable

from crunchflow.input import InputFile



[docs]
def isnumeric_scientific(s):
    """Check if a string is numeric.

    Return True if a string is an integer, float or in scientific notation,
    and False otherwise.
    """
    try:
        float(s)
        return True
    except ValueError:
        return False




[docs]
def read_output_times(fname):
    """Given a CrunchFlow input file, return the spatial_profile output times.

    Parameters
    ----------
    fname : str
        Name of the input file to read

    Returns
    -------
    output_times : list
        Output times read from the input file
    """
    infile = InputFile.load(fname, warnings=False)

    sp_times_str = infile.output.spatial_profile

    if sp_times_str is None:
        return None
    else:
        # Split the string by whitespace and convert to float
        output_times = [float(t) for t in sp_times_str.split()]

        return output_times




[docs]
def get_tec_metadata(file, folder="."):
    """Return a list of the variables in a spatial_profile output file.

    Given a crunch .tec output file, read it in and return a list of the
    variables (e.g., 'X-Perm', 'Y-Perm', etc) included in the output file.

    Parameters
    ----------
    file : str
        Filename to read in
    folder : str
        Folder in which 'file' is located. The default is the current directory

    Returns
    -------
    columns : list, str
        ordered list of variables included in filename
    title : str
        Value included in this file, as output by CrunchFlow
    fmt : str
        Format of the file, either '.tec' or '.out'
    """
    # Instantiate empty list of columns
    columns = []

    # Open file and read line by line
    inpath = os.path.join(folder, file)
    with open(inpath) as f:
        lines = f.readlines()

        # Read the first line to determine the format of the file
        if "TITLE" in lines[0]:
            title = lines[0].split('"')[1]
            fmt = ".tec"
        elif "Time" in lines[0]:
            title = ""
            fmt = ".out"
        elif "Units" in lines[0]:
            title = ""
            fmt = ".dat"
        else:
            raise ValueError("Could not determine the format of this file")

        # Read the rest of the header
        if fmt == ".tec":
            columns = lines[1].split('"')

            # Remove x, y, z
            columns = [col.strip() for col in columns]
            for col in ["", "VARIABLES =", "X", "Y", "Z"]:
                if col in columns:
                    columns.remove(col)

            # Remove whitespace, which was reduced to len 0 via col.strip()
            remove_fields = [col for col in columns if len(col) == 0]

            for col in remove_fields:
                columns.remove(col)
        elif fmt == ".out":
            # pH files do not have a units line
            if "pH" in file:
                columns_line = lines[1]  # skip units line
            else:
                columns_line = lines[2]

            # Split on whitespace
            raw_cols = columns_line.split()

            # Some versions of CrunchFlow don't include column names
            # in this case, the column entries should be numeric and we'll
            # assign them names
            if isnumeric_scientific(raw_cols[0]):
                columns = ["col%d" % i for i in range(len(raw_cols))]
            else:
                columns = raw_cols

        elif fmt == ".dat":
            title = lines[1].split('"')[1]
            columns = lines[2].split('"')

            # Remove x, y, z
            columns = [col.strip() for col in columns]
            for col in ["VARIABLES ="]:
                if col in columns:
                    columns.remove(col)

            # Remove commas, which can be repeated so will not be removed with loop above
            columns = [col.replace(",", "") for col in columns]

            # Remove whitespace, which was reduced to len 0 via col.strip()
            remove_fields = [col for col in columns if len(col) == 0]
            for col in remove_fields:
                columns.remove(col)

            # With .dat files, the naming scheme for x, y and z varies
            # depending on the spatial units
            if len(lines[3].split(",")) == 3:
                # then this is 2d, so remove first two columns
                columns = columns[2:]
            elif len(lines[3].split(",")) == 4:
                # then this is 3d, so remove first three columns
                columns = columns[3:]
            else:
                raise ValueError("Could not determine the format of this file")

    return columns, title, fmt




[docs]
def get_out_output_time(file):
    """Get the output time from a CrunchFlow .out file.

    Given a CrunchFlow .out file, read it in and return the output time,
    which should be stored in the first line.

    Parameters
    ----------
    file : str
        Filename to read in

    Returns
    -------
    time : float
        output time of the file
    """
    with open(file) as f:
        line = f.readline()
        if "Time" not in line:
            raise ValueError(f"Could not find the output time of {file}")
        else:
            time = float(line.split()[-1])

    return time




[docs]
def get_tec_output_times(crunch_log, folder="."):
    """Given a CrunchFlow output log, get the spatial_profile output times.

    Search through a file containing all terminal output from a CrunchFlow
    run and return the spatial_profile output times. For example, during
    a simulation, CrunchFlow will print progress to the screen, including
    blocks that look like:

        >>> WRITING OUTPUT FILES
        >>> Time (days) =  9.000E+00
        >>> File number  =            2

    This function combs through that terminal output to create a list of
    times at which .tec files were written. Note that this function is
    no longer maintained and has been superseded by `read_output_times`.

    Parameters
    ----------
    crunch_log : str
        Filename of the crunchflow terminal output
    folder : str
        Folder in which 'crunch_log' is located.The default is the
        current directory

    Returns
    -------
    output_times : list of float
        Ordered list of the output times (in CrunchFlow time units)
        corresponding to each .tec file number.
    """
    output_times = {}

    filepath = os.path.join(folder, crunch_log)
    with open(filepath, "r") as f:
        lines = f.readlines()
        for i, line in enumerate(lines):
            if "WRITING OUTPUT FILES" in line:
                time = float(lines[i + 1].split()[3])
                fileno = int(lines[i + 2].split()[3])

                output_times[fileno] = time

    return output_times



class SpatialProfile:
    """The SpatialProfile class for working with spatial_profile (.tec, .out and .dat) files.

    Attributes
    ----------
    times : list of int
        relative times at which .tec files were output, sorted
    files : list of str
        ordered list of all files matching fileprefix
    columns : list of str
        list of all vars included within each .tec file
    nx : int
        # of grid cells in the x direction. Typically only defined for 2D and 3D output
    ny : int
        # of grid cells in the y direction. Typically only defined for 2D and 3D output
    nz : int
        # of grid cells in the z direction. Typically only defined for 2D and 3D output
    coords : ndarray of float
        (nx*ny*nz, 2) array of x, y coordinates of each node. Typically only defined
        for 2D and 3D output
    griddedX : ndarray of float
        (ny, nx) array of x coordinates; used for plotting. Typically only defined for
        2D and 3D output
    griddedY : ndarray of float
        (ny, nx) array of y coordinates; used for plotting. Typically only defined for
        2D and 3D output

    Methods
    -------
    __init__(fileprefix, folder, output_times, suffix)
        Read in and get basic info about all .tec files matching `fileprefix`.
        For example, `tec('volume')` will read in all files matching
        'volume[0-9]+.tec'
    extract(variable, time)
        Return the spatial profile of var at the given time.
    plot(variable, time)
        Plot .tec output from a single time step.
    plot_series(variable)
        Plot .tec output for a series of time steps.
    outline(variable, value, time)
        Get line segments that outline all the regions equal to
        the provided value.

    Parameters
    ----------
        fileprefix : str
            file prefix of the tec file to read in, without the timestep
            number or ".tec" file ending. For example, if your files are
            "volume1.tec", "volume2.tec", etc., then fileprefix should be
            "volume".
        folder : str, optional
            folder in which the .tec files are located. The default is the
            current directory
        output_times : list of float, optional
            list of the actual output times at which the .tec files were
            output, in CrunchFlow time units
        suffix : str, optional
            file ending of the tec files to read in. This can vary depending on the
            version of CrunchTope used. The default is '.tec', but '.out' is also
            tried if '.tec' files are not found.

    Examples
    --------
    >>> vol = SpatialProfile('volume')
    >>> print(vol.columns)
    >>> vol.plot('Calcite')
    >>> calcite = vol.extract('Calcite', time=2)
    """

    def __init__(self, fileprefix, folder=".", output_times=None, suffix=".tec", warnings=True):
        """Read in and get basic info about all .tec files matching `fileprefix`.
        For example, `SpatialProfile('volume')` will read in all files matching
        'volume[0-9]+.tec'

        Parameters
        ----------
        fileprefix : str
            file prefix of the tec file to read in, without the timestep
            number or ".tec" file ending. For example, if your files are
            "volume1.tec", "volume2.tec", etc., then fileprefix should be
            "volume".
        folder : str, optional
            folder in which the .tec files are located. The default is the
            current directory
        output_times : list of float, optional
            list of the actual output times at which the .tec files were
            output, in CrunchFlow time units
        suffix : str, optional
            file ending of the tec files to read in. This can vary depending on the
            version of CrunchTope used. The default is '.tec', but '.out' and '.dat'
            are also tried if '.tec' files are not found.
        warnings : bool, optional
            Whether to print warnings. Default is True.
        """
        # Glob doesn't support regex, so match manually using re and os
        search_str = "^" + fileprefix + "[0-9]+%s" % suffix
        unsort_files = [f for f in os.listdir(folder) if re.search(search_str, f)]

        # Try again with .out or .dat suffix
        if len(unsort_files) == 0:
            for try_suffix in [".out", ".dat"]:
                search_str = "^" + fileprefix + "[0-9]+" + try_suffix
                unsort_files = [f for f in os.listdir(folder) if re.search(search_str, f)]
                if len(unsort_files) > 0:
                    suffix = try_suffix
                    break

        if len(unsort_files) == 0:
            raise ValueError(
                "No files found matching %s. Double check the suffix and\n "
                "double check that the filename ends in a digit" % search_str
            )

        # Get the columns (variables) available in each .tec file
        self.columns, self.title, self.fmt = get_tec_metadata(unsort_files[0], folder=folder)

        # Get the output time in sequence for each file
        st = len(fileprefix)
        self.times = [int(f[st:-4]) for f in unsort_files]
        self.times.sort()

        # Create sorted list of files using the times (which are sorted numerically)
        # This solves the problem that sorted str print as ['vol1', 'vol10', 'vol2', etc.]
        self.files = [fileprefix + str(t) + suffix for t in self.times]
        self.files = [os.path.join(folder, f) for f in self.files]

        # Set output times if provided
        if output_times is not None:
            self.output_times = output_times
        else:
            # Otherwise, try setting it by reading from each .out file
            if self.fmt == ".out":
                self.output_times = [get_out_output_time(f) for f in self.files]
            elif self.fmt in [".tec", ".dat"]:
                # For .tec and .dat files, try reading it from an input file in the same folder
                inputfiles = [f for f in os.listdir(folder) if f.endswith(".in")]
                if len(inputfiles) > 1 and warnings:
                    msg = f"""\
                           Found multiple input files ({inputfiles}) and could not
                           determine which file to use to read output_times.
                           Disable this warning with `SpatialProfile(..., warnings=False)`"""
                    print(textwrap.dedent(msg))
                elif len(inputfiles) == 1:
                    infilepath = os.path.join(folder, inputfiles[0])
                    self.output_times = read_output_times(infilepath)
                    if warnings:
                        msg = f"""\
                               Reading output_times from ({infilepath}).
                               Disable this message with `SpatialProfile(..., warnings=False)`"""
                        print(textwrap.dedent(msg))
                else:
                    self.output_times = None

        # Get the grid size
        if self.fmt == ".tec":
            with open(self.files[0]) as f:
                for i, line in enumerate(f):
                    # Go to third line
                    if i == 2:
                        # Split on comma
                        fields = line.split(",")

                        # Workaround for CrunchFlow typo in AqRate.tec files
                        if "Aqueous Rate" not in self.title:
                            # Extract numeric digits from each field
                            # Regex \D removes non-numeric characters
                            self.nx = int(re.sub("\\D", "", fields[0]))
                            self.ny = int(re.sub("\\D", "", fields[1]))
                            self.nz = int(re.sub("\\D", "", fields[2]))

                        else:
                            self.nx = int(re.sub("\\D", "", fields[1]))
                            self.ny = int(re.sub("\\D", "", fields[2]))
                            self.nz = np.nan

            # Get gridded X and Y for plotting
            self.coords = np.loadtxt(self.files[0], skiprows=3, usecols=[0, 1])
            self.griddedX = self.coords[:, 0].reshape(self.ny, self.nx)
            self.griddedY = self.coords[:, 1].reshape(self.ny, self.nx)
        elif self.fmt == ".out":
            if self.columns[0] == "col0":
                skiprows = 2
            else:
                skiprows = 3
            self.coords = np.loadtxt(self.files[0], skiprows=skiprows, usecols=[0])
        elif self.fmt == ".dat":
            with open(self.files[0]) as f:
                lines = f.readlines()

                fields = lines[3].split(",")[1:]
                if len(fields) == 2:
                    self.nx = int(re.sub("\\D", "", fields[0]))
                    self.ny = int(re.sub("\\D", "", fields[1]))
                    self.nz = np.nan
                elif len(fields) == 3:
                    self.nx = int(re.sub("\\D", "", fields[0]))
                    self.ny = int(re.sub("\\D", "", fields[1]))
                    self.nz = int(re.sub("\\D", "", fields[2]))
                else:
                    raise ValueError("Could not determine the coordinates in this file")
            self.coords = np.loadtxt(self.files[0], skiprows=4, usecols=[0, 1])
            self.griddedX = self.coords[:, 0].reshape(self.ny, self.nx)
            self.griddedY = self.coords[:, 1].reshape(self.ny, self.nx)

    def extract(self, var, time=None, output_time=None):
        """Return the spatial profile of var at the given time.

        Parameters
        ----------
        var : str
            variable to return (e.g., 'Porosity')
        time : int
            time slice at which to return the profile. By default, returns
            the first time slice.
        output_time : float
            output time at which to return the profile. If provided, this
            will override the `time` parameter. If both `time` and
            `output_time` are provided, `time` will be ignored.

        Returns
        -------
        data : ndarray of float
            (ny, nx) numpy array of var
        """
        if var not in self.columns:
            raise ValueError("{} not found".format(var))

        if time is None and output_time is None:
            time = self.times[0]
        elif output_time is not None:
            # If output_time is provided, find the corresponding time
            if self.output_times is None:
                raise ValueError("Please define the output_times for this SpatialProfile")
            if output_time not in self.output_times:
                raise ValueError("output_time {} not found in output_times {}".format(output_time, self.output_times))
            itime = self.output_times.index(output_time)
            time = self.times[itime]

        if time not in self.times:
            raise ValueError("Requested time ({}) not in {}".format(time, self.times))

        # Get index of file to load, since self.times may not start at 0
        itime = self.times.index(time)

        # Get column number of var to retrieve
        if self.fmt == ".tec":
            col_no = self.columns.index(var) + 3  # Add 3 because we deleted X, Y and Z cols
            data = self._load_check_exponent(itime, skiprows=3, usecol=col_no)

            # Reshape to (ny, nx)
            data = data.reshape(self.ny, self.nx)
        elif self.fmt == ".out":
            # Check if this file has 3 header rows or two
            with open(self.files[itime]) as f:
                # Skip to third line
                for i in range(3):
                    line = f.readline()
                if isnumeric_scientific(line.split()[0]):
                    skiprows = 2
                else:
                    skiprows = 3
            col_no = self.columns.index(var)
            data = self._load_check_exponent(itime, skiprows=skiprows, usecol=col_no)
        elif self.fmt == ".dat":
            if np.isnan(self.nz):
                col_no = self.columns.index(var) + 2
                data = self._load_check_exponent(itime, skiprows=4, usecol=col_no)
                data = data.reshape(self.ny, self.nx)
            else:
                col_no = self.columns.index(var) + 3
                data = self._load_check_exponent(itime, skiprows=4, usecol=col_no)
                data = data.reshape(self.nz, self.ny, self.nx)

        else:
            raise ValueError("Could not determine the format of this file")

        return np.squeeze(data)

    def plot(self, var, time=None, output_time=None, plot_type="image", figsize=(12, 3), **kwargs):
        """Plot .tec output from a single time step.

        Parameters
        ----------
        var : str
            variable to plot (e.g., 'H+')
        time : int
            which time slice to show. Refers to the file number, not the
            output time. By default, plots the first time slice.
        output_time : float
            which output time to show. If provided, this will override the
            `time` parameter. If both `time` and `output_time` are provided,
            `time` will be ignored.
        figsize : tuple of int
            figure size; default (12, 3)
        plot_type : str
            whether to display an image ('image') or a color-filled
            contour plot ('contourf')
        **kwargs : dict
            args passed on to matplotlib plot function (either contourf
            or imshow)

        Returns
        -------
        fig : pyplot object
            matplotlib fig handle for the plot
        ax : pyplot object
            matplotlib ax handle for the plot
        """
        # If time is not given, plot the first time slice
        if time is None and output_time is None:
            time = self.times[0]
        elif output_time is not None:
            # If output_time is provided, find the corresponding time
            if self.output_times is None:
                raise ValueError("Please define the output_times for this SpatialProfile")
            if output_time not in self.output_times:
                raise ValueError("output_time {} not found in output_times {}".format(output_time, self.output_times))
            itime = self.output_times.index(output_time)
            time = self.times[itime]

        if plot_type not in ["image", "contour"]:
            raise ValueError("plot_type must be either 'image' or 'contour'")

        # Get column number of var to plot
        col_no = self.columns.index(var) + 3  # Add 3 after deleting X, Y and Z
        itime = self.times.index(time)  # Index of time, if self.times[0] != 0

        # Read in gridded data to numpy array
        z = np.loadtxt(self.files[itime], skiprows=3, usecols=col_no)
        z = z.reshape(self.ny, self.nx)
        z[np.isinf(z)] = np.nan  # Mark inf values as nan

        fig, ax = plt.subplots(figsize=figsize)

        # Plot data as color-filled contour
        if plot_type == "contour":
            # Define colorbar steps
            steps = np.linspace(np.nanmin(z), np.nanmax(z), 12)

            # Ensure that colorbar steps are strictly increasing
            if np.nanmin(z) == np.nanmax(z):
                if np.nanmin(z) == 0:
                    steps = np.arange(12)
                else:
                    factors = np.arange(12) / 100 + 1
                    steps = steps * factors

            cs = ax.contourf(self.griddedX, self.griddedY, z, steps, **kwargs)

        # Plot data as image
        elif plot_type == "image":
            extent = [self.griddedX[0, 0], self.griddedX[-1, -1], self.griddedY[0, 0], self.griddedY[-1, -1]]
            cs = ax.imshow(z, origin="lower", extent=extent, **kwargs)

        ax.set(aspect="equal")

        # Add colorbar
        divider = make_axes_locatable(ax)
        cax = divider.append_axes("right", size="2%", pad=0.2)
        plt.colorbar(cs, cax=cax)

        # Build title
        title = self.title

        # Add the output time if it was provided
        if self.output_times is not None:
            itime = self.times.index(time)
            title += " @ t=" + str(self.output_times[itime])

        ax.set(title=title + " -- " + var)

        return fig, ax

    def plot_series(self, var, times=None, output_times=None, plot_type="image", figsize=None, **kwargs):
        """Plot .tec output for a series of time steps.

        Parameters
        ----------
        var : str
            variable to plot (e.g., 'H+')
        times : list
            time steps to plot, must be either components of self.times or
            self.output_times; defaults to all time steps
        plot_type : str
            whether to display an image ('image') or a contour-filled contour
            plot ('contourf')
        output_times : list of float, optional
            list of the actual output times at which the .tec files were
            output, in CrunchFlow time units. If provided, this will override
            the `times` parameter. If both `times` and `output_times` are
            provided, `times` will be ignored.
        figsize : tuple of int
            figure size; default (12, 1.5 * # of timesteps)
        **kwargs : dict
            args passed on to matplotlib's imshow

        Returns
        -------
        fig : pyplot object
            matplotlib fig handle for the plot
        axes : list of pyplot objects
            list of matplotlib axes handles for each subplot
        """
        # Check input
        if plot_type not in ["image", "contour"]:
            raise ValueError("plot_type must be either 'image' or 'contour'")

        if times is None and output_times is None:
            times = self.times
        elif output_times is not None:
            # If output_times is provided, find the corresponding times
            if self.output_times is None:
                raise ValueError("output_times not provided for this SpatialProfile")
            if not isinstance(output_times, list):
                output_times = [output_times]
            times = [self.times[self.output_times.index(t)] for t in output_times]

        # Set up figsize if not provided
        if figsize is None:
            figsize = (12, 1.8 * len(times))

        # Interpret whether times are in output_times or self.times
        in_self_times = True
        for time in times:
            # Assume first that they are in self.times
            if time not in self.times:
                in_self_times = False
                if self.output_times is None:
                    raise ValueError("Could not find {} in self.times".format(time))
                else:
                    if time not in self.output_times:
                        raise ValueError("Could not find {} in self.output_times".format(time))

        # If times were given as components of self.output_times, convert
        # to self.times equivalent
        if not in_self_times:
            times = [self.times[self.output_times.index(t)] for t in times]

        # Get column number of var to plot
        col_no = self.columns.index(var) + 3

        # Set up minimum/maximum values observed across all time slices
        # Used for min/max of color range
        minz = np.Inf
        maxz = np.NINF

        # z is a dict of numpy arrays
        z = {}
        for time in times:
            # Get index of time within self.times
            itime = self.times.index(time)
            z[time] = np.loadtxt(self.files[itime], skiprows=3, usecols=col_no)
            z[time] = z[time].reshape(self.ny, self.nx)
            z[time][np.isinf(z[time])] = np.nan  # Mark inf values as nan

            # Update min/max for color range
            if np.nanmin(z[time]) < minz:
                minz = np.nanmin(z[time])
            if np.nanmax(z[time]) > maxz:
                maxz = np.nanmax(z[time])

        # If it's a contour plot, set up the color intervals/steps
        if plot_type == "contour":
            # Define colorbar steps
            steps = np.linspace(minz, maxz, 12)

            # Ensure that colors are strictly increasing for the colorbar
            if minz == maxz:
                if minz == 0:
                    steps = np.arange(12)
                else:
                    factors = np.arange(12) / 100 + 1
                    steps = steps * factors

        fig, axes = plt.subplots(len(times), sharex=True, figsize=figsize)

        # Loop through each time step and add to plot
        for i, time in enumerate(times):
            # itime is the index of time within self.times
            # i is the index of time within times
            itime = self.times.index(time)

            # In case plot_series is called when there's only one time step
            if len(times) > 1:
                ax = axes[i]
            else:
                ax = axes

            # Add a title to the first plot
            # (and to subsequent plots if output_times was provided)
            if i == 0:
                title = self.title

                # Add the output time if it was provided when tec was init
                if self.output_times is not None:
                    itime = self.times.index(time)
                    title += " @ t=" + str(self.output_times[itime])
                ax.set(title=title + " -- " + var)
            else:
                if self.output_times is not None:
                    title = "t = " + str(self.output_times[itime])
                    ax.set(title=title)

            if plot_type == "contour":
                cs = ax.contourf(self.griddedX, self.griddedY, z[time], steps, **kwargs)

            elif plot_type == "image":
                extent = [self.griddedX[0, 0], self.griddedX[-1, -1], self.griddedY[0, 0], self.griddedY[-1, -1]]
                cs = ax.imshow(z[time], origin="lower", extent=extent, vmin=minz, vmax=maxz, **kwargs)

            ax.set(aspect="equal")

            # Add colorbar
            divider = make_axes_locatable(ax)
            cax = divider.append_axes("right", size="2%", pad=0.2)
            plt.colorbar(cs, cax=cax)

        return fig, axes

    def outline(self, var, value=None, time=None, output_time=None):
        """For a given .tec file, get line segments that outline all the regions
        equal to the provided value. Useful for generating outlines of areas
        of a model domain sharing a single attribute (e.g., permeability) and
        later adding the outlines to a plot of a different variable.

        Parameters
        ----------
        var : str
            variable to outline (e.g., 'Porosity')
        value : float
            value to outline. The default is least-frequent value in array
        time : int
            time slice at which to create an outline. By default, outlines the first
            time slice.
        output_time : float
            output time at which to create an outline. If provided, this
            will override the `time` parameter. If both `time` and
            `output_time` are provided, `time` will be ignored.

        Returns
        -------
        segments : ndarray of float
            array of (x,y) coordinate pairs for each line segment that comprises
            the outline

        Examples
        --------
        >>> # Get stratigraphy from permeability map
        >>> perm = SpatialProfile('permeability')
        >>> segments = perm.outline('X-Perm')
        >>>
        >>> # Plot stratigraphy outlines on O2 map
        >>> conc = SpatialProfile('conc')
        >>> fig, ax = conc.plot('O2(aq)')
        >>> ax.plot(segments[:,0], segments[:,1])
        """
        # Determine which time slice to use
        if time is None and output_time is None:
            time = self.times[0]
        elif output_time is not None:
            # If output_time is provided, find the corresponding time
            if self.output_times is None:
                raise ValueError("Please define the output_times for this SpatialProfile")
            if output_time not in self.output_times:
                raise ValueError("output_time {} not found in output_times {}".format(output_time, self.output_times))
            itime = self.output_times.index(output_time)
            time = self.times[itime]

        # Extract the data for this var and time slice
        data = self.extract(var, time=time)

        # Assume least-frequent value if it isn't provided explicitly
        if value is None:
            vals, counts = np.unique(data, return_counts=True)
            value = vals[np.argmin(counts)]

        # Check that value is in data
        if np.count_nonzero(data == value) == 0:
            raise ValueError("{} not found in array".format(value))

        # Mask pixels to outline
        mask = data == value

        # Get coordinates of where to draw horizontal and vertical segments
        # I.e., where adjacent pixels are not equal to each other
        ver_seg = np.where(mask[:, 1:] != mask[:, :-1])
        hor_seg = np.where(mask[1:, :] != mask[:-1, :])

        # Create list of each line segment,
        # separated by NaN [(start_coord), (end_coord), (nan nan), ... ]
        line_segs = []
        for p in zip(*hor_seg):
            line_segs.append((p[1], p[0] + 1))
            line_segs.append((p[1] + 1, p[0] + 1))
            line_segs.append((np.nan, np.nan))

        # and the same for vertical segments
        for p in zip(*ver_seg):
            line_segs.append((p[1] + 1, p[0]))
            line_segs.append((p[1] + 1, p[0] + 1))
            line_segs.append((np.nan, np.nan))

        # Convert list to array
        segments = np.array(line_segs)

        # Before rescaling, get image extent
        x0 = self.griddedX[0, 0]
        x1 = self.griddedX[-1, -1]
        y0 = self.griddedY[0, 0]
        y1 = self.griddedY[-1, -1]

        # Rescale points according to the extent
        segments[:, 0] = x0 + (x1 - x0) * segments[:, 0] / data.shape[1]
        segments[:, 1] = y0 + (y1 - y0) * segments[:, 1] / data.shape[0]

        return segments

    def _load_check_exponent(self, ifile, skiprows, usecol):
        """Load the data from file, with error checking for a triple-digit exponent.

        Given a file, first try to read it using np.loadtxt. If that doesn't work,
        try to read it line-by-line, correcting for the missing "E" in triple-digit
        exponents.

        Parameters
        ----------
        ifile : int
            index of the file to read in from self.files
        skiprows : int
            number of header rows to skip when reading the file
        usecol : int
            column number to read in from the file (0-indexed)

        Returns
        -------
        data : ndarray of float
            1D numpy array of the data read from the file
        """
        # Pre-compile regex to save time
        neg_search = re.compile(r"([0-9][0-9])\-([0-9][0-9][0-9])")
        pos_search = re.compile(r"([0-9][0-9])\+([0-9][0-9][0-9])")

        # Try loading with .tec format first
        try:
            data = np.loadtxt(self.files[ifile], skiprows=skiprows, usecols=usecol)
        except ValueError:
            # If that fails, try parsing line-by-line
            with open(self.files[ifile], "r") as f:
                all_lines = f.readlines()

            data = np.empty(len(all_lines) - skiprows, dtype=np.float64)
            for i, line in enumerate(all_lines):
                if i < skiprows:
                    continue
                else:
                    raw_str = line.split()[usecol]
                    if re.search(neg_search, raw_str):
                        corr_val = re.sub(neg_search, r"\1E-\2", raw_str)
                    elif re.search(pos_search, raw_str):
                        corr_val = re.sub(pos_search, r"\1E+\2", raw_str)
                    else:
                        corr_val = raw_str

                data[i - skiprows] = float(corr_val)

        return data


if __name__ == "__main__":
    print(SpatialProfile.__doc__)