diff --git a/.gitignore b/.gitignore index bf6a22fc6..957306f03 100644 --- a/.gitignore +++ b/.gitignore @@ -2,3 +2,6 @@ *.patch _build *.pt +*.vscode* +.DS_Store +generated_rtd* diff --git a/.readthedocs.yml b/.readthedocs.yaml similarity index 86% rename from .readthedocs.yml rename to .readthedocs.yaml index e2c25ef5e..16f057784 100644 --- a/.readthedocs.yml +++ b/.readthedocs.yaml @@ -4,10 +4,13 @@ version: 2 +build: + image: latest + sphinx: configuration: doc/rtd/conf.py python: - version: 3.7 + version: 3.8 install: - requirements: doc/rtd/requirements.txt diff --git a/.travis.yml b/.travis.yml index 909717b1d..72b7b9552 100644 --- a/.travis.yml +++ b/.travis.yml @@ -17,7 +17,7 @@ env: - BUILD_TYPE=Debug - TECA_DIR=/travis_teca_dir - TECA_PYTHON_VERSION=3 - - TECA_DATA_REVISION=101 + - TECA_DATA_REVISION=117 jobs: - DOCKER_IMAGE=ubuntu IMAGE_VERSION=20.04 IMAGE_NAME=ubuntu_20_04 REQUIRE_NETCDF_MPI=TRUE - DOCKER_IMAGE=ubuntu IMAGE_VERSION=20.04 IMAGE_NAME=ubuntu_20_04 REQUIRE_NETCDF_MPI=FALSE diff --git a/CMake/teca_app.cmake b/CMake/teca_app.cmake index fbaa0e923..82bb06234 100644 --- a/CMake/teca_app.cmake +++ b/CMake/teca_app.cmake @@ -31,6 +31,7 @@ function (teca_add_app app_name) teca_system teca_core teca_data teca_io teca_alg ${APP_LIBS}) endif() + set_target_properties(${app_name} PROPERTIES APP_TYPE C++) install(TARGETS ${app_name} RUNTIME DESTINATION ${BIN_PREFIX}) else() message(STATUS "command line application ${app_name} -- disabled") diff --git a/CMake/teca_python.cmake b/CMake/teca_python.cmake index 6ee3f7397..b94dcb80c 100644 --- a/CMake/teca_python.cmake +++ b/CMake/teca_python.cmake @@ -60,6 +60,8 @@ function (teca_add_python_app app_name) if (NOT APP_SOURCES) set(APP_SOURCES "${app_name}.in") endif() + add_custom_target(${app_name}) + set_target_properties(${app_name} PROPERTIES APP_TYPE Python) teca_py_install_apps(${APP_SOURCES}) else() message(STATUS "command line application ${app_name} -- disabled") diff --git a/CMake/teca_test.cmake b/CMake/teca_test.cmake index 375c3524f..346eaf319 100644 --- a/CMake/teca_test.cmake +++ b/CMake/teca_test.cmake @@ -51,3 +51,9 @@ function (teca_add_test T_NAME) endif() endif() endfunction() + +function (teca_add_app_test T_NAME T_TARGET) + if (TARGET ${T_TARGET}) + teca_add_test(${T_NAME} ${ARGV}) + endif() +endfunction() diff --git a/CMakeLists.txt b/CMakeLists.txt index c1ecb1fbb..4eb5ff0ff 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -387,26 +387,50 @@ if (BUILD_TESTING) # figure out how many cores we can use for parallel tests set(TECA_TEST_CORES 0 CACHE STRING "Max number of cores for use in parallel tests") + + # by default assume 2 hyperthreads per core, if this is not + # the case override here + set(HYPERTHREADS_PER_CORE 2 CACHE STRING + "The number of hyperthreads per core.") + + # use CMake to get the number of logical cores. includes hyperthreads + # in the count. if (TECA_TEST_CORES LESS 1) ProcessorCount(LOGICAL_CORES) if (LOGICAL_CORES EQUAL 0) - set(LOGICAL_CORES 4) + message(FATAL_ERROR "Failed to detect the number of cores. 
" + "Set TECA_TEST_CORES") endif() else() - math(EXPR LOGICAL_CORES "${TECA_TEST_CORES}*2") + math(EXPR LOGICAL_CORES "${TECA_TEST_CORES}*${HYPERTHREADS_PER_CORE}") endif() - math(EXPR PHYSICAL_CORES "${LOGICAL_CORES}/2") - if (PHYSICAL_CORES LESS 3) - set(TEST_CORES 2) - set(HALF_TEST_CORES 2) - set(TWICE_TEST_CORES 4) - else() - set(TEST_CORES ${PHYSICAL_CORES}) - math(EXPR HALF_TEST_CORES "${TEST_CORES}/2") - set(TWICE_TEST_CORES ${LOGICAL_CORES}) + + # adjust count for hyperthreads. + math(EXPR PHYSICAL_CORES "${LOGICAL_CORES}/${HYPERTHREADS_PER_CORE}") + if (PHYSICAL_CORES LESS 1) + message(FATAL_ERROR "Invalid CPU configuration. " + "LOGICAL_CORES=${LOGICAL_CORES} HYPERTHREADS_PER_CORE=" + "${HYPERTHREADS_PER_CORE}") endif() + + # set the number of cores to use for pure MPI or purely threaded tests + set(TEST_CORES ${PHYSICAL_CORES}) message(STATUS "regression testing -- enabled (${TEST_CORES} cores).") + # set the number of cores to use for MPI + threads tests. if there are too + # few physical cores then disable hybrid parallel tests + math(EXPR HALF_TEST_CORES "${TEST_CORES}/2") + if (HALF_TEST_CORES LESS 2) + message(STATUS "Hybrid parallel tests -- disabled.") + set(TEST_MPI_THREADS OFF) + else() + message(STATUS "Hybrid parallel tests -- enabled.") + set(TEST_MPI_THREADS ON) + endif() + + # set the number of cores for oversubscription/streaming tests + math(EXPR TWICE_TEST_CORES "${TEST_CORES}*2") + add_subdirectory(test) else() message(STATUS "regression testing -- disbaled") diff --git a/README.md b/README.md index 8e0485626..a10c5ad87 100644 --- a/README.md +++ b/README.md @@ -1,4 +1,8 @@ - + + +
PyPI version @@ -8,7 +12,7 @@ TECA is a collection of climate analysis algorithms geared toward extreme event detection and tracking implemented in a scalable parallel framework. The code has been successfully deployed and run at massive scales on current DOE supercomputers. TECA's core is written in modern C++ and exploits MPI + X parallelism where X is one of threads, OpenMP, or GPUs. The framework supports a number of parallel design patterns including distributed data parallelism and map-reduce. While modern C++ delivers the highest performance, Python bindings make the code approachable and easy to use. ### Documentation -The [TECA User's Guide](https://teca.readthedocs.io/en/latest/) is the authorotative source for documentation on topics such as [installing TECA](https://teca.readthedocs.io/en/latest/installation.html), running TECA's [command line applications](https://teca.readthedocs.io/en/latest/applications.html), and [Python development](https://teca.readthedocs.io/en/latest/python.html). +The [TECA User's Guide](https://teca.readthedocs.io/en/latest/) is the authoritative source for documentation on topics such as [installing TECA](https://teca.readthedocs.io/en/latest/installation.html), running TECA's [command line applications](https://teca.readthedocs.io/en/latest/applications.html), and [Python development](https://teca.readthedocs.io/en/latest/python.html). The TECA source code is documented on our [Doxygen site](https://teca.readthedocs.io/en/latest/doxygen/index.html). ### Tutorials The [TECA tutorials](https://sourceforge.net/p/teca/TECA_tutorials) subversion repository contains slides from previous tutorials. diff --git a/alg/CMakeLists.txt b/alg/CMakeLists.txt index 48038978d..d8f7e1734 100644 --- a/alg/CMakeLists.txt +++ b/alg/CMakeLists.txt @@ -21,16 +21,20 @@ set(teca_alg_cxx_srcs teca_component_statistics.cxx teca_derived_quantity.cxx teca_descriptive_statistics.cxx + teca_elevation_mask.cxx teca_evaluate_expression.cxx teca_face_to_cell_centering.cxx teca_geography.cxx + teca_indexed_dataset_cache.cxx teca_integrated_vapor_transport.cxx + teca_integrated_water_vapor.cxx teca_l2_norm.cxx teca_latitude_damper.cxx teca_laplacian.cxx teca_mask.cxx teca_normalize_coordinates.cxx teca_parser.cxx + teca_rename_variables.cxx teca_table_calendar.cxx teca_table_reduce.cxx teca_table_region_mask.cxx @@ -41,7 +45,8 @@ set(teca_alg_cxx_srcs teca_tc_classify.cxx teca_tc_wind_radii.cxx teca_tc_trajectory.cxx - teca_temporal_average.cxx + teca_simple_moving_average.cxx + teca_unpack_data.cxx teca_valid_value_mask.cxx teca_variant_array_operand.cxx teca_vertical_coordinate_transform.cxx diff --git a/alg/teca_2d_component_area.cxx b/alg/teca_2d_component_area.cxx index 285d40f52..9bdcbac60 100644 --- a/alg/teca_2d_component_area.cxx +++ b/alg/teca_2d_component_area.cxx @@ -132,11 +132,13 @@ void teca_2d_component_area::get_properties_description( "name of the varibale containing region labels") TECA_POPTS_GET(int, prefix, contiguous_component_ids, "when the region label ids start at 0 and are consecutive " - "this flag enables use of an optimization (0)") + "this flag enables use of an optimization") TECA_POPTS_GET(long, prefix, background_id, - "the label id that corresponds to the background (-1)") + "the label id that corresponds to the background") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -144,6 +146,8 @@ void teca_2d_component_area::set_properties(const 
std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, component_variable) TECA_POPTS_SET(opts, int, prefix, contiguous_component_ids) TECA_POPTS_SET(opts, long, prefix, background_id) diff --git a/alg/teca_2d_component_area.h b/alg/teca_2d_component_area.h index 5a9d57e6a..54f4a2e42 100644 --- a/alg/teca_2d_component_area.h +++ b/alg/teca_2d_component_area.h @@ -10,40 +10,40 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_2d_component_area) -/// an algorithm that computes the area of labeled regions +/// An algorithm that computes the areas of labeled regions /** -Given a set of labels on a Cartesian mesh, the algorithm computes the area of -each region. Regions are identified by assigning a unique integer value to each -mesh point that belongs in the region. The component_variable property names -the variable containing the region labels. - -if the region labels start at 0 and are contiguous then an optimization can be -used. Set contiguous_component_ids property to enable the optimization. Note that -TECA's connected component labeler assigns the background (i.e. cells not inside -the segmentation) the label 0. One can identify the background region and area -via this label. When processing data generated outside of TECA it might be -necessary to supply the background label. Use -2 if there is no background. - -the input dataset is passed through and the results of the calculations are -stored in the output dataset metadata in the following keys: - - number_of_components - number of component ids for which area was - computed. Note that this can include a background - component i.e. for cells outside of the segmentation. - - component_ids - a vector containing the label of each component. This is - always starts with 0, where the label 0 identifies cells - out side of the segmentation, and ranges up to - number_of_components - 1, where the labels from 1 up to - number_of_components - 1 identify connected regions of - cells inside the segmentation. - - component_area - a vector containing the area for the corresponding entry - in the component_ids array. - - background_id - the label used for cells outside of the segmentation, - i.e. the background. This can be used to skip processing - of the background when desirable. + * Given a set of labels on a Cartesian mesh, the algorithm computes the area + * of each region. Regions are identified by assigning a unique integer value + * to each mesh point that belongs in the region. The component_variable + * property names the variable containing the region labels. + * + * if the region labels start at 0 and are contiguous then an optimization can + * be used. Set contiguous_component_ids property to enable the optimization. + * Note that TECA's connected component labeler assigns the background (i.e. + * cells not inside the segmentation) the label 0. One can identify the + * background region and area via this label. When processing data generated + * outside of TECA it might be necessary to supply the background label. Use -2 + * if there is no background. + * + * the input dataset is passed through and the results of the calculations are + * stored in the output dataset metadata in the following keys: + * + * | name | description | + * | ---- | ----------- | + * | number_of_components | number of component ids for which area was | + * | | computed. Note that this can include a background | + * | | component i.e. for cells outside of the segmentation. 
| + * | component_ids | a vector containing the label of each component. This | + * | | always starts with 0, where the label 0 identifies | + * | | cells outside of the segmentation, and ranges up | + * | | to number_of_components - 1, where the labels from | + * | | 1 up to number_of_components - 1 identify | + * | | connected regions of cells inside the segmentation. | + * | component_area | a vector containing the area for the corresponding | + * | | entry in the component_ids array. | + * | background_id | the label used for cells outside of the segmentation, | + * | | i.e. the background. This can be used to skip processing | + * | | of the background when desirable. | */ class teca_2d_component_area : public teca_algorithm { @@ -53,23 +53,40 @@ class teca_2d_component_area : public teca_algorithm TECA_ALGORITHM_CLASS_NAME(teca_2d_component_area) ~teca_2d_component_area(); - // report/initialize to/from Boost program options objects. + /** @name program_options + * report/initialize to/from Boost program options objects. + */ + ///@{ TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() + ///@} - // set the name of the input array + /** @name component_variable + * Sets the name of the array containing component labels to compute the + * area of. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_variable) + ///@} - // set this only if you know for certain that label ids are contiguous and - // start at 0. this enables use of a faster implementation. + /** @name contiguous_component_ids + * set this only if you know for certain that label ids are contiguous and + * start at 0. this enables use of a faster implementation. + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, contiguous_component_ids) - - // set this to override the component label used for background. By default - // this is set to -1 to indicate that the value should be obtained from the - // metadata key `background_id`. Note that TECA's connected component - // labeler uses the id 0 for the background and passes this in a metadata - // key and as a result no action is required. + ///@} + + /** @name background_id + * set this to override the component label used for background. By default + * this is set to -1 to indicate that the value should be obtained from the + * metadata key `background_id`. Note that TECA's connected component + * labeler uses the id 0 for the background and passes this in a metadata + * key and as a result no action is required. 
+ */ + ///@{ TECA_ALGORITHM_PROPERTY(long, background_id) + ///@} protected: teca_2d_component_area(); diff --git a/alg/teca_apply_binary_mask.cxx b/alg/teca_apply_binary_mask.cxx index 4ec27d4df..0e2d9aa8b 100644 --- a/alg/teca_apply_binary_mask.cxx +++ b/alg/teca_apply_binary_mask.cxx @@ -1,26 +1,44 @@ #include "teca_apply_binary_mask.h" -#include "teca_mesh.h" +#include "teca_cartesian_mesh.h" #include "teca_array_collection.h" #include "teca_variant_array.h" #include "teca_metadata.h" -#include "teca_mesh.h" +#include "teca_array_attributes.h" +#include "teca_mpi_util.h" #include #include -#include #include -using std::deque; -using std::vector; -using std::set; +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +//#define TECA_DEBUG + using std::cerr; using std::endl; -//#define TECA_DEBUG +namespace internal +{ +// output = mask*input +template +void apply_mask(var_t * __restrict__ output, + const mask_t * __restrict__ mask, + const var_t * __restrict__ input, + unsigned long n) +{ + for (size_t i = 0; i < n; ++i) + output[i] = mask[i]*input[i]; +} +} // -------------------------------------------------------------------------- -teca_apply_binary_mask::teca_apply_binary_mask() : mask_variable("") +teca_apply_binary_mask::teca_apply_binary_mask() : + mask_variable(""), output_variable_prefix("masked_") { this->set_number_of_input_connections(1); this->set_number_of_output_ports(1); @@ -30,6 +48,125 @@ teca_apply_binary_mask::teca_apply_binary_mask() : mask_variable("") teca_apply_binary_mask::~teca_apply_binary_mask() {} +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_apply_binary_mask::get_properties_description( + const std::string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_apply_binary_mask":prefix)); + + opts.add_options() + TECA_POPTS_MULTI_GET(std::vector, prefix, masked_variables, + "A list of variables to apply the mask to.") + TECA_POPTS_GET(std::string, prefix, mask_variable, + "The name of the variable containing the mask values.") + TECA_POPTS_GET(std::string, prefix, output_variable_prefix, + "A string prepended to the output variable names. 
If empty the" + " input variables will be replaced by their masked results") + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_apply_binary_mask::set_properties( + const std::string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, std::vector, prefix, masked_variables) + TECA_POPTS_SET(opts, std::string, prefix, mask_variable) + TECA_POPTS_SET(opts, std::string, prefix, output_variable_prefix) +} +#endif + +// -------------------------------------------------------------------------- +std::string teca_apply_binary_mask::get_output_variable_name(std::string input_var) +{ + return this->output_variable_prefix + input_var; +} + +// -------------------------------------------------------------------------- +void teca_apply_binary_mask::get_output_variable_names( + std::vector &names) +{ + int n_inputs = this->masked_variables.size(); + for (int i = 0; i < n_inputs; ++i) + { + names.push_back( + this->get_output_variable_name(this->masked_variables[i])); + } +} + +// -------------------------------------------------------------------------- +teca_metadata teca_apply_binary_mask::get_output_metadata( + unsigned int port, + const std::vector &input_md) +{ +#ifdef TECA_DEBUG + cerr << teca_parallel_id() + << "teca_apply_binary_mask::get_output_metadata" << endl; +#endif + (void)port; + + // check that the input variables have been specified. + // this is likely a user error. + if (this->masked_variables.empty() && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_WARNING("Nothing to do, masked_variables have not" + " been specified.") + } + + // add in the array we will generate + teca_metadata out_md(input_md[0]); + + // get the attributes + teca_metadata attributes; + out_md.get("attributes", attributes); + + // construct the list of output variable names + for (auto& input_var : masked_variables) + { + std::string output_var = this->get_output_variable_name(input_var); + + // add the varible to the list of output variables + out_md.append("variables", output_var); + + // insert attributes to enable this variable to be written by the CF writer + teca_metadata input_atts; + if (attributes.get(input_var, input_atts)) + { + TECA_WARNING("Failed to get attributes for \"" << input_var + << "\". Writing the result will not be possible") + } + else + { + // copy the attributes from the input. this will capture the + // data type, size, units, etc. 
+ teca_array_attributes output_atts(input_atts); + + // update description and long name + output_atts.description = input_var + + " multiplied by " + this->mask_variable; + + output_atts.long_name.clear(); + + // update the array attributes + attributes.set(output_var, (teca_metadata)output_atts); + } + + } + + // update the attributes + out_md.set("attributes", attributes); + + return out_md; +} + // -------------------------------------------------------------------------- std::vector teca_apply_binary_mask::get_upstream_request( unsigned int port, const std::vector &input_md, @@ -42,9 +179,9 @@ std::vector teca_apply_binary_mask::get_upstream_request( (void) port; (void) input_md; - vector up_reqs; + std::vector up_reqs; - // get the name of the array to request + // get the name of the mask array if (this->mask_variable.empty()) { TECA_ERROR("A mask variable was not specified") @@ -55,11 +192,36 @@ std::vector teca_apply_binary_mask::get_upstream_request( // add in what we need teca_metadata req(request); std::set arrays; + if (req.has("arrays")) req.get("arrays", arrays); + arrays.insert(this->mask_variable); - if (!this->mask_arrays.empty()) - arrays.insert(this->mask_arrays.begin(), this->mask_arrays.end()); + + // check that the input variables have been specified. + // this is likely a user error. + if (this->masked_variables.empty() && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_WARNING("Nothing to do, masked_variables have not" + " been specified.") + } + + // request the arrays to mask + for (auto& input_var : masked_variables) + { + // request the needed variable + arrays.insert(input_var); + + // intercept request for our output if the variable will have a new name + std::string out_var = this->get_output_variable_name(input_var); + if (out_var != input_var) + { + arrays.erase(out_var); + } + } + + // update the list of arrays to request req.set("arrays", arrays); // send up @@ -79,68 +241,80 @@ const_p_teca_dataset teca_apply_binary_mask::execute( (void)request; // get the input - const_p_teca_mesh in_mesh = - std::dynamic_pointer_cast(input_data[0]); + const_p_teca_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); if (!in_mesh) { - TECA_ERROR("empty input, or not a mesh") + TECA_ERROR("Failed to apply mask. 
Dataset is not a teca_mesh") return nullptr; } - // create output and copy metadata, coordinates, etc + // create the output mesh, pass everything through + // masked arrays are added or replaced below p_teca_mesh out_mesh = - std::dynamic_pointer_cast(in_mesh->new_instance()); - out_mesh->copy(in_mesh); + std::static_pointer_cast + (std::const_pointer_cast(in_mesh)->new_shallow_copy()); - // get the mask array + // check that a masking variable has been provided if (this->mask_variable.empty()) { - TECA_ERROR("A mask variable was not specified") + TECA_ERROR("The mask_variable name was not specified") return nullptr; } - p_teca_array_collection arrays = out_mesh->get_point_arrays(); - - p_teca_variant_array mask_array = arrays->get(this->mask_variable); + // get the mask array + const_p_teca_variant_array mask_array + = in_mesh->get_point_arrays()->get(this->mask_variable); if (!mask_array) { - TECA_ERROR("mask variable \"" << this->mask_variable - << "\" is not in the input") + TECA_ERROR("The mask_variable \"" << this->mask_variable + << "\" was requested but is not present in the input data.") return nullptr; } // apply the mask - unsigned long nelem = mask_array->size(); + NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, + mask_array.get(), _MASK, - NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, - mask_array.get(), _1, + // loop over input variables + for (auto& input_var : masked_variables) + { + std::string output_var = this->get_output_variable_name(input_var); - NT_1 *pmask = static_cast(mask_array.get())->get(); + // get the input array + const_p_teca_variant_array input_array + = in_mesh->get_point_arrays()->get(input_var); + if (!input_array) + { + TECA_ERROR("The masked_variable \"" << input_var + << "\" was requested but is not present in the input data.") + return nullptr; + } - unsigned int narrays = arrays->size(); - for (unsigned int i = 0; i < narrays; ++i) - { - // if the user provided a list, restrict masking to that - // list. and if not, mask everything - if (!this->mask_arrays.empty() && - !std::count(this->mask_arrays.begin(), - this->mask_arrays.end(), arrays->get_name(i))) - continue; + // allocate the output array + size_t n = input_array->size(); - p_teca_variant_array array = arrays->get(i); + p_teca_variant_array output_array = input_array->new_instance(n); - NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, - array.get(), _2, + //output_array->resize(n); - NT_2 *parray = static_cast(array.get())->get(); + // do the mask calculation + NESTED_TEMPLATE_DISPATCH( + teca_variant_array_impl, + output_array.get(), _VAR, - for (unsigned long q = 0; q < nelem; ++q) - { - parray[q] *= static_cast(pmask[q]); - } + internal::apply_mask( + dynamic_cast(output_array.get())->get(), + static_cast(mask_array.get())->get(), + static_cast(input_array.get())->get(), + n); ) + + out_mesh->get_point_arrays()->set( + output_var, output_array); } - ) + ) + return out_mesh; } diff --git a/alg/teca_apply_binary_mask.h b/alg/teca_apply_binary_mask.h index f30a1081e..ceeed4040 100644 --- a/alg/teca_apply_binary_mask.h +++ b/alg/teca_apply_binary_mask.h @@ -10,12 +10,26 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_apply_binary_mask) -/// an algorithm that applies a binary mask multiplicatively +/// Applies a mask to a given list of variables /** -an algorithm that applies a binary mask multiplicatively to all -arrays in the input dataset. where mask is 1 values are passed -through, where mask is 0 values are removed. 
-*/ + * Given a mask variable, this routine applies the mask to a list of input + * variables. + * + * The mask variable can either be binary, or it can represent a probability + * ranging from 0 to 1. For mask variable `mask` and input variable `var`, this + * algorithm computes `mask * var` and sends the resulting array downstream; this + * masking operation is applied for all variables in the input list. + * + * A potential use-case for this algorithm is masking quantities like + * precipitation by the probability of atmospheric river presence; the average + * of this masked precipitation variable gives the average precipitation due to + * atmospheric rivers. + * + * The output variable names are given a prefix to distinguish them from the + * upstream versions. E.g., if the algorithm property `output_variable_prefix` is set + * to 'ar_', and the variable being masked is 'precip', then the output array + * name is 'ar_precip'. + */ class teca_apply_binary_mask : public teca_algorithm { public: @@ -24,19 +38,48 @@ class teca_apply_binary_mask : public teca_algorithm TECA_ALGORITHM_CLASS_NAME(teca_apply_binary_mask) ~teca_apply_binary_mask(); - // set the name of the output array + // report/initialize to/from Boost program options + // objects. + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + + /** @name mask_variable + * set the name of the variable containing the mask values + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, mask_variable) + ///@} + + /** @name masked_variable + * A list of variables to apply the mask to. If empty no arrays will be + * requested, and no variables will be masked + */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(std::string, masked_variable) + ///@} - // set the arrays to mask. if empty no arrays will be - // requested, but all present will be masked - TECA_ALGORITHM_VECTOR_PROPERTY(std::string, mask_array) + /** @name output_variable_prefix + * A prefix for the names of the variables that have been masked. If this + * is empty masked data replaces its input, otherwise input data is + * preserved and masked data is added. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, output_variable_prefix) + ///@} + + /** helper that constructs and returns the result variable names taking + * into account the list of masked_variables and the output_variable_prefix. + * use this to know what variables will be produced. 
+ */ + void get_output_variable_names(std::vector &names); protected: teca_apply_binary_mask(); private: - //teca_metadata get_output_metadata(unsigned int port, - // const std::vector &input_md) override; + teca_metadata get_output_metadata( + unsigned int port, + const std::vector &input_md) override; std::vector get_upstream_request( unsigned int port, const std::vector &input_md, @@ -46,9 +89,14 @@ class teca_apply_binary_mask : public teca_algorithm const std::vector &input_data, const teca_metadata &request) override; + // helper that given and input variable name constructs the result variable + // name taking into account the output_variable_prefix + std::string get_output_variable_name(std::string input_var); + private: std::string mask_variable; - std::vector mask_arrays; + std::vector masked_variables; + std::string output_variable_prefix; }; #endif diff --git a/alg/teca_ar_detect.cxx b/alg/teca_ar_detect.cxx deleted file mode 100644 index 23b848c3b..000000000 --- a/alg/teca_ar_detect.cxx +++ /dev/null @@ -1,1347 +0,0 @@ -#include "teca_ar_detect.h" - -#include "teca_cartesian_mesh.h" -#include "teca_variant_array.h" -#include "teca_table.h" -#include "teca_calendar.h" -#include "teca_coordinate_util.h" - -#include -#include -#include -#include -#include - -#if defined(TECA_HAS_BOOST) -#include -#endif - -using std::cerr; -using std::endl; - -#define TECA_DEBUG 0 -#if TECA_DEBUG > 0 -#include "teca_cartesian_mesh_writer.h" -#include "teca_programmable_algorithm.h" -int write_mesh( - const const_p_teca_cartesian_mesh &mesh, - const const_p_teca_variant_array &vapor, - const const_p_teca_variant_array &thres, - const const_p_teca_variant_array &ccomp, - const const_p_teca_variant_array &lsmask, - const std::string &base_name); -#endif - -// a description of the atmospheric river -struct atmospheric_river -{ - atmospheric_river() : - pe(false), length(0.0), - min_width(0.0), max_width(0.0), - end_top_lat(0.0), end_top_lon(0.0), - end_bot_lat(0.0), end_bot_lon(0.0) - {} - - bool pe; - double length; - double min_width; - double max_width; - double end_top_lat; - double end_top_lon; - double end_bot_lat; - double end_bot_lon; -}; - -std::ostream &operator<<(std::ostream &os, const atmospheric_river &ar) -{ - os << " type=" << (ar.pe ? "PE" : "AR") - << " length=" << ar.length - << " width=" << ar.min_width << ", " << ar.max_width - << " bounds=" << ar.end_bot_lon << ", " << ar.end_bot_lat << ", " - << ar.end_top_lon << ", " << ar.end_top_lat; - return os; -} - -unsigned sauf(const unsigned nrow, const unsigned ncol, unsigned int *image); - -bool ar_detect( - const_p_teca_variant_array lat, - const_p_teca_variant_array lon, - const_p_teca_variant_array land_sea_mask, - p_teca_unsigned_int_array con_comp, - unsigned long n_comp, - double river_start_lat, - double river_start_lon, - double river_end_lat_low, - double river_end_lon_low, - double river_end_lat_high, - double river_end_lon_high, - double percent_in_mesh, - double river_width, - double river_length, - double land_threshold_low, - double land_threshold_high, - atmospheric_river &ar); - -// set locations in the output where the input array -// has values within the low high range. -template -void threshold( - const T *input, unsigned int *output, - size_t n_vals, T low, T high) -{ - for (size_t i = 0; i < n_vals; ++i) - output[i] = ((input[i] >= low) && (input[i] <= high)) ? 
1 : 0; -} - - - -// -------------------------------------------------------------------------- -teca_ar_detect::teca_ar_detect() : - water_vapor_variable("prw"), - land_sea_mask_variable(""), - low_water_vapor_threshold(20), - high_water_vapor_threshold(75), - search_lat_low(19.0), - search_lon_low(180.0), - search_lat_high(56.0), - search_lon_high(250.0), - river_start_lat_low(18.0), - river_start_lon_low(180.0), - river_end_lat_low(29.0), - river_end_lon_low(233.0), - river_end_lat_high(56.0), - river_end_lon_high(238.0), - percent_in_mesh(5.0), - river_width(1250.0), - river_length(2000.0), - land_threshold_low(1.0), - land_threshold_high(std::numeric_limits::max()) -{ - this->set_number_of_input_connections(1); - this->set_number_of_output_ports(1); -} - -// -------------------------------------------------------------------------- -teca_ar_detect::~teca_ar_detect() -{} - -#if defined(TECA_HAS_BOOST) -// -------------------------------------------------------------------------- -void teca_ar_detect::get_properties_description( - const std::string &prefix, options_description &opts) -{ - options_description ard_opts("Options for " - + (prefix.empty()?"teca_ar_detect":prefix)); - - ard_opts.add_options() - TECA_POPTS_GET(std::string, prefix, water_vapor_variable, - "name of variable containing water vapor values") - TECA_POPTS_GET(double, prefix, low_water_vapor_threshold, - "low water vapor threshold") - TECA_POPTS_GET(double, prefix, high_water_vapor_threshold, - "high water vapor threshold") - TECA_POPTS_GET(double, prefix, search_lat_low, - "search space low latitude") - TECA_POPTS_GET(double, prefix, search_lon_low, - "search space low longitude") - TECA_POPTS_GET(double, prefix, search_lat_high, - "search space high latitude") - TECA_POPTS_GET(double, prefix, search_lon_high, - "search space high longitude") - TECA_POPTS_GET(double, prefix, river_start_lat_low, - "latitude used to classify as AR or PE") - TECA_POPTS_GET(double, prefix, river_start_lon_low, - "longitude used to classify as AR or PE") - TECA_POPTS_GET(double, prefix, river_end_lat_low, - "CA coastal region low latitude") - TECA_POPTS_GET(double, prefix, river_end_lon_low, - "CA coastal region low longitude") - TECA_POPTS_GET(double, prefix, river_end_lat_high, - "CA coastal region high latitude") - TECA_POPTS_GET(double, prefix, river_end_lon_high, - "CA coastal region high longitude") - TECA_POPTS_GET(double, prefix, percent_in_mesh, - "size of river in relation to search space area") - TECA_POPTS_GET(double, prefix, river_width, - "minimum river width") - TECA_POPTS_GET(double, prefix, river_length, - "minimum river length") - TECA_POPTS_GET(std::string, prefix, land_sea_mask_variable, - "name of variable containing land-sea mask values") - TECA_POPTS_GET(double, prefix, land_threshold_low, - "low land value") - TECA_POPTS_GET(double, prefix, land_threshold_high, - "high land value") - ; - - opts.add(ard_opts); -} - -// -------------------------------------------------------------------------- -void teca_ar_detect::set_properties( - const std::string &prefix, variables_map &opts) -{ - TECA_POPTS_SET(opts, std::string, prefix, water_vapor_variable) - TECA_POPTS_SET(opts, double, prefix, low_water_vapor_threshold) - TECA_POPTS_SET(opts, double, prefix, high_water_vapor_threshold) - TECA_POPTS_SET(opts, double, prefix, search_lat_low) - TECA_POPTS_SET(opts, double, prefix, search_lon_low) - TECA_POPTS_SET(opts, double, prefix, search_lat_high) - TECA_POPTS_SET(opts, double, prefix, search_lon_high) - 
TECA_POPTS_SET(opts, double, prefix, river_start_lat_low) - TECA_POPTS_SET(opts, double, prefix, river_start_lon_low) - TECA_POPTS_SET(opts, double, prefix, river_end_lat_low) - TECA_POPTS_SET(opts, double, prefix, river_end_lon_low) - TECA_POPTS_SET(opts, double, prefix, river_end_lat_high) - TECA_POPTS_SET(opts, double, prefix, river_end_lon_high) - TECA_POPTS_SET(opts, double, prefix, percent_in_mesh) - TECA_POPTS_SET(opts, double, prefix, river_width) - TECA_POPTS_SET(opts, double, prefix, river_length) - TECA_POPTS_SET(opts, std::string, prefix, land_sea_mask_variable) - TECA_POPTS_SET(opts, double, prefix, land_threshold_low) - TECA_POPTS_SET(opts, double, prefix, land_threshold_high) -} - -#endif - -// -------------------------------------------------------------------------- -teca_metadata teca_ar_detect::get_output_metadata( - unsigned int port, - const std::vector &input_md) -{ -#if TECA_DEBUG > 1 - cerr << teca_parallel_id() - << "teca_ar_detect::get_output_metadata" << endl; -#endif - (void)port; - - teca_metadata output_md(input_md[0]); - return output_md; -} - -// -------------------------------------------------------------------------- -std::vector teca_ar_detect::get_upstream_request( - unsigned int port, - const std::vector &input_md, - const teca_metadata &request) -{ -#if TECA_DEBUG > 1 - cerr << teca_parallel_id() - << "teca_ar_detect::get_upstream_request" << endl; -#endif - (void)port; - - std::vector up_reqs; - - teca_metadata md = input_md[0]; - - // locate the extents of the user supplied region of - // interest - teca_metadata coords; - if (md.get("coordinates", coords)) - { - TECA_ERROR("metadata is missing \"coordinates\"") - return up_reqs; - } - - p_teca_variant_array lat; - p_teca_variant_array lon; - if (!(lat = coords.get("y")) || !(lon = coords.get("x"))) - { - TECA_ERROR("metadata missing lat lon coordinates") - return up_reqs; - } - - std::vector bounds = {this->search_lon_low, - this->search_lon_high, this->search_lat_low, - this->search_lat_high, 0.0, 0.0}; - - // build the request - std::vector arrays; - request.get("arrays", arrays); - arrays.push_back(this->water_vapor_variable); - if (!this->land_sea_mask_variable.empty()) - arrays.push_back(this->land_sea_mask_variable); - - teca_metadata up_req(request); - up_req.set("arrays", arrays); - up_req.set("bounds", bounds); - - up_reqs.push_back(up_req); - return up_reqs; -} - -// -------------------------------------------------------------------------- -const_p_teca_dataset teca_ar_detect::execute( - unsigned int port, - const std::vector &input_data, - const teca_metadata &request) -{ -#if TECA_DEBUG > 1 - cerr << teca_parallel_id() << "teca_ar_detect::execute"; - this->to_stream(cerr); - cerr << endl; -#endif - (void)port; - (void)request; - - // get the input dataset - const_p_teca_cartesian_mesh mesh - = std::dynamic_pointer_cast(input_data[0]); - if (!mesh) - { - TECA_ERROR("invalid input. teca_cartesian_mesh is required") - return nullptr; - } - - // get coordinate arrays - const_p_teca_variant_array lat = mesh->get_y_coordinates(); - const_p_teca_variant_array lon = mesh->get_x_coordinates(); - - if (!lon || !lat) - { - TECA_ERROR("invalid mesh. 
missing lat lon coordinates") - return nullptr; - } - - // get land sea mask - const_p_teca_variant_array land_sea_mask; - if (this->land_sea_mask_variable.empty() || - !(land_sea_mask = mesh->get_point_arrays()->get(this->land_sea_mask_variable))) - { - // input doesn't have it, generate a stand in such - // that land fall criteria will evaluate true - size_t n = lat->size()*lon->size(); - p_teca_double_array lsm = teca_double_array::New(n, this->land_threshold_low); - land_sea_mask = lsm; - } - - // get the mesh extents - std::vector extent; - mesh->get_extent(extent); - - unsigned long num_rows = extent[3] - extent[2] + 1; - unsigned long num_cols = extent[1] - extent[0] + 1; - unsigned long num_rc = num_rows*num_cols; - - // get water vapor data - const_p_teca_variant_array water_vapor - = mesh->get_point_arrays()->get(this->water_vapor_variable); - - if (!water_vapor) - { - TECA_ERROR( - << "Dataset missing water vapor variable \"" - << this->water_vapor_variable << "\"") - return nullptr; - } - - p_teca_table event = teca_table::New(); - - event->declare_columns( - "time", double(), "time_step", long(), - "length", double(), "min width", double(), - "max width", double(), "end_top_lat", double(), - "end_top_lon", double(), "end_bot_lat", double(), - "end_bot_lon", double(), "type", std::string()); - - // get calendar - std::string calendar; - mesh->get_calendar(calendar); - event->set_calendar(calendar); - - // get units - std::string units; - mesh->get_time_units(units); - event->set_time_units(units); - - // get time step - unsigned long time_step; - mesh->get_time_step(time_step); - - // get offset of the current timestep - double time = 0.0; - mesh->get_time(time); - - TEMPLATE_DISPATCH( - const teca_variant_array_impl, - water_vapor.get(), - - const NT *p_wv = dynamic_cast(water_vapor.get())->get(); - - // threshold - p_teca_unsigned_int_array con_comp - = teca_unsigned_int_array::New(num_rc, 0); - - unsigned int *p_con_comp = con_comp->get(); - - threshold(p_wv, p_con_comp, num_rc, - static_cast(this->low_water_vapor_threshold), - static_cast(this->high_water_vapor_threshold)); - -#if TECA_DEBUG > 0 - p_teca_variant_array thresh = con_comp->new_copy(); -#endif - - // label - int num_comp = sauf(num_rows, num_cols, p_con_comp); - -#if TECA_DEBUG > 0 - write_mesh(mesh, water_vapor, thresh, con_comp, - land_sea_mask, "ar_mesh_%t%.%e%"); -#endif - - // detect ar - atmospheric_river ar; - if (num_comp && - ar_detect(lat, lon, land_sea_mask, con_comp, num_comp, - this->river_start_lat_low, this->river_start_lon_low, - this->river_end_lat_low, this->river_end_lon_low, - this->river_end_lat_high, this->river_end_lon_high, - this->percent_in_mesh, this->river_width, - this->river_length, this->land_threshold_low, - this->land_threshold_high, ar)) - { -#if TECA_DEBUG > 0 - cerr << teca_parallel_id() << " event detected " << time_step << endl; -#endif - event << time << time_step - << ar.length << ar.min_width << ar.max_width - << ar.end_top_lat << ar.end_top_lon - << ar.end_bot_lat << ar.end_bot_lon - << std::string(ar.pe ? 
"PE" : "AR"); - } - ) - - return event; -} - -// -------------------------------------------------------------------------- -void teca_ar_detect::to_stream(std::ostream &os) const -{ - os << " water_vapor_variable=" << this->water_vapor_variable - << " land_sea_mask_variable=" << this->land_sea_mask_variable - << " low_water_vapor_threshold=" << this->low_water_vapor_threshold - << " high_water_vapor_threshold=" << this->high_water_vapor_threshold - << " river_start_lon_low=" << this->river_start_lon_low - << " river_start_lat_low=" << this->river_start_lat_low - << " river_end_lon_low=" << this->river_end_lon_low - << " river_end_lat_low=" << this->river_end_lat_low - << " river_end_lon_high=" << this->river_end_lon_high - << " river_end_lat_high=" << this->river_end_lat_high - << " percent_in_mesh=" << this->percent_in_mesh - << " river_width=" << this->river_width - << " river_length=" << this->river_length - << " land_threshodl_low=" << this->land_threshold_low - << " land_threshodl_high=" << this->land_threshold_high; -} - - -// Code borrowed from John Wu's sauf.cpp -// Find the minimal value starting @arg ind. -inline unsigned afind(const std::vector& equiv, - const unsigned ind) -{ - unsigned ret = ind; - while (equiv[ret] < ret) - { - ret = equiv[ret]; - } - return ret; -} - -// Set the values starting with @arg ind. -inline void aset(std::vector& equiv, - const unsigned ind, const unsigned val) -{ - unsigned i = ind; - while (equiv[i] < i) - { - unsigned j = equiv[i]; - equiv[i] = val; - i = j; - } - equiv[i] = val; -} - -/* -* Purpose: Scan with Array-based Union-Find -* Return vals: Number of connected components -* Description: SAUF -- Scan with Array-based Union-Find. -* This is an implementation that follows the decision try to minimize -* number of neighbors visited and uses the array-based union-find -* algorithms to minimize work on the union-find data structure. It works -* with each pixel/cell of the 2D binary image individually. -* The 2D binary image is passed to sauf as a unsigned*. On input, the -* zero value is treated as the background, and non-zero is treated as -* object. On successful completion of this function, the non-zero values -* in array image is replaced by its label. -* The return value is the number of components found. 
-*/ -unsigned sauf(const unsigned nrow, const unsigned ncol, unsigned *image) -{ - const unsigned ncells = ncol * nrow; - const unsigned ncp1 = ncol + 1; - const unsigned ncm1 = ncol - 1; - std::vector equiv; // equivalence array - unsigned nextLabel = 1; - - equiv.reserve(ncol); - equiv.push_back(0); - - // the first cell of the first line - if (*image != 0) - { - *image = nextLabel; - equiv.push_back(nextLabel); - ++ nextLabel; - } - // first row of cells - for (unsigned i = 1; i < ncol; ++ i) - { - if (image[i] != 0) - { - if (image[i-1] != 0) - { - image[i] = image[i-1]; - } - else - { - equiv.push_back(nextLabel); - image[i] = nextLabel; - ++ nextLabel; - } - } - } - - // scan the rest of lines, check neighbor b first - for (unsigned j = ncol; j < ncells; j += ncol) - { - unsigned nc, nd, k, l; - - // the first point of the line has two neighbors, and the two - // neighbors must have at most one label (recorded as nc) - if (image[j] != 0) - { - if (image[j-ncm1] != 0) - nc = image[j-ncm1]; - else if (image[j-ncol] != 0) - nc = image[j-ncol]; - else - nc = nextLabel; - if (nc != nextLabel) { // use existing label - nc = equiv[nc]; - image[j] = nc; - } - else { // need a new label - equiv.push_back(nc); - image[j] = nc; - ++ nextLabel; - } - } - - // the rest of the line - for (unsigned i = j+1; i < j+ncol; ++ i) - { - if (image[i] != 0) { - if (image[i-ncol] != 0) { - nc = image[i-ncol]; - l = afind(equiv, nc); - aset(equiv, nc, l); - image[i] = l; - } - else if (i-ncm1 " - << equiv[equiv[i]] << std::endl; -#endif - equiv[i] = equiv[equiv[i]]; - } - else { // change to the next smallest unused label -#if defined(_DEBUG) || defined(DEBUG) - std::cout << i << " final " << equiv[i] << " ==> " - << nextLabel << std::endl; -#endif - equiv[i] = nextLabel; - ++ nextLabel; - } - } - - if (nextLabel < nequiv) {// relabel all cells to their minimal labels - for (unsigned i = 0; i < ncells; ++ i) - image[i] = equiv[image[i]]; - } - -#if defined(_DEBUG) || defined(DEBUG) - std::cout << "sauf(" << nrow << ", " << ncol << ") assigned " - << nextLabel-1 << " label" << (nextLabel>2?"s":"") - << ", used " << nequiv << " provisional labels" - << std::endl; -#endif - return nextLabel-1; -} - -// do any of the detected points meet the river start -// criteria. retrun true if so. -template -bool river_start_criteria_lat( - const std::vector &con_comp_r, - const T *p_lat, - T river_start_lat) -{ - unsigned long n = con_comp_r.size(); - for (unsigned long q = 0; q < n; ++q) - { - if (p_lat[con_comp_r[q]] >= river_start_lat) - return true; - } - return false; -} - -// do any of the detected points meet the river start -// criteria. retrun true if so. -template -bool river_start_criteria_lon( - const std::vector &con_comp_c, - const T *p_lon, - T river_start_lon) -{ - unsigned long n = con_comp_c.size(); - for (unsigned long q = 0; q < n; ++q) - { - if (p_lon[con_comp_c[q]] >= river_start_lon) - return true; - } - return false; -} - -// helper return true if the start criteria is -// met, and classifies the ar as PE if it starts -// in the bottom boundary. -template -bool river_start_criteria( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon, - T start_lat, - T start_lon, - atmospheric_river &ar) -{ - return - ((ar.pe = river_start_criteria_lat(con_comp_r, p_lat, start_lat)) - || river_start_criteria_lon(con_comp_c, p_lon, start_lon)); -} - -// do any of the detected points meet the river end -// criteria? (ie. does it hit the west coasts?) 
if so -// store a bounding box covering the river and return -// true. -template -bool river_end_criteria( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon, - T river_end_lat_low, - T river_end_lon_low, - T river_end_lat_high, - T river_end_lon_high, - atmospheric_river &ar) -{ - bool end_criteria = false; - - std::vector end_col_idx; - - unsigned int count = con_comp_r.size(); - for (unsigned int i = 0; i < count; ++i) - { - // approximate land mask boundaries for the western coast of the US, - T lon_val = p_lon[con_comp_c[i]]; - if ((lon_val >= river_end_lon_low) && (lon_val <= river_end_lon_high)) - end_col_idx.push_back(i); - } - - // look for rows that fall between lat boundaries - T top_lat = T(); - T top_lon = T(); - T bot_lat = T(); - T bot_lon = T(); - - bool top_touch = false; - unsigned int end_col_count = end_col_idx.size(); - for (unsigned int i = 0; i < end_col_count; ++i) - { - // approximate land mask boundaries for the western coast of the US, - T lat_val = p_lat[con_comp_r[end_col_idx[i]]]; - if ((lat_val >= river_end_lat_low) && (lat_val <= river_end_lat_high)) - { - T lon_val = p_lon[con_comp_c[end_col_idx[i]]]; - end_criteria = true; - if (!top_touch) - { - top_touch = true; - top_lat = lat_val; - top_lon = lon_val; - } - bot_lat = lat_val; - bot_lon = lon_val; - } - } - - ar.end_top_lat = top_lat; - ar.end_top_lon = top_lon; - ar.end_bot_lat = bot_lat; - ar.end_bot_lon = bot_lon; - - return end_criteria; -} - -/* -* Calculate geodesic distance between two lat, long pairs -* CODE borrowed from: from http://www.geodatasource.com/developers/c -* from http://osiris.tuwien.ac.at/~wgarn/gis-gps/latlong.html -* from http://www.codeproject.com/KB/cpp/Distancecplusplus.aspx -*/ -template -T geodesic_distance(T lat1, T lon1, T lat2, T lon2) -{ - T deg_to_rad = T(M_PI/180.0); - - T dlat1 = lat1*deg_to_rad; - T dlon1 = lon1*deg_to_rad; - T dlat2 = lat2*deg_to_rad; - T dlon2 = lon2*deg_to_rad; - - T dLon = dlon1 - dlon2; - T dLat = dlat1 - dlat2; - - T sin_dLat_half_sq = sin(dLat/T(2.0)); - sin_dLat_half_sq *= sin_dLat_half_sq; - - T sin_dLon_half_sq = sin(dLon/T(2.0)); - sin_dLon_half_sq *= sin_dLon_half_sq; - - T aHarv = sin_dLat_half_sq - + cos(dlat1)*cos(dlat2)*sin_dLon_half_sq; - - T cHarv = T(2.0)*atan2(sqrt(aHarv), sqrt(T(1.0) - aHarv)); - - T R = T(6371.0); - T distance = R*cHarv; - - return distance; -} - -/* -* This function calculates the average geodesic width -* As each pixel represents certain area, the total area -* is the product of the number of pixels and the area of -* one pixel. The average width is: the total area divided -* by the medial axis length -* We are calculating the average width, since we are not -* determining where exactly to cut off the tropical region -* to calculate the real width of an atmospheric river -*/ -template -T avg_width( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - T ar_len, - const T *p_lat, - const T *p_lon) -{ -/* - // TODO -- need bounds checking when doing things like - // p_lat[con_comp_r[0] + 1]. 
also because it's potentially - // a stretched cartesian mesh need to compute area of - // individual cells - - // length of cell in lat direction - T lat_val[2] = {p_lat[con_comp_r[0]], p_lat[con_comp_r[0] + 1]}; - T lon_val[2] = {p_lon[con_comp_c[0]], p_lon[con_comp_c[0]]}; - T dlat = geodesic_distance(lat_val[0], lon_val[0], lat_val[1], lon_val[1]); - - // length of cell in lon direction - lat_val[1] = lat_val[0]; - lon_val[1] = p_lon[con_comp_c[0] + 1]; - T dlon = geodesic_distance(lat_val[0], lon_val[0], lat_val[1], lon_val[1]); -*/ - (void)con_comp_c; - // compute area of the first cell in the input mesh - // length of cell in lat direction - T lat_val[2] = {p_lat[0], p_lat[1]}; - T lon_val[2] = {p_lon[0], p_lon[0]}; - T dlat = geodesic_distance(lat_val[0], lon_val[0], lat_val[1], lon_val[1]); - - // length of cell in lon direction - lat_val[1] = lat_val[0]; - lon_val[1] = p_lon[1]; - T dlon = geodesic_distance(lat_val[0], lon_val[0], lat_val[1], lon_val[1]); - - // area - T pixel_area = dlat*dlon; - T total_area = pixel_area*con_comp_r.size(); - - // avg width - T avg_width = total_area/ar_len; - return avg_width; -} - -/* -* Find the middle point between two pairs of lat and lon values -* http://stackoverflow.com/questions/4164830/geographic-midpoint-between-two-coordinates -*/ -template -void geodesic_midpoint(T lat1, T lon1, T lat2, T lon2, T &mid_lat, T &mid_lon) -{ - T deg_to_rad = T(M_PI/180.0); - T dLon = (lon2 - lon1) * deg_to_rad; - T dLat1 = lat1 * deg_to_rad; - T dLat2 = lat2 * deg_to_rad; - T dLon1 = lon1 * deg_to_rad; - - T Bx = cos(dLat2) * cos(dLon); - T By = cos(dLat2) * sin(dLon); - - mid_lat = atan2(sin(dLat1)+sin(dLat2), - sqrt((cos(dLat1)+Bx)*(cos(dLat1)+Bx)+By*By)); - - mid_lon = dLon1 + atan2(By, (cos(dLat1)+Bx)); - - T rad_to_deg = T(180.0/M_PI); - mid_lat *= rad_to_deg; - mid_lon *= rad_to_deg; -} - -/* -* Find the length along the medial axis of a connected component -* Medial length is the sum of the distances between the medial -* points in the connected component -*/ -template -T medial_length( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon) -{ - std::vector jb_r1; - std::vector jb_c1; - std::vector jb_c2; - - long row_track = -1; - - unsigned long count = con_comp_r.size(); - for (unsigned long i = 0; i < count; ++i) - { - if (row_track != con_comp_r[i]) - { - jb_r1.push_back(con_comp_r[i]); - jb_c1.push_back(con_comp_c[i]); - - jb_c2.push_back(con_comp_c[i]); - - row_track = con_comp_r[i]; - } - else - { - jb_c2.back() = con_comp_c[i]; - } - } - - T total_dist = T(); - - long b_count = jb_r1.size() - 1; - for (long i = 0; i < b_count; ++i) - { - T lat_val[2]; - T lon_val[2]; - - lat_val[0] = p_lat[jb_r1[i]]; - lat_val[1] = p_lat[jb_r1[i]]; - - lon_val[0] = p_lon[jb_c1[i]]; - lon_val[1] = p_lon[jb_c2[i]]; - - T mid_lat1; - T mid_lon1; - - geodesic_midpoint( - lat_val[0], lon_val[0], lat_val[1], lon_val[1], - mid_lat1, mid_lon1); - - lat_val[0] = p_lat[jb_r1[i+1]]; - lat_val[1] = p_lat[jb_r1[i+1]]; - - lon_val[0] = p_lon[jb_c1[i+1]]; - lon_val[1] = p_lon[jb_c2[i+1]]; - - T mid_lat2; - T mid_lon2; - - geodesic_midpoint( - lat_val[0], lon_val[0], lat_val[1], lon_val[1], - mid_lat2, mid_lon2); - - total_dist - += geodesic_distance(mid_lat1, mid_lon1, mid_lat2, mid_lon2); - } - - return total_dist; -} - -/* -// Suren's function -// helper return true if the geometric conditions -// on an ar are satisfied. also stores the length -// and width of the river. 
-template -bool river_geometric_criteria( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon, - double river_length, - double river_width, - atmospheric_river &ar) -{ - ar.length = medial_length(con_comp_r, con_comp_c, p_lat, p_lon); - - ar.width = avg_width(con_comp_r, con_comp_c, - static_cast(ar.length), p_lat, p_lon); - - return (ar.length >= river_length) && (ar.width <= river_width); -} -*/ - -// Junmin's function for height of a triangle -template -T triangle_height(T base, T s1, T s2) -{ - // area from Heron's fomula - T p = (base + s1 + s2)/T(2); - T area = p*(p - base)*(p - s1)*(p - s2); - // detect impossible triangle - if (area < T()) - return std::min(s1, s2); - // height from A = 1/2 b h - return T(2)*sqrt(area)/base; -} - -// TDataProcessor::check_geodesic_width_top_down -// Junmin's function for detecting river based on -// it's geometric properties -template -bool river_geometric_criteria( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon, - double river_length, - double river_width, - atmospheric_river &ar) -{ - std::vector distinct_rows; - std::vector leftmost_col; - std::vector rightmost_col; - - int row_track = -1; - size_t count = con_comp_r.size(); - for (size_t i = 0; i < count; ++i) - { - if (row_track != con_comp_r[i]) - { - row_track = con_comp_r[i]; - - distinct_rows.push_back(con_comp_r[i]); - leftmost_col.push_back(con_comp_c[i]); - rightmost_col.push_back(con_comp_c[i]); - } - else - { - rightmost_col.back() = con_comp_c[i]; - } - } - - // river metrics - T length_from_top = T(); - T min_width = std::numeric_limits::max(); - T max_width = std::numeric_limits::lowest(); - - for (long i = distinct_rows.size() - 2; i >= 0; --i) - { - // for each row w respect to row above it. triangulate - // a quadrilateral composed of left and right most points - // in this and the above rows. ccw ordering from lower - // left corner is A,B,D,C. - - // low left-right distance - T AB = geodesic_distance( - p_lat[distinct_rows[i]], p_lon[leftmost_col[i]], - p_lat[distinct_rows[i]], p_lon[rightmost_col[i]]); - - // left side bottom-top distance - T AC = geodesic_distance( - p_lat[distinct_rows[i]], p_lon[leftmost_col[i]], - p_lat[distinct_rows[i+1]], p_lon[leftmost_col[i]]); - - // distance from top left to bottom right, across - T BC = geodesic_distance( - p_lat[distinct_rows[i]], p_lon[rightmost_col[i]], - p_lat[distinct_rows[i+1]], p_lon[leftmost_col[i+1]]); - - // high left-right distance - T CD = geodesic_distance( - p_lat[distinct_rows[i+1]], p_lon[leftmost_col[i+1]], - p_lat[distinct_rows[i+1]], p_lon[rightmost_col[i+1]]); - - // right side bottom-top distance - T BD = geodesic_distance( - p_lat[distinct_rows[i]], p_lon[rightmost_col[i]], - p_lat[distinct_rows[i+1]], p_lon[rightmost_col[i+1]]); - - T height_from_b = triangle_height(AC, AB, BC); - T height_from_c = triangle_height(BD, BC, CD); - - T curr_min = std::min(height_from_b, height_from_c); - - // test width criteria - if (curr_min > river_width) - { - // TODO -- first time through the loop length == 0. is it intentional - // to discard the detection or should length calc take place before this test? 
- // note: first time through loop none of the event details have been recoreded - if (length_from_top <= river_length) - { - // too short to be a river - return false; - } - else - { - // part of a connected region is AR - ar.min_width = static_cast(min_width); - ar.max_width = static_cast(max_width); - ar.length = static_cast(length_from_top); - return true; - } - } - - // update width - min_width = std::min(min_width, curr_min); - max_width = std::max(max_width, curr_min); - - // update length - T mid_bot_lat; - T mid_bot_lon; - geodesic_midpoint( - p_lat[distinct_rows[i]], p_lon[leftmost_col[i]], - p_lat[distinct_rows[i]], p_lon[rightmost_col[i]], - mid_bot_lat, mid_bot_lon); - - T mid_top_lat; - T mid_top_lon; - geodesic_midpoint( - p_lat[distinct_rows[i+1]], p_lon[leftmost_col[i+1]], - p_lat[distinct_rows[i+1]], p_lon[rightmost_col[i+1]], - mid_top_lat, mid_top_lon); - - length_from_top += geodesic_distance( - mid_bot_lat, mid_bot_lon, mid_top_lat, mid_top_lon); - } - - // check the length criteria. - // TODO: if we are here the widtrh critera was not met - // so the following detection is based solely on the length? - if (length_from_top > river_length) - { - // AR - ar.min_width = static_cast(min_width); - ar.max_width = static_cast(max_width); - ar.length = static_cast(length_from_top); - return true; - } - - return false; -} - - - -// Junmin's function checkRightBoundary -// note: if land sea mask is not available land array -// must all be true. -template -bool river_end_criteria( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const std::vector &land, - const T *p_lat, - const T *p_lon, - T river_end_lat_low, - T river_end_lon_low, - T river_end_lat_high, - T river_end_lon_high, - atmospheric_river &ar) -{ - // locate component points within shoreline - // box - bool first_crossing = false; - bool event_detected = false; - - T top_lat = T(); - T top_lon = T(); - T bot_lat = T(); - T bot_lon = T(); - - std::vector right_bound_col_idx; - size_t count = con_comp_c.size(); - for (size_t i = 0; i < count; ++i) - { - T lat = p_lat[con_comp_r[i]]; - T lon = p_lon[con_comp_c[i]]; - - if ((lat >= river_end_lat_low) && (lat <= river_end_lat_high) - && (lon >= river_end_lon_low) && (lon <= river_end_lon_high)) - { - if (!event_detected) - event_detected = land[i]; - - if (!first_crossing) - { - first_crossing = true; - top_lat = lat; - top_lon = lon; - } - bot_lat = lat; - bot_lon = lon; - } - } - - ar.end_top_lat = top_lat; - ar.end_top_lon = top_lon; - ar.end_bot_lat = bot_lat; - ar.end_bot_lon = bot_lon; - - return event_detected; -} - -// Junmin's function -template -void classify_event( - const std::vector &con_comp_r, - const std::vector &con_comp_c, - const T *p_lat, - const T *p_lon, - T start_lat, - T start_lon, - atmospheric_river &ar) -{ - // classification determined by first detected point in event - // is closer to left or to bottom - T lat = p_lat[con_comp_r[0]]; - T lon = p_lon[con_comp_c[0]]; - - ar.pe = false; - if ((lat - start_lat) < (lon - start_lon)) - ar.pe = true; // PE -} - -/* -* The main function that checks whether an AR event exists in -* given sub-plane of data. This currently applies only to the Western -* coast of the USA. return true if an ar is found. 
-*/ -bool ar_detect( - const_p_teca_variant_array lat, - const_p_teca_variant_array lon, - const_p_teca_variant_array land_sea_mask, - p_teca_unsigned_int_array con_comp, - unsigned long n_comp, - double river_start_lat, - double river_start_lon, - double river_end_lat_low, - double river_end_lon_low, - double river_end_lat_high, - double river_end_lon_high, - double percent_in_mesh, - double river_width, - double river_length, - double land_threshold_low, - double land_threshold_high, - atmospheric_river &ar) -{ - NESTED_TEMPLATE_DISPATCH_FP( - const teca_variant_array_impl, - lat.get(), - 1, - - NESTED_TEMPLATE_DISPATCH( - const teca_variant_array_impl, - land_sea_mask.get(), - 2, - - const NT1 *p_lat = dynamic_cast(lat.get())->get(); - const NT1 *p_lon = dynamic_cast(lon.get())->get(); - - const NT2 *p_land_sea_mask - = dynamic_cast(land_sea_mask.get())->get(); - - NT1 start_lat = static_cast(river_start_lat); - NT1 start_lon = static_cast(river_start_lon); - NT1 end_lat_low = static_cast(river_end_lat_low); - NT1 end_lon_low = static_cast(river_end_lon_low); - NT1 end_lat_high = static_cast(river_end_lat_high); - NT1 end_lon_high = static_cast(river_end_lon_high); - - unsigned long num_rows = lat->size(); - unsigned long num_cols = lon->size(); - - // # in PE is % of points in regious mesh - unsigned long num_rc = num_rows*num_cols; - unsigned long thr_count = num_rc*percent_in_mesh/100.0; - - unsigned int *p_labels = con_comp->get(); - for (unsigned int i = 1; i <= n_comp; ++i) - { - // for all discrete connected component labels - // verify if there exists an AR - std::vector con_comp_r; - std::vector con_comp_c; - std::vector land; - - for (unsigned long r = 0, q = 0; r < num_rows; ++r) - { - for (unsigned long c = 0; c < num_cols; ++c, ++q) - { - if (p_labels[q] == i) - { - // gather points of this connected component - con_comp_r.push_back(r); - con_comp_c.push_back(c); - - // identify them as land or not - land.push_back( - (p_land_sea_mask[q] >= land_threshold_low) - && (p_land_sea_mask[q] < land_threshold_high)); - } - } - } - - // check for ar criteria - unsigned long count = con_comp_r.size(); - if ((count > thr_count) - && river_end_criteria( - con_comp_r, con_comp_c, land, - p_lat, p_lon, - end_lat_low, end_lon_low, - end_lat_high, end_lon_high, - ar) - && river_geometric_criteria( - con_comp_r, con_comp_c, p_lat, p_lon, - river_length, river_width, ar)) - { - // determine if PE or AR - classify_event( - con_comp_r, con_comp_c, p_lat, p_lon, - start_lat, start_lon, ar); - return true; - } - } - ) - ) - return false; -} - -#if TECA_DEBUG > 0 -// helper to dump a dataset for debugging -int write_mesh( - const const_p_teca_cartesian_mesh &mesh, - const const_p_teca_variant_array &vapor, - const const_p_teca_variant_array &thresh, - const const_p_teca_variant_array &ccomp, - const const_p_teca_variant_array &lsmask, - const std::string &file_name) -{ - p_teca_cartesian_mesh m = teca_cartesian_mesh::New(); - m->copy_metadata(mesh); - - p_teca_array_collection pac = m->get_point_arrays(); - pac->append("vapor", std::const_pointer_cast(vapor)); - pac->append("thresh", std::const_pointer_cast(thresh)); - pac->append("ccomp", std::const_pointer_cast(ccomp)); - pac->append("lsmask", std::const_pointer_cast(lsmask)); - - p_teca_programmable_algorithm s = teca_programmable_algorithm::New(); - s->set_name("serve_mesh"); - s->set_number_of_input_connections(0); - s->set_number_of_output_ports(1); - s->set_execute_callback( - [m] (unsigned int, const std::vector &, - const teca_metadata 
&) -> const_p_teca_dataset { return m; } - ); - - p_teca_cartesian_mesh_writer w - = teca_cartesian_mesh_writer::New(); - - w->set_file_name(file_name); - w->set_input_connection(s->get_output_port()); - w->update(); - - return 0; -} -#endif diff --git a/alg/teca_ar_detect.h b/alg/teca_ar_detect.h deleted file mode 100644 index 11ef0f199..000000000 --- a/alg/teca_ar_detect.h +++ /dev/null @@ -1,136 +0,0 @@ -#ifndef teca_ar_detect_h -#define teca_ar_detect_h - -#include "teca_shared_object.h" -#include "teca_algorithm.h" -#include "teca_metadata.h" - -#include -#include - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_ar_detect) - -/** -Suren and Junmin's atmospheric river detector. - -The algorithm searches for atmospheric rivers that -end on the California coast in water vapor data over -a specific subset of the input data. A river is detected -based on it's length, width, and percent area of the -search space. The algorithm can optionally use a -land-sea mask to increase accuracy of the California -coast. Without the land-sea mask a box is used. -*/ -class teca_ar_detect : public teca_algorithm -{ -public: - TECA_ALGORITHM_STATIC_NEW(teca_ar_detect) - TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_ar_detect) - TECA_ALGORITHM_CLASS_NAME(teca_ar_detect) - ~teca_ar_detect(); - - // report/initialize to/from Boost program options - // objects. - TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() - TECA_SET_ALGORITHM_PROPERTIES() - - // set/get the name of the integrated water vapor variable - TECA_ALGORITHM_PROPERTY(std::string, water_vapor_variable) - - // set/get threshold on water vapor variable used - // to segment the data - TECA_ALGORITHM_PROPERTY(double, low_water_vapor_threshold) - TECA_ALGORITHM_PROPERTY(double, high_water_vapor_threshold) - - // set/get the region of interest in lat lon coordinate system - // defaults are 19 56 180 250 - TECA_ALGORITHM_PROPERTY(double, search_lat_low) - TECA_ALGORITHM_PROPERTY(double, search_lon_low) - TECA_ALGORITHM_PROPERTY(double, search_lat_high) - TECA_ALGORITHM_PROPERTY(double, search_lon_high) - - // set/get the river source region in lat lon coordinate system - // defaults are 18 180 - TECA_ALGORITHM_PROPERTY(double, river_start_lat_low) - TECA_ALGORITHM_PROPERTY(double, river_start_lon_low) - - // set/get the river ladfall region in lat lon coordinate system - // defaults are 29 233 56 238 - TECA_ALGORITHM_PROPERTY(double, river_end_lat_low) - TECA_ALGORITHM_PROPERTY(double, river_end_lon_low) - TECA_ALGORITHM_PROPERTY(double, river_end_lat_high) - TECA_ALGORITHM_PROPERTY(double, river_end_lon_high) - - // set/get the area as a percent of the search space that - // a potential river must occupy - TECA_ALGORITHM_PROPERTY(double, percent_in_mesh) - - // set/get the minimum river width and length. defaults - // are 1250 2000 - TECA_ALGORITHM_PROPERTY(double, river_width) - TECA_ALGORITHM_PROPERTY(double, river_length) - - // set/get the land-sea mask variable. this array - // will be used to identify land from ocean using - // land_threshold properties. - TECA_ALGORITHM_PROPERTY(std::string, land_sea_mask_variable) - - // set/get the land classification range [low high). 
defaults - // are [1.0 DOUBLE_MAX) - TECA_ALGORITHM_PROPERTY(double, land_threshold_low) - TECA_ALGORITHM_PROPERTY(double, land_threshold_high) - - // send humand readable representation to the - // stream - virtual void to_stream(std::ostream &os) const override; - -protected: - teca_ar_detect(); - - // helper that computes the output extent - int get_active_extent( - p_teca_variant_array lat, - p_teca_variant_array lon, - std::vector &extent) const; - -private: - virtual - teca_metadata get_output_metadata( - unsigned int port, - const std::vector &input_md) override; - - virtual - std::vector get_upstream_request( - unsigned int port, - const std::vector &input_md, - const teca_metadata &request) override; - - virtual - const_p_teca_dataset execute( - unsigned int port, - const std::vector &input_data, - const teca_metadata &request) override; - -private: - std::string water_vapor_variable; - std::string land_sea_mask_variable; - double low_water_vapor_threshold; - double high_water_vapor_threshold; - double search_lat_low; - double search_lon_low; - double search_lat_high; - double search_lon_high; - double river_start_lat_low; - double river_start_lon_low; - double river_end_lat_low; - double river_end_lon_low; - double river_end_lat_high; - double river_end_lon_high; - double percent_in_mesh; - double river_width; - double river_length; - double land_threshold_low; - double land_threshold_high; -}; - -#endif diff --git a/alg/teca_bayesian_ar_detect.cxx b/alg/teca_bayesian_ar_detect.cxx index 8a7705a09..c14dd6f1f 100644 --- a/alg/teca_bayesian_ar_detect.cxx +++ b/alg/teca_bayesian_ar_detect.cxx @@ -608,8 +608,10 @@ void teca_bayesian_ar_detect::internals_t::clear() teca_bayesian_ar_detect::teca_bayesian_ar_detect() : min_component_area_variable("min_component_area"), min_ivt_variable("min_water_vapor"), - hwhm_latitude_variable("hwhm_latitude"), thread_pool_size(1), - verbose(0), internals(new internals_t) + hwhm_latitude_variable("hwhm_latitude"), + ar_probability_variable("ar_probability"), + thread_pool_size(1), + internals(new internals_t) { this->set_number_of_input_connections(1); this->set_number_of_output_ports(1); @@ -631,23 +633,25 @@ void teca_bayesian_ar_detect::get_properties_description( opts.add_options() TECA_POPTS_GET(std::string, prefix, ivt_variable, - "name of the water vapor variable (\"\")") + "Set the name of the integrated vaopr transport(IVT) variable to" + " compute AR probability from.") TECA_POPTS_GET(std::string, prefix, min_component_area_variable, - "name of the column in the parameter table containing the " - "component area threshold (\"min_component_area\")") + "Set the name of the column in the parameter table containing the " + "minimum feature area threshold.") TECA_POPTS_GET(std::string, prefix, min_ivt_variable, - "name of the column in the parameter table containing the " - "water vapor threshold (\"min_water_vapor\")") + "Set the name of the column in the parameter table containing the " + "minimum percentile IVT threshold.") TECA_POPTS_GET(std::string, prefix, hwhm_latitude_variable, - "name of the column in the parameter table containing the " - "half width at half max latitude (\"hwhm_latitude\")") + "Set the name of the column in the parameter table containing the " + "half width at half max latitude mask value.") + TECA_POPTS_GET(std::string, prefix, ar_probability_variable, + "Set the name of the variable to store the computed AR probability in.") TECA_POPTS_GET(int, prefix, thread_pool_size, - "number of threads to parallelize execution 
over (1)") - TECA_POPTS_GET(int, prefix, verbose, - "flag indicating diagnostic info should be displayed in " - "the terminal (0)") + "Set the number of threads to parallelize execution over.") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -655,10 +659,13 @@ void teca_bayesian_ar_detect::get_properties_description( void teca_bayesian_ar_detect::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, ivt_variable) TECA_POPTS_SET(opts, std::string, prefix, min_component_area_variable) TECA_POPTS_SET(opts, std::string, prefix, min_ivt_variable) TECA_POPTS_SET(opts, std::string, prefix, hwhm_latitude_variable) + TECA_POPTS_SET(opts, std::string, prefix, ar_probability_variable) TECA_POPTS_SET(opts, int, prefix, thread_pool_size) TECA_POPTS_SET(opts, int, prefix, verbose) } @@ -693,7 +700,10 @@ void teca_bayesian_ar_detect::set_thread_pool_size(int n) // -------------------------------------------------------------------------- unsigned int teca_bayesian_ar_detect::get_thread_pool_size() const noexcept { - return this->internals->queue->size(); + unsigned int n_threads = 0; + if (this->internals->queue) + n_threads = this->internals->queue->size(); + return n_threads; } // -------------------------------------------------------------------------- @@ -805,7 +815,7 @@ teca_metadata teca_bayesian_ar_detect::get_output_metadata( // report the variable that we compute, for each timestep from the // parameter tables. teca_metadata md(input_md[0]); - md.append("variables", std::string("ar_probability")); + md.append("variables", std::string(this->ar_probability_variable)); // add attributes to enable CF I/O teca_metadata atts; @@ -816,7 +826,7 @@ teca_metadata teca_bayesian_ar_detect::get_output_metadata( 0, "unitless", "posterior AR flag", "the posterior probability of the presence of an atmospheric river"); - atts.set("ar_probability", (teca_metadata)prob_atts); + atts.set(this->ar_probability_variable, (teca_metadata)prob_atts); unsigned long num_params = this->internals->parameter_table->get_number_of_rows(); @@ -875,7 +885,7 @@ std::vector teca_bayesian_ar_detect::get_upstream_request( arrays.insert(this->ivt_variable); // remove what we produce - arrays.erase("ar_probability"); + arrays.erase(this->ar_probability_variable); arrays.erase("ar_count"); arrays.erase("parameter_table_row"); @@ -1039,7 +1049,7 @@ const_p_teca_dataset teca_bayesian_ar_detect::execute( // set up the reduction which computes the average over runs of all control // parameter combinations provided in the parameter table ::parameter_table_reduction reduce(parameter_table_size, - "wv_cc", "ar_probability"); + "wv_cc", this->ar_probability_variable); p_teca_programmable_reduce pr = teca_programmable_reduce::New(); pr->set_name("parameter_table_reduce"); diff --git a/alg/teca_bayesian_ar_detect.h b/alg/teca_bayesian_ar_detect.h index c2805cf99..aecbd9411 100644 --- a/alg/teca_bayesian_ar_detect.h +++ b/alg/teca_bayesian_ar_detect.h @@ -10,31 +10,35 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_bayesian_ar_detect) -/// CASCADE BARD atmospheric river detector +/// The TECA BARD atmospheric river detector. /** -Given a point wise IVT (integrated vapor transport) field and a training -parameter table computes the point wise probability of an atmospheric river -using the CASCADE BARD algorithm. - -Required inputs: - - 1. IVT (integrated vapor transport) array on a Cartesian nesh. 
- 2. a compatible parameter table. columns of which are : min IVT, - component area, HWHM lattitude - -The names of the input varibale and columns can be specified at run time -through algorithm properties. - -Produces: - - A Cartesian mesh with probability of an AR stored in the point centered - array named "ar_probability". The diagnostic quantites "ar_count" amd - "parameter_table_row" are stored in information arrays. - -For more information see: - -Detection of Atmospheric Rivers with Inline Uncertainty Quantification: TECA-BARD v1.0 -O'Brien, T. A et al. Geoscientific Model Development, 2020 + * Given a point wise IVT (integrated vapor transport) field and a training + * parameter table computes the point wise probability of an atmospheric river + * using the TECA BARD algorithm. + * + * Required inputs: + * + * 1. IVT (integrated vapor transport) array on a Cartesian nesh. + * 2. a compatible parameter table. columns of which are : min IVT, + * component area, HWHM lattitude + * + * The names of the input varibale and columns can be specified at run time + * through algorithm properties. + * + * Produces: + * + * A Cartesian mesh with probability of an AR stored in the point centered + * array named "ar_probability". The diagnostic quantites "ar_count" amd + * "parameter_table_row" are stored in information arrays. + * + * For more information see: + * + * O’Brien, T. A., Risser, M. D., Loring, B., Elbashandy, A. A., Krishnan, H., + * Johnson, J., Patricola, C. M., O’Brien, J. P., Mahesh, A., Arriaga Ramirez, + * S., Rhoades, A. M., Charn, A., Inda Díaz, H., & Collins, W. D. (2020). + * Detection of atmospheric rivers with inline uncertainty quantification: + * TECA-BARD v1.0.1. Geoscientific Model Development, 13(12), 6131–6148. + * https://doi.org/10.5194/gmd-13-6131-2020 */ class teca_bayesian_ar_detect : public teca_algorithm { @@ -49,28 +53,54 @@ class teca_bayesian_ar_detect : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the name of the input array + /** @name ivt_variable + * Sets the name of the array containing the IVT field to detect ARs in. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, ivt_variable) + ///@} - // set the names of columns in the parameter table. + /** @name min_ivt_variable + * Set the names of the minimum IVT column in the parameter table. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, min_ivt_variable) - TECA_ALGORITHM_PROPERTY(std::string, min_component_area_variable) - TECA_ALGORITHM_PROPERTY(std::string, hwhm_latitude_variable) + ///@} - // flag indicating verbose terminal output is desired. - // default is 0 - TECA_ALGORITHM_PROPERTY(int, verbose) + /** @name min_component_area_variable + * Set the names of the minimum area column in the parameter table. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, min_component_area_variable) + ///@} - // set/get the number of threads in the pool. setting - // to -1 results in a thread per core factoring in all MPI - // ranks running on the node. the default is -1. + /** @name hwhm_latitude_variable + * Set the names of the HWHM column in the parameter table. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, hwhm_latitude_variable) + ///@} + + /** @name probability variable + * Set the name of the variable to store output probability as. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, ar_probability_variable) + ///@} + + /** Set the number of threads in the pool. 
Setting to -1 results in a + * thread per core factoring in all MPI ranks running on the node. the + * default is -1. + */ void set_thread_pool_size(int n_threads); + + /// Get the number of threads in the pool. unsigned int get_thread_pool_size() const noexcept; - // override the input connections because we are going to - // take the first input and use it to generate metadata. - // the second input then becomes the only one the pipeline - // knows about. + /** override the input connections because we are going to take the first + * input and use it to generate metadata. the second input then becomes + * the only one the pipeline knows about. + */ void set_input_connection(unsigned int id, const teca_algorithm_output_port &port) override; @@ -98,8 +128,8 @@ class teca_bayesian_ar_detect : public teca_algorithm std::string min_component_area_variable; std::string min_ivt_variable; std::string hwhm_latitude_variable; + std::string ar_probability_variable; int thread_pool_size; - int verbose; struct internals_t; internals_t *internals; diff --git a/alg/teca_bayesian_ar_detect_parameters.cxx b/alg/teca_bayesian_ar_detect_parameters.cxx index ca58d5c85..23511a112 100644 --- a/alg/teca_bayesian_ar_detect_parameters.cxx +++ b/alg/teca_bayesian_ar_detect_parameters.cxx @@ -973,9 +973,11 @@ void teca_bayesian_ar_detect_parameters::get_properties_description( opts.add_options() TECA_POPTS_GET(long, prefix, number_of_rows, - "the number of parameter table rows to serve (-1)") + "the number of parameter table rows to serve") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -983,6 +985,8 @@ void teca_bayesian_ar_detect_parameters::get_properties_description( void teca_bayesian_ar_detect_parameters::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, long, prefix, number_of_rows) } #endif diff --git a/alg/teca_bayesian_ar_detect_parameters.h b/alg/teca_bayesian_ar_detect_parameters.h index 7f5b1dc56..518305301 100644 --- a/alg/teca_bayesian_ar_detect_parameters.h +++ b/alg/teca_bayesian_ar_detect_parameters.h @@ -5,10 +5,10 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_bayesian_ar_detect_parameters) -/** -An algorithm that constructs and serves up the parameter -table needed to run the Bayesain AR detector -*/ +/** @brief + * An algorithm that constructs and serves up the parameter + * table needed to run the Bayesian AR detector. + */ class teca_bayesian_ar_detect_parameters : public teca_algorithm { public: @@ -22,12 +22,16 @@ class teca_bayesian_ar_detect_parameters : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // control the number of rows coppied into the table. The rows are - // copppied in sequential order starting from row zero. The default value - // of -1 is used to serve all rows. See also get_parameter_table_size. + /** @name number_of_rows + * control the number of rows copied into the table. The rows are copied + * in sequential order starting from row zero. The default value of -1 is + * used to serve all rows. See also get_parameter_table_size. + */ + ///@{ TECA_ALGORITHM_PROPERTY(long, number_of_rows) + ///@} - // return the number of rows in the internal parameter table. + /// return the number of rows in the internal parameter table. 
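// --------------------------------------------------------------------------
// [editor's sketch, not from the TECA sources] a minimal configuration of the
// two stages documented above: the parameter table source feeding the BARD
// detector. the set_* calls are assumed to be the setters generated by the
// TECA_ALGORITHM_PROPERTY macros, and connecting the parameter table to
// input 0 of the detector is also an assumption; the upstream stage producing
// the IVT field is left to the caller.
#include "teca_bayesian_ar_detect.h"
#include "teca_bayesian_ar_detect_parameters.h"

p_teca_bayesian_ar_detect configure_bard(
    const teca_algorithm_output_port &ivt_source)
{
    // serve every row of the built in parameter table (-1 == all rows)
    p_teca_bayesian_ar_detect_parameters params =
        teca_bayesian_ar_detect_parameters::New();
    params->set_number_of_rows(-1);

    // the detector: IVT in, point wise AR probability out
    p_teca_bayesian_ar_detect detect = teca_bayesian_ar_detect::New();
    detect->set_ivt_variable("IVT");
    detect->set_ar_probability_variable("ar_probability");
    detect->set_thread_pool_size(-1); // one thread per core

    detect->set_input_connection(0, params->get_output_port());
    detect->set_input_connection(1, ivt_source);

    return detect;
}
// --------------------------------------------------------------------------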
unsigned long get_parameter_table_size(); protected: diff --git a/alg/teca_binary_segmentation.h b/alg/teca_binary_segmentation.h index 983a497fb..138a28b03 100644 --- a/alg/teca_binary_segmentation.h +++ b/alg/teca_binary_segmentation.h @@ -10,17 +10,17 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_binary_segmentation) -/// an algorithm that computes a binary segmentation +/// An algorithm that computes a binary segmentation. /** -an algorithm that computes a binary segmentation for 1D, 2D, and 3D data. The -segmentation is computed using threshold operation where values in a range -(low, high] are in the segmentation (assigned 1). Values outside the range -are outside of the segmentation (assigned 0). - -The algorithm has 2 modes, BY_VALUE and BY_PERCENTILE. In the BY_VALUE mode, -the test for inclusion is applied on the raw data. In the BY_PERCENTILE mode -the range is given in percentiles and each data point is converted to a -percentile before applying the test for inclusion. + * an algorithm that computes a binary segmentation for 1D, 2D, and 3D data. + * The segmentation is computed using threshold operation where values in a + * range (low, high] are in the segmentation (assigned 1). Values outside the + * range are outside of the segmentation (assigned 0). + * + * The algorithm has 2 modes, BY_VALUE and BY_PERCENTILE. In the BY_VALUE mode, + * the test for inclusion is applied on the raw data. In the BY_PERCENTILE mode + * the range is given in percentiles and each data point is converted to a + * percentile before applying the test for inclusion. */ class teca_binary_segmentation : public teca_algorithm { @@ -31,26 +31,59 @@ class teca_binary_segmentation : public teca_algorithm ~teca_binary_segmentation(); // set the name of the output array to store the resulting segmentation in + /** @name segmentation_variable + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, segmentation_variable) + ///@} + // set extra metadata for the segmentation variable + /** @name segmentation_variable_attributes + */ + ///@{ TECA_ALGORITHM_PROPERTY(teca_metadata, segmentation_variable_attributes) + ///@} + - // set the name of the input array to segment + /** @name threshold_variable + * set the name of the input array to segment + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, threshold_variable) + ///@} - // Set the threshold range. The defaults are (-infinity, infinity]. + /** @name low_threshold_value + * Set the threshold range. The defaults are (-infinity, infinity]. + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, low_threshold_value) - TECA_ALGORITHM_PROPERTY(double, high_threshold_value) + ///@} - // Set the threshold mode. In BY_PERCENTILE mode low and high thresholds - // define the percentiles (0 to 100) between which data is in the - // segmentation. default is BY_VALUE. + /** @name high_threshold_value + * Set the threshold range. The defaults are (-infinity, infinity]. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(double, high_threshold_value) + ///@} + + /** @name threshold_mode + * Set the threshold mode. In BY_PERCENTILE mode low and high thresholds + * define the percentiles (0 to 100) between which data is in the + * segmentation. default is BY_VALUE. + */ + ///@{ + /// The threshold_mode modes enum {BY_VALUE=0, BY_PERCENTILE=1}; - TECA_ALGORITHM_PROPERTY(int, threshold_mode); + TECA_ALGORITHM_PROPERTY(int, threshold_mode) + + /// Set the threshold_mode to percentile. void set_threshold_by_percentile() { set_threshold_mode(BY_PERCENTILE); } + + /// Set the threshold_mode to value. 
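// --------------------------------------------------------------------------
// [editor's sketch, not from the TECA sources] a minimal configuration of the
// segmentation in BY_PERCENTILE mode, keeping everything above the 95th
// percentile of an IVT field. set_threshold_by_percentile() is declared
// nearby; the remaining set_* names are assumed to follow from the property
// macros, and the variable names are illustrative only.
#include "teca_binary_segmentation.h"

p_teca_binary_segmentation configure_segmentation(
    const teca_algorithm_output_port &ivt_source)
{
    p_teca_binary_segmentation seg = teca_binary_segmentation::New();
    seg->set_input_connection(ivt_source);

    seg->set_threshold_variable("IVT");        // the array to segment
    seg->set_segmentation_variable("IVT_seg"); // the 0/1 mask to produce

    seg->set_threshold_by_percentile();        // thresholds are percentiles
    seg->set_low_threshold_value(95.0);        // in segmentation: (95, 100]
    seg->set_high_threshold_value(100.0);

    return seg;
}
// --------------------------------------------------------------------------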
void set_threshold_by_value() { set_threshold_mode(BY_VALUE); } + ///@} protected: teca_binary_segmentation(); diff --git a/alg/teca_cartesian_mesh_regrid.cxx b/alg/teca_cartesian_mesh_regrid.cxx index 632738efa..b8f90aa35 100644 --- a/alg/teca_cartesian_mesh_regrid.cxx +++ b/alg/teca_cartesian_mesh_regrid.cxx @@ -18,6 +18,28 @@ using std::endl; //#define TECA_DEBUG +// always use nearest neighbor interpolation for integers +// to avoid truncation errors. an alternative would be to +// implement rounding in the interpolator for integer types +template +int get_interpolation_mode(int desired_mode, + typename std::enable_if::value>::type* = 0) +{ + (void)desired_mode; + return teca_cartesian_mesh_regrid::nearest; +} + +// use the requested interpolation mode for floating point +// data +template +int get_interpolation_mode(int desired_mode, + typename std::enable_if::value>::type* = 0) +{ + return desired_mode; +} + + +// 3D template int interpolate(unsigned long target_nx, unsigned long target_ny, unsigned long target_nz, const NT1 *p_target_xc, const NT1 *p_target_yc, @@ -53,31 +75,100 @@ int interpolate(unsigned long target_nx, unsigned long target_ny, return 0; } +// 2D - x-y +template +int interpolate(unsigned long target_nx, unsigned long target_ny, + const NT1 *p_target_xc, const NT1 *p_target_yc, + NT3 *p_target_a, const NT2 *p_source_xc, + const NT2 *p_source_yc, const NT3 *p_source_a, + unsigned long source_ihi, unsigned long source_jhi, + unsigned long source_nx) +{ + interp_t f; + unsigned long q = 0; + for (unsigned long j = 0; j < target_ny; ++j) + { + NT2 ty = static_cast(p_target_yc[j]); + for (unsigned long i = 0; i < target_nx; ++i, ++q) + { + NT2 tx = static_cast(p_target_xc[i]); + if (f(tx,ty, + p_source_xc, p_source_yc, + p_source_a, source_ihi, source_jhi, + source_nx, p_target_a[q])) + { + TECA_ERROR("failed to interpolate i=(" << i << ", " << j + << ") x=(" << tx << ", " << ty << ", " << ")") + return -1; + } + } + } + return 0; +} + template int interpolate(int mode, unsigned long target_nx, unsigned long target_ny, - unsigned long target_nz, const taget_coord_t *p_target_xc, const taget_coord_t *p_target_yc, - const taget_coord_t *p_target_zc, array_t *p_target_a, const source_coord_t *p_source_xc, - const source_coord_t *p_source_yc, const source_coord_t *p_source_zc, const array_t *p_source_a, - unsigned long source_ihi, unsigned long source_jhi, unsigned long source_khi, - unsigned long source_nx, unsigned long source_nxy) + unsigned long target_nz, const taget_coord_t *p_target_xc, + const taget_coord_t *p_target_yc, const taget_coord_t *p_target_zc, + array_t *p_target_a, const source_coord_t *p_source_xc, + const source_coord_t *p_source_yc, const source_coord_t *p_source_zc, + const array_t *p_source_a, unsigned long source_ihi, unsigned long source_jhi, + unsigned long source_khi, unsigned long source_nx, unsigned long source_ny, + unsigned long source_nz) { using nearest_interp_t = teca_coordinate_util::interpolate_t<0>; using linear_interp_t = teca_coordinate_util::interpolate_t<1>; - switch (mode) + unsigned long source_nxy = source_nx*source_ny; + + switch (get_interpolation_mode(mode)) { case teca_cartesian_mesh_regrid::nearest: - return interpolate( - target_nx, target_ny, target_nz, p_target_xc, p_target_yc, p_target_zc, - p_target_a, p_source_xc, p_source_yc, p_source_zc, p_source_a, - source_ihi, source_jhi, source_khi, source_nx, source_nxy); + { + if ((target_nz == 1) && (source_nz == 1)) + { + // 2D in the x-y plane + return interpolate( + 
target_nx, target_ny, p_target_xc, p_target_yc, + p_target_a, p_source_xc, p_source_yc, p_source_a, + source_ihi, source_jhi, source_nx); + } + else + { + // 3D + return interpolate( + target_nx, target_ny, target_nz, p_target_xc, + p_target_yc, p_target_zc, p_target_a, p_source_xc, + p_source_yc, p_source_zc, p_source_a, source_ihi, + source_jhi, source_khi, source_nx, source_nxy); + } break; + } case teca_cartesian_mesh_regrid::linear: - return interpolate( - target_nx, target_ny, target_nz, p_target_xc, p_target_yc, p_target_zc, - p_target_a, p_source_xc, p_source_yc, p_source_zc, p_source_a, - source_ihi, source_jhi, source_khi, source_nx, source_nxy); + { + if ((target_nz == 1) && (source_nz == 1)) + { + // 2D in the x-y plane + return interpolate( + target_nx, target_ny, p_target_xc, p_target_yc, + p_target_a, p_source_xc, p_source_yc, p_source_a, + source_ihi, source_jhi, source_nx); + } + else + { + // 3D + return interpolate( + target_nx, target_ny, target_nz, p_target_xc, + p_target_yc, p_target_zc, p_target_a, p_source_xc, + p_source_yc, p_source_zc, p_source_a, source_ihi, + source_jhi, source_khi, source_nx, source_nxy); + } break; + } } TECA_ERROR("invalid interpolation mode \"" << mode << "\"") @@ -86,6 +177,7 @@ int interpolate(int mode, unsigned long target_nx, unsigned long target_ny, + // -------------------------------------------------------------------------- teca_cartesian_mesh_regrid::teca_cartesian_mesh_regrid() : target_input(0), interpolation_mode(nearest) @@ -109,13 +201,15 @@ void teca_cartesian_mesh_regrid::get_properties_description( opts.add_options() TECA_POPTS_GET(int, prefix, target_input, - "select input connection that contains metadata (0)") - TECA_POPTS_GET(std::vector, prefix, arrays, - "list of arrays to move from source to target mesh ("")") + "select input connection that contains metadata") + TECA_POPTS_MULTI_GET(std::vector, prefix, arrays, + "list of arrays to move from source to target mesh") TECA_POPTS_GET(int, prefix, interpolation_mode, - "linear or nearest interpolation (1)") + "linear or nearest interpolation") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -123,6 +217,8 @@ void teca_cartesian_mesh_regrid::get_properties_description( void teca_cartesian_mesh_regrid::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, int, prefix, target_input) TECA_POPTS_SET(opts, std::vector, prefix, arrays) TECA_POPTS_SET(opts, int, prefix, interpolation_mode) @@ -276,7 +372,9 @@ std::vector teca_cartesian_mesh_regrid::get_upstream_request( else { if (teca_coordinate_util::bounds_to_extent(request_bounds, - target_x, target_y, target_z, target_extent)) + target_x, target_y, target_z, target_extent) || + teca_coordinate_util::validate_extent(target_x->size(), + target_y->size(), target_z->size(), target_extent, true)) { TECA_ERROR("invalid bounds requested [" << request_bounds[0] << ", " << request_bounds[1] << ", " << request_bounds[2] << ", " @@ -294,6 +392,24 @@ std::vector teca_cartesian_mesh_regrid::get_upstream_request( target_z->get(target_extent[4], target_bounds[4]); target_z->get(target_extent[5], target_bounds[5]); + // if the source is 2D, the cf_reader may have faked the vertical dimension. 
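// --------------------------------------------------------------------------
// [editor's sketch, not from the TECA sources] the get_interpolation_mode()
// overloads above use SFINAE so that integer valued arrays are always moved
// with nearest neighbor interpolation (linear interpolation would silently
// truncate), while floating point arrays honor the requested mode. the same
// pattern in a tiny standalone form:
#include <cassert>
#include <type_traits>

enum {nearest = 0, linear = 1};

template <typename T>
int pick_mode(int requested,
    typename std::enable_if<std::is_integral<T>::value>::type* = nullptr)
{
    (void)requested;
    return nearest;   // integers: avoid truncation errors
}

template <typename T>
int pick_mode(int requested,
    typename std::enable_if<std::is_floating_point<T>::value>::type* = nullptr)
{
    return requested; // floating point: use what was asked for
}

int main()
{
    assert(pick_mode<int>(linear) == nearest);
    assert(pick_mode<double>(linear) == linear);
    return 0;
}
// --------------------------------------------------------------------------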
+ // in that case, use the source's vertical coordinate in the requested bounds + teca_metadata source_coords; + p_teca_variant_array source_z; + + if (input_md[md_src].get("coordinates", source_coords) + || !(source_z = source_coords.get("z"))) + { + TECA_ERROR("failed to locate source mesh coordinates") + return up_reqs; + } + + if (source_z->size() == 1) + { + source_z->get(0, target_bounds[4]); + source_z->get(0, target_bounds[5]); + } + // send the target bounds to the source as well source_req.set("bounds", target_bounds, 6); @@ -301,10 +417,19 @@ std::vector teca_cartesian_mesh_regrid::get_upstream_request( up_reqs[md_tgt] = target_req; up_reqs[md_src] = source_req; +#ifdef TECA_DEBUG + std::cerr << "source request = "; + source_req.to_stream(std::cerr); + std::cerr << std::endl; + + std::cerr << "target request = "; + target_req.to_stream(std::cerr); + std::cerr << std::endl; +#endif + return up_reqs; } - // -------------------------------------------------------------------------- const_p_teca_dataset teca_cartesian_mesh_regrid::execute( unsigned int port, const std::vector &input_data, @@ -347,7 +472,7 @@ const_p_teca_dataset teca_cartesian_mesh_regrid::execute( // get the list of arrays to move std::vector req_arrays; - request.get("regrid_arrays", req_arrays); + request.get("arrays", req_arrays); // add any explicitly named std::copy(this->arrays.begin(), this->arrays.end(), @@ -362,7 +487,25 @@ const_p_teca_dataset teca_cartesian_mesh_regrid::execute( for (; it != end; ++it) { if (!target->get_point_arrays()->has(*it)) - source_arrays.push_back(*it); + { + if (source->get_point_arrays()->has(*it)) + { + source_arrays.push_back(*it); + } + else + { + TECA_ERROR("Array \"" << *it + << "\" is neither present in source or target mesh") + return nullptr; + } + } + } + + // catch a user error + if (!source_arrays.size() && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_WARNING("No arrays will be interpolated") } // move the arrays @@ -384,7 +527,6 @@ const_p_teca_dataset teca_cartesian_mesh_regrid::execute( unsigned long source_nx = source_xc->size(); unsigned long source_ny = source_yc->size(); unsigned long source_nz = source_zc->size(); - unsigned long source_nxy = source_nx*source_ny; unsigned long source_ihi = source_nx - 1; unsigned long source_jhi = source_ny - 1; unsigned long source_khi = source_nz - 1; @@ -392,20 +534,20 @@ const_p_teca_dataset teca_cartesian_mesh_regrid::execute( NESTED_TEMPLATE_DISPATCH_FP( const teca_variant_array_impl, target_xc.get(), - 1, + _TGT, - const NT1 *p_target_xc = std::dynamic_pointer_cast(target_xc)->get(); - const NT1 *p_target_yc = std::dynamic_pointer_cast(target_yc)->get(); - const NT1 *p_target_zc = std::dynamic_pointer_cast(target_zc)->get(); + const NT_TGT *p_target_xc = std::dynamic_pointer_cast(target_xc)->get(); + const NT_TGT *p_target_yc = std::dynamic_pointer_cast(target_yc)->get(); + const NT_TGT *p_target_zc = std::dynamic_pointer_cast(target_zc)->get(); NESTED_TEMPLATE_DISPATCH_FP( const teca_variant_array_impl, source_xc.get(), - 2, + _SRC, - const NT2 *p_source_xc = std::dynamic_pointer_cast(source_xc)->get(); - const NT2 *p_source_yc = std::dynamic_pointer_cast(source_yc)->get(); - const NT2 *p_source_zc = std::dynamic_pointer_cast(source_zc)->get(); + const NT_SRC *p_source_xc = std::dynamic_pointer_cast(source_xc)->get(); + const NT_SRC *p_source_yc = std::dynamic_pointer_cast(source_yc)->get(); + const NT_SRC *p_source_zc = std::dynamic_pointer_cast(source_zc)->get(); size_t n_arrays = 
source_arrays.size(); for (size_t i = 0; i < n_arrays; ++i) @@ -417,25 +559,37 @@ const_p_teca_dataset teca_cartesian_mesh_regrid::execute( NESTED_TEMPLATE_DISPATCH( teca_variant_array_impl, target_a.get(), - 3, + _DATA, - const NT3 *p_source_a = std::static_pointer_cast(source_a)->get(); - NT3 *p_target_a = std::static_pointer_cast(target_a)->get(); + const NT_DATA *p_source_a = std::static_pointer_cast(source_a)->get(); + NT_DATA *p_target_a = std::static_pointer_cast(target_a)->get(); if (interpolate(this->interpolation_mode, target_nx, target_ny, target_nz, p_target_xc, p_target_yc, p_target_zc, p_target_a, p_source_xc, p_source_yc, p_source_zc, p_source_a, source_ihi, source_jhi, - source_khi, source_nx, source_nxy)) + source_khi, source_nx, source_ny, source_nz)) { TECA_ERROR("Failed to move \"" << source_arrays[i] << "\"") return nullptr; } - - target_ac->set(source_arrays[i], target_a); ) + else + { + TECA_ERROR("Unsupported array type " << source_a->get_class_name()) } - ) + + target_ac->set(source_arrays[i], target_a); + } ) + else + { + TECA_ERROR("Unupported coordinate type " << source_xc->get_class_name()) + } + ) + else + { + TECA_ERROR("Unupported coordinate type " << target_xc->get_class_name()) + } return target; } diff --git a/alg/teca_cartesian_mesh_regrid.h b/alg/teca_cartesian_mesh_regrid.h index f9ae85da2..d67c5f7f0 100644 --- a/alg/teca_cartesian_mesh_regrid.h +++ b/alg/teca_cartesian_mesh_regrid.h @@ -4,26 +4,29 @@ #include "teca_shared_object.h" #include "teca_algorithm.h" #include "teca_metadata.h" -#include "teca_variant_array_fwd.h" +#include "teca_variant_array.h" #include #include TECA_SHARED_OBJECT_FORWARD_DECL(teca_cartesian_mesh_regrid) -/// transfer data between overlapping meshes of potentially different resolution -/** -an algorithm that transfers data between cartesian meshes defined in the same -world coordinate system but potentially different resolutions. nearest or -linear interpolation are supported. - -By default the first input is the target mesh. the second input is the source -mesh. This can be changed by setting the target_input property. - -the arrays to move from source to target can be selected using add_array api or -in the request key regrid_source_arrays. this is a spatial regriding operation -for temporal regriding see teca_mesh_temporal_regrid. -*/ +/** @brief + * Transfers data between spatially overlapping meshes of potentially different + * resolutions. + * + * @details + * an algorithm that transfers data between cartesian meshes defined in the + * same world coordinate system but potentially different resolutions. nearest + * or linear interpolation are supported. + * + * By default the first input is the target mesh. the second input is the + * source mesh. This can be changed by setting the target_input property. + * + * the arrays to move from source to target can be selected using add_array api + * or in the request key "arrays". this is a spatial regriding operation for + * temporal regriding see teca_mesh_temporal_regrid. 
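// --------------------------------------------------------------------------
// [editor's sketch, not from the TECA sources] wiring the regridder described
// here: input 0 carries the target mesh, input 1 the source mesh, and the
// arrays to move are named explicitly. the add_array call and the "prw"
// variable are illustrative; per the comment above, arrays may also be
// supplied through the "arrays" request key. set_interpolation_mode_linear()
// is declared in the header below.
#include "teca_cartesian_mesh_regrid.h"

p_teca_cartesian_mesh_regrid configure_regrid(
    const teca_algorithm_output_port &target_mesh,
    const teca_algorithm_output_port &source_mesh)
{
    p_teca_cartesian_mesh_regrid regrid = teca_cartesian_mesh_regrid::New();

    regrid->set_input_connection(0, target_mesh); // provides output geometry
    regrid->set_input_connection(1, source_mesh); // provides the data

    regrid->add_array("prw");                // array to move onto the target
    regrid->set_interpolation_mode_linear(); // bi/tri-linear interpolation

    return regrid;
}
// --------------------------------------------------------------------------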
+ */ class teca_cartesian_mesh_regrid : public teca_algorithm { public: @@ -37,23 +40,33 @@ class teca_cartesian_mesh_regrid : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the list of arrays to move from the source - // to the target + /** @name array + * set the list of arrays to move from the source to the target + */ + //@{ TECA_ALGORITHM_VECTOR_PROPERTY(std::string, array) + //@} - // set the input connection from which metadata such as arrays - // and time steps are taken from. + /** @name target_input + * set the input connection which provides the output geometry. + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, target_input) - - // set the interpolation mode used in transfering - // data between meshes of differing resolution. - // in nearest mode value at the nearest grid point - // is used, in linear mode bi/tri linear interpolation - // is used. + ///@} + + /** @name interpolation_mode + * set the interpolation mode used in transfering data between meshes of + * differing resolution. in nearest mode value at the nearest grid point + * is used, in linear mode bi/tri linear interpolation is used. + */ + //@{ enum {nearest=0, linear=1}; TECA_ALGORITHM_PROPERTY(int, interpolation_mode) void set_interpolation_mode_nearest(){ interpolation_mode = nearest; } void set_interpolation_mode_linear(){ interpolation_mode = linear; } + //@} + + protected: teca_cartesian_mesh_regrid(); diff --git a/alg/teca_cartesian_mesh_source.cxx b/alg/teca_cartesian_mesh_source.cxx index 7946d188f..2139a9864 100644 --- a/alg/teca_cartesian_mesh_source.cxx +++ b/alg/teca_cartesian_mesh_source.cxx @@ -26,12 +26,19 @@ struct teca_cartesian_mesh_source::internals_t // the world space [x0 x1 y0 y1 z0 z1 t0 t1] generate // equally spaced coordinate axes x,y,z,t static - void initialize_axes(int type_code, unsigned long *extent, - double *bounds, p_teca_variant_array &x_axis, + void initialize_axes(int type_code, const unsigned long *extent, + const double *bounds, p_teca_variant_array &x_axis, p_teca_variant_array &y_axis, p_teca_variant_array &z_axis, p_teca_variant_array &t_axis); + static + void initialize_axes(int type_code, const unsigned long *extent, + const double *bounds, p_teca_variant_array &x_axis, + p_teca_variant_array &y_axis, p_teca_variant_array &z_axis); + + // cached metadata teca_metadata metadata; + p_teca_variant_array t_axis; }; @@ -45,21 +52,25 @@ void teca_cartesian_mesh_source::internals_t::initialize_axis( unsigned long nx = i1 - i0 + 1; x->resize(nx); + num_t *px = x->get(); + // avoid divide by zero if (nx < 2) + { + px[0] = x0; return; + } num_t dx = (x1 - x0)/(nx - 1l); num_t xx = x0 + i0*dx; - num_t *px = x->get(); for (unsigned long i = 0; i < nx; ++i) px[i] = xx + dx*i; } // -------------------------------------------------------------------------- void teca_cartesian_mesh_source::internals_t::initialize_axes(int type_code, - unsigned long *extent, double *bounds, p_teca_variant_array &x_axis, + const unsigned long *extent, const double *bounds, p_teca_variant_array &x_axis, p_teca_variant_array &y_axis, p_teca_variant_array &z_axis, p_teca_variant_array &t_axis) { @@ -86,6 +97,30 @@ void teca_cartesian_mesh_source::internals_t::initialize_axes(int type_code, ) } +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::internals_t::initialize_axes(int type_code, + const unsigned long *extent, const double *bounds, p_teca_variant_array &x_axis, + p_teca_variant_array 
&y_axis, p_teca_variant_array &z_axis) +{ + // gernate equally spaced coordinate axes x,y,z,t + x_axis = teca_variant_array_factory::New(type_code); + y_axis = x_axis->new_instance(); + z_axis = x_axis->new_instance(); + + TEMPLATE_DISPATCH(teca_variant_array_impl, + x_axis.get(), + + internals_t::initialize_axis(std::static_pointer_cast(x_axis), + extent[0], extent[1], bounds[0], bounds[1]); + + internals_t::initialize_axis(std::static_pointer_cast(y_axis), + extent[2], extent[3], bounds[2], bounds[3]); + + internals_t::initialize_axis(std::static_pointer_cast(z_axis), + extent[4], extent[5], bounds[4], bounds[5]); + ) +} + // -------------------------------------------------------------------------- @@ -93,9 +128,7 @@ teca_cartesian_mesh_source::teca_cartesian_mesh_source() : coordinate_type_code(teca_variant_array_code::get()), field_type_code(teca_variant_array_code::get()), x_axis_variable("lon"), y_axis_variable("lat"), z_axis_variable("plev"), - t_axis_variable("time"), x_axis_units("degrees_east"), - y_axis_units("degrees_north"), z_axis_units("pascals"), - calendar("Gregorian"), time_units("seconds since 1970-01-01 00:00:00"), + t_axis_variable("time"), whole_extents{0l, 359l, 0l, 179l, 0l, 0l, 0l, 0l}, bounds{0., 360, -90., 90., 0., 0., 0., 0.}, internals(new internals_t) @@ -129,7 +162,6 @@ void teca_cartesian_mesh_source::set_properties(const std::string &prefix, } #endif - // -------------------------------------------------------------------------- void teca_cartesian_mesh_source::set_modified() { @@ -143,11 +175,311 @@ void teca_cartesian_mesh_source::set_modified() void teca_cartesian_mesh_source::clear_cached_metadata() { this->internals->metadata.clear(); + teca_algorithm::set_modified(); +} + + + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_x_axis_variable(const std::string &name) +{ + this->x_axis_variable = name; + this->x_axis_attributes.clear(); + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_x_axis_variable(const std::string &name, + const teca_metadata &atts) +{ + this->x_axis_variable = name; + this->x_axis_attributes = atts; + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_x_axis_variable(const teca_metadata &md) +{ + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + if (coords.get("x_variable", this->x_axis_variable)) + return -1; + + teca_metadata atts; + if (md.get("attributes", atts)) + return -1; + + if (atts.get(this->x_axis_variable, this->x_axis_attributes)) + return -1; + + return 0; +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_y_axis_variable(const std::string &name) +{ + this->y_axis_variable = name; + this->y_axis_attributes.clear(); + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_y_axis_variable(const std::string &name, + const teca_metadata &atts) +{ + this->y_axis_variable = name; + this->y_axis_attributes = atts; + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_y_axis_variable(const teca_metadata &md) +{ + teca_metadata coords; + if (md.get("coordinates", 
coords)) + return -1; + + if (coords.get("y_variable", this->y_axis_variable)) + return -1; + + teca_metadata atts; + if (md.get("attributes", atts)) + return -1; + + if (atts.get(this->y_axis_variable, this->y_axis_attributes)) + return -1; + + return 0; +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_z_axis_variable(const std::string &name) +{ + this->z_axis_variable = name; + this->z_axis_attributes.clear(); + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_z_axis_variable(const std::string &name, + const teca_metadata &atts) +{ + this->z_axis_variable = name; + this->z_axis_attributes = atts; + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_z_axis_variable(const teca_metadata &md) +{ + // get coordinates and attributes, fail if either are missing + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + if (coords.get("x_variable", this->z_axis_variable)) + return -1; + + teca_metadata atts; + if (md.get("attributes", atts)) + return -1; + + if (atts.get(this->z_axis_variable, this->z_axis_attributes)) + return -1; + + return 0; +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_t_axis_variable(const std::string &name) +{ + this->t_axis_variable = name; + this->t_axis_attributes.clear(); + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_calendar( + const std::string &calendar, const std::string &units) +{ + this->t_axis_attributes.clear(); + this->t_axis_attributes.set("calendar", calendar); + this->t_axis_attributes.set("units", units); + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_t_axis_variable(const std::string &name, + const teca_metadata &atts) +{ + this->t_axis_variable = name; + this->t_axis_attributes = atts; + teca_algorithm::set_modified(); +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_t_axis_variable(const teca_metadata &md) +{ + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + if (coords.get("t_variable", this->t_axis_variable)) + return -1; + + teca_metadata atts; + if (md.get("attributes", atts)) + return -1; + + if (atts.get(this->t_axis_variable, this->t_axis_attributes)) + return -1; + + return 0; +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_t_axis(const teca_metadata &md) +{ + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + this->internals->t_axis = coords.get("t"); + + return 0; +} + +// -------------------------------------------------------------------------- +void teca_cartesian_mesh_source::set_t_axis(const p_teca_variant_array &t) +{ + this->internals->t_axis = t; +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_output_metadata(const teca_metadata &md) +{ + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + teca_metadata atts; + if (md.get("attributes", atts)) + return -1; + + // 
get the coordinate axes. + const_p_teca_variant_array x = coords.get("x"); + const_p_teca_variant_array y = coords.get("y"); + const_p_teca_variant_array z = coords.get("z"); + const_p_teca_variant_array t = coords.get("t"); + + // because of assumptions made in execute, all must be provided + if (!x || !y || !z || !t) + return -1; + + unsigned long nx = x->size(); + unsigned long ny = y->size(); + unsigned long nz = z->size(); + unsigned long nxyz = nx*ny*nz; + + // clear out any variables, and replace with those that we provide. + std::vector vars; + std::vector::iterator it = this->field_generators.begin(); + std::vector::iterator end = this->field_generators.end(); + for (; it != end; ++it) + { + vars.push_back(it->name); + + // correct size + teca_metadata var_atts = it->attributes; + var_atts.set("size", nxyz); + + atts.set(it->name, var_atts); + } + + // copy the metadata + this->set_modified(); + + this->internals->metadata = md; + this->internals->metadata.set("variables", vars); + + return 0; +} + +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_spatial_extents(const teca_metadata &md, + bool three_d) +{ + // get coordinates and attributes, fail if either are missing + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + teca_metadata attributes; + if (md.get("attributes", attributes)) + return -1; + + // get the coordinate axes + p_teca_variant_array x = coords.get("x"); + p_teca_variant_array y = coords.get("y"); + p_teca_variant_array z = coords.get("z"); + + // verify + if (!x || !y || (three_d && !z)) + return -1; + + // set the extents + this->whole_extents[0] = 0; + this->whole_extents[1] = x->size() - 1; + this->whole_extents[2] = 0; + this->whole_extents[3] = y->size() - 1; + this->whole_extents[4] = 0; + this->whole_extents[5] = three_d ? z->size() - 1 : 0; + + return 0; +} +// -------------------------------------------------------------------------- +int teca_cartesian_mesh_source::set_spatial_bounds(const teca_metadata &md, + bool three_d) +{ + // get coordinates and attributes, fail if either are missing + teca_metadata coords; + if (md.get("coordinates", coords)) + return -1; + + teca_metadata attributes; + if (md.get("attributes", attributes)) + return -1; + + // get the coordinate axes + p_teca_variant_array x = coords.get("x"); + p_teca_variant_array y = coords.get("y"); + p_teca_variant_array z = coords.get("z"); + + // verify + if (!x || !y || (three_d && !z)) + return -1; + + // get the bounds + x->get(0lu, this->bounds[0]); + x->get(x->size() - 1lu, this->bounds[1]); + y->get(0lu, this->bounds[2]); + y->get(y->size() - 1lu, this->bounds[3]); + z->get(0lu, this->bounds[4]); + + unsigned long khi = three_d ? 
z->size() - 1lu : 0lu; + z->get(khi, this->bounds[5]); + + // set the coordinate type + this->set_coordinate_type_code(x->type_code()); + + return 0; } // -------------------------------------------------------------------------- void teca_cartesian_mesh_source::append_field_generator( - const std::string &name, const teca_array_attributes &atts, + const std::string &name, const teca_metadata &atts, field_generator_callback &callback) { this->append_field_generator({name, atts, callback}); @@ -181,59 +513,59 @@ teca_metadata teca_cartesian_mesh_source::get_output_metadata( // generate cooridnate axes p_teca_variant_array x_axis, y_axis, z_axis, t_axis; - internals_t::initialize_axes(this->coordinate_type_code, - this->whole_extents.data(), this->bounds.data(), x_axis, - y_axis, z_axis, t_axis); + if (this->internals->t_axis) + { + // generate x,y,z axes but use cached time axis + internals_t::initialize_axes(this->coordinate_type_code, + this->whole_extents.data(), this->bounds.data(), x_axis, + y_axis, z_axis); - size_t nx = this->whole_extents[1] - this->whole_extents[0] + 1; - size_t ny = this->whole_extents[3] - this->whole_extents[2] + 1; - size_t nz = this->whole_extents[5] - this->whole_extents[4] + 1; - size_t nt = this->whole_extents[7] - this->whole_extents[6] + 1; - size_t nxyz = nx*ny*nz; + t_axis = this->internals->t_axis; + } + else + { + // generate x,y,z and t axes + internals_t::initialize_axes(this->coordinate_type_code, + this->whole_extents.data(), this->bounds.data(), x_axis, + y_axis, z_axis, t_axis); + } - std::string x_ax_var_name = (this->x_axis_variable.empty() ? "x" : this->x_axis_variable); - std::string y_ax_var_name = (this->y_axis_variable.empty() ? "y" : this->y_axis_variable); - std::string z_ax_var_name = (this->z_axis_variable.empty() ? "z" : this->z_axis_variable); - std::string t_ax_var_name = (this->t_axis_variable.empty() ? "t" : this->t_axis_variable); + size_t nx = x_axis->size(); + size_t ny = y_axis->size(); + size_t nz = z_axis->size(); + size_t nt = t_axis->size(); // construct attributes - teca_metadata x_atts; - x_atts.set("units", (this->x_axis_units.empty() ? "meters" : this->x_axis_units)); - x_atts.set("type_code", this->coordinate_type_code); + teca_metadata x_atts = this->x_axis_attributes; + x_atts.set("type_code", x_axis->type_code()); x_atts.set("size", nx); - teca_metadata y_atts; - y_atts.set("units", (this->y_axis_units.empty() ? "meters" : this->y_axis_units)); - y_atts.set("type_code", this->coordinate_type_code); + teca_metadata y_atts = this->y_axis_attributes; + y_atts.set("type_code", y_axis->type_code()); y_atts.set("size", ny); - teca_metadata z_atts; - z_atts.set("units", (this->z_axis_units.empty() ? "meters" : this->z_axis_units)); - z_atts.set("type_code", this->coordinate_type_code); + teca_metadata z_atts = this->z_axis_attributes; + z_atts.set("type_code", z_axis->type_code()); z_atts.set("size", nz); - teca_metadata t_atts; - t_atts.set("units", (this->time_units.empty() ? - "seconds since 1970-01-01 00:00:00" : this->time_units)); - - t_atts.set("calendar", (this->calendar.empty() ? 
- "standard" : this->calendar)); - - t_atts.set("type_code", this->coordinate_type_code); + teca_metadata t_atts = this->t_axis_attributes; + t_atts.set("type_code", t_axis->type_code()); t_atts.set("size", nt); teca_metadata atts; - atts.set(x_ax_var_name, x_atts); - atts.set(y_ax_var_name, y_atts); - atts.set(z_ax_var_name, z_atts); - atts.set(t_ax_var_name, t_atts); + atts.set(this->x_axis_variable, x_atts); + atts.set(this->y_axis_variable, y_atts); + atts.set(this->z_axis_variable, z_atts); + + if (!this->t_axis_variable.empty()) + atts.set(this->t_axis_variable, t_atts); // construct dataset metadata teca_metadata coords; - coords.set("x_variable", x_ax_var_name); - coords.set("y_variable", y_ax_var_name); - coords.set("z_variable", z_ax_var_name); - coords.set("t_variable", t_ax_var_name); + coords.set("x_variable", this->x_axis_variable); + coords.set("y_variable", this->y_axis_variable); + coords.set("z_variable", this->z_axis_variable); + coords.set("t_variable", this->t_axis_variable); coords.set("x", x_axis); coords.set("y", y_axis); @@ -243,6 +575,7 @@ teca_metadata teca_cartesian_mesh_source::get_output_metadata( this->internals->metadata.set("whole_extent", this->whole_extents); this->internals->metadata.set("coordinates", coords); + size_t nxyz = nx*ny*nz; std::vector vars; std::vector::iterator it = this->field_generators.begin(); std::vector::iterator end = this->field_generators.end(); @@ -251,18 +584,24 @@ teca_metadata teca_cartesian_mesh_source::get_output_metadata( vars.push_back(it->name); // correct size - teca_array_attributes var_atts = it->attributes; - var_atts.size = nxyz; + teca_metadata var_atts = it->attributes; + var_atts.set("size", nxyz); - atts.set(it->name, teca_metadata(var_atts)); + atts.set(it->name, var_atts); } this->internals->metadata.set("variables", vars); this->internals->metadata.set("attributes", atts); - this->internals->metadata.set("number_of_time_steps", t_axis->size()); - this->internals->metadata.set("index_initializer_key", std::string("number_of_time_steps")); - this->internals->metadata.set("index_request_key", std::string("time_step")); + // setup the execution control keys + this->internals->metadata.set("number_of_time_steps", + t_axis->size()); + + this->internals->metadata.set("index_initializer_key", + std::string("number_of_time_steps")); + + this->internals->metadata.set("index_request_key", + std::string("time_step")); return this->internals->metadata; } @@ -320,25 +659,44 @@ const_p_teca_dataset teca_cartesian_mesh_source::execute(unsigned int port, { // bounds key was present, convert the bounds to an // an extent that covers them. - if (teca_coordinate_util::bounds_to_extent( - req_bounds, in_x, in_y, in_z, req_extent)) + if (teca_coordinate_util::bounds_to_extent(req_bounds, + in_x, in_y, in_z, req_extent) || + teca_coordinate_util::validate_extent(in_x->size(), + in_y->size(), in_z->size(), req_extent, true)) { TECA_ERROR("invalid bounds requested.") return nullptr; } } - // get the timestep - unsigned long time_step = 0; - if (request.get("time_step", time_step)) + // get the timestep, no matter what the key is named we treat it as + // a time step. this is to support metadata provided by another source + // eg. a different reader. 
+ std::string request_key; + if (request.get("index_request_key", request_key)) + { + TECA_ERROR("Request is missing the \"index_request_key\"") + return nullptr; + } + + unsigned long req_index = 0; + if (request.get(request_key, req_index)) + { + TECA_ERROR("Request is missing \"" << request_key << "\"") + return nullptr; + } + + // check that the we have a time value for the requested index. + if (req_index >= in_t->size()) { - TECA_ERROR("Request is missing time_step") + TECA_ERROR("The requested index " << req_index + << " is out of bounds [0, " << in_t->size() << "]") return nullptr; } // get the time double t = 0.; - in_t->get(time_step, t); + in_t->get(req_index, t); // slice axes on the requested extent p_teca_variant_array out_x = in_x->new_copy(req_extent[0], req_extent[1]); @@ -351,22 +709,29 @@ const_p_teca_dataset teca_cartesian_mesh_source::execute(unsigned int port, std::string x_variable = this->x_axis_variable.empty() ? "x" : this->x_axis_variable; std::string y_variable = this->y_axis_variable.empty() ? "y" : this->y_axis_variable; std::string z_variable = this->z_axis_variable.empty() ? "z" : this->z_axis_variable; - std::string t_variable = this->t_axis_variable.empty() ? "t" : this->t_axis_variable; mesh->set_x_coordinates(x_variable, out_x); mesh->set_y_coordinates(y_variable, out_y); mesh->set_z_coordinates(z_variable, out_z); + // get the calendar + std::string calendar; + std::string units; + teca_metadata atts; + this->internals->metadata.get("attributes", atts); + atts.get("calendar", calendar); + atts.get("units", units); + // set metadata mesh->set_whole_extent(md_whole_extent); mesh->set_extent(req_extent); - mesh->set_time_step(time_step); + mesh->set_time_step(req_index); mesh->set_time(t); - mesh->set_calendar(this->calendar); - mesh->set_time_units(this->time_units); + mesh->set_calendar(calendar); + mesh->set_time_units(units); teca_metadata &mesh_md = mesh->get_metadata(); - mesh_md.set("index_request_key", std::string("time_step")); + mesh_md.set("index_request_key", request_key); // generate fields over the requested subset std::vector::iterator it = this->field_generators.begin(); @@ -378,8 +743,6 @@ const_p_teca_dataset teca_cartesian_mesh_source::execute(unsigned int port, } // pass the attributes - teca_metadata atts; - this->internals->metadata.get("attributes", atts); mesh_md.set("attributes", atts); return mesh; diff --git a/alg/teca_cartesian_mesh_source.h b/alg/teca_cartesian_mesh_source.h index be1e5039a..d357ad0ba 100644 --- a/alg/teca_cartesian_mesh_source.h +++ b/alg/teca_cartesian_mesh_source.h @@ -2,7 +2,7 @@ #define teca_cartesian_mesh_source_h #include "teca_algorithm.h" -#include "teca_array_attributes.h" +#include "teca_metadata.h" #include #include @@ -10,19 +10,27 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_cartesian_mesh_source) -// f(x, y, z, t) -// given spatial coordinate axes x,y,z and the time t, return the field +/** The signature of the callback used to specify user defined fields. + * f(x, y, z, t) -> w + * Given spatial coordinate axes x,y,z and the time t, return the + * 3D field w. + */ using field_generator_callback = std::function; +/** An object that bundles field name, the metadata attributes needed for I/O, + * and a field generator callback. 
Use this with append_field_generator + */ struct field_generator { std::string name; - teca_array_attributes attributes; + teca_metadata attributes; field_generator_callback generator; }; +using field_generator_t = field_generator; + inline bool operator==(const field_generator &l, const field_generator &r) { @@ -35,12 +43,25 @@ bool operator!=(const field_generator &l, const field_generator &r) return l.name != r.name; } -using field_generator_t = field_generator; - -/** -An algorithm that constructs and serves up a Cartesian mesh -of the specified dimensions. -*/ +/** @brief + * An algorithm that generates a teca_cartesian_mesh of the requested + * spatial and temporal dimensions with optional user defined fields. + * + * @details + * User defined fields are specified by passing callbacks and metadata + * via field_generator and append_field_generator + * + * The spatial and temporal dimensions are set by the combination of + * whole_extent and bounds. + * + * The names of coordinate axes are set by the combination + * of x_axis_variable, y_axis_variable, z_axis_variable, + * and t_axis_variable + * + * The units of the coordinate axes are set by the combination of + * x_axis_units, y_axis_units, z_axis_units, calendar, + * and time_units. + */ class teca_cartesian_mesh_source : public teca_algorithm { public: @@ -54,65 +75,211 @@ class teca_cartesian_mesh_source : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set/get the type code for generated coordinates. - // default is a 64 bit floating point type. Use - // teca_variant_array_type::get() to get specific type - // codes for C++ POD types NT. + /** @name coordinate_type_code + * set/get the type code for generated coordinates. The default is a 64 bit + * floating point type. Use teca_variant_array_code::get() to get + * specific type codes for C++ POD types NT. + */ + ///@{ TECA_ALGORITHM_PROPERTY(unsigned int, coordinate_type_code) + ///@} + + /** @name field_type_code + * set/get the type code for generated fields. The default is a 64 bit + * floating point type. Use teca_variant_array_code::get() to get + * specific type codes for C++ POD types NT. + */ + ///@{ TECA_ALGORITHM_PROPERTY(unsigned int, field_type_code) + ///@} - // set/get the global index space extent of the data. the extents are - // given by 8 values, 6 spatial plus 2 temporal, in the following order - // [i0 i1 j0 j1 k0 k1 q0 q1] - // this should be the same on all ranks elements. + /** @name whole_extent + * set/get the global index space extent of the data. the extents are + * given by 8 values, 6 spatial plus 2 temporal, in the following order + * [i0 i1 j0 j1 k0 k1 q0 q1] This should be the same on all ranks + */ + ///@{ TECA_ALGORITHM_VECTOR_PROPERTY(unsigned long, whole_extent) - // set/get the global bounds of the data. the bounds are 8 values 6 spatial - // plus 2 temporal in the following order. - // [x0 x1 y0 y1 z0 z1 t0 t1] - // this should be the same on all ranks elements. + /** Set the spatial extents from a metadata object following the + * conventions defined by the teca_cf_reader. If three_d is true the + * extents in the z-direction are copied, otherwise they are set to 0. + * Returns zero if successful and non-zero if the supplied metadata is + * missing any of the requisite information. + **/ + int set_spatial_extents(const teca_metadata &md, bool three_d = true); + ///@} + + /** @name bounds + * set/get the global bounds of the data. 
the bounds are 8 values 6 spatial + * plus 2 temporal in the following order. [x0 x1 y0 y1 z0 z1 t0 t1] + * this should be the same on all ranks. + */ + ///@{ TECA_ALGORITHM_VECTOR_PROPERTY(double, bound) - // set the variable to use for the coordinate axes. - // the defaults are: x => lon, y => lat, z = plev, - // t => time - TECA_ALGORITHM_PROPERTY(std::string, x_axis_variable) - TECA_ALGORITHM_PROPERTY(std::string, y_axis_variable) - TECA_ALGORITHM_PROPERTY(std::string, z_axis_variable) - TECA_ALGORITHM_PROPERTY(std::string, t_axis_variable) - - // set the units of spatial axes. The defaults are: - // degrees_east, degrees_north, and pressure_level - TECA_ALGORITHM_PROPERTY(std::string, x_axis_units) - TECA_ALGORITHM_PROPERTY(std::string, y_axis_units) - TECA_ALGORITHM_PROPERTY(std::string, z_axis_units) - - // number of time steps to generate - TECA_ALGORITHM_PROPERTY(std::string, calendar) - TECA_ALGORITHM_PROPERTY(std::string, time_units) - - // set the named callbacks to generate fields on the mesh. A callback - // function must have the signature f(x,y,z,t). - TECA_ALGORITHM_VECTOR_PROPERTY(field_generator_t, field_generator); - - // set a callback function f(x,y,z,t) that generates a field named name - // x,y,z are coordinate axes in variant arrays, t is the double precision - // time value. + /** Set the spatial bounds from a metadata object following the conventions + * defined by the teca_cf_reader. Returns zero if successful and + * non-zero if the supplied metadata is missing any of the requisite + * information. + */ + int set_spatial_bounds(const teca_metadata &md, bool three_d = true); + + ///@} + + /** @name x_axis_variable + * set the name of the variable to use for the coordinate axes and + * optionally associated attributes. + */ + ///@{ + /** set the name of the t_axis_variable */ + void set_x_axis_variable(const std::string &name); + + /** Set the name of the variable and its attributes. See + * teca_array_attributes for more information. + */ + void set_x_axis_variable(const std::string &name, const teca_metadata &atts); + + /** Set the name of the variable and its attributes using conventions + * defined by the teca_cf_reader. Returns zero if successful and + * non-zero if the supplied metadata is missing any of the requisite + * information. + */ + int set_x_axis_variable(const teca_metadata &md); + ///@} + + /** @name y_axis_variable + * set the name of the variable to use for the coordinate axes and + * optionally associated attributes. + */ + ///@{ + /** set the name of the y_axis_variable */ + void set_y_axis_variable(const std::string &name); + + /** Set the name of the variable and its attributes. See + * teca_array_attributes for more information. + */ + void set_y_axis_variable(const std::string &name, const teca_metadata &atts); + + /** Set the name of the variable and its attributes using conventions + * defined by the teca_cf_reader. Returns zero if successful and + * non-zero if the supplied metadata is missing any of the requisite + * information. + */ + int set_y_axis_variable(const teca_metadata &md); + ///@} + + /** @name z_axis_variable + * set the name of the variable to use for the coordinate axes and + * optionally associated attributes. + */ + ///@{ + /** set the name of the z_axis_variable */ + void set_z_axis_variable(const std::string &name); + + /** Set the name of the variable and its attributes. See + * teca_array_attributes for more information. 
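This group of setters continues just below. A hedged sketch of driving the new metadata-based setters from an existing dataset, so that the generated mesh matches its coordinate system, calendar, and time axis. The teca_cf_reader calls (set_files_regex, update_metadata) are assumed from their use elsewhere in TECA and are not introduced by this patch; the regex is a placeholder, and the t-axis overloads used here are declared a little further down.

    #include "teca_cf_reader.h"
    #include "teca_cartesian_mesh_source.h"

    // fetch the report metadata of an existing dataset
    p_teca_cf_reader reader = teca_cf_reader::New();
    reader->set_files_regex("prw.*\\.nc$");
    teca_metadata md = reader->update_metadata();

    // configure the source from the reader's conventions
    p_teca_cartesian_mesh_source source = teca_cartesian_mesh_source::New();
    if (source->set_spatial_extents(md) || source->set_spatial_bounds(md) ||
        source->set_x_axis_variable(md) || source->set_y_axis_variable(md) ||
        source->set_z_axis_variable(md) || source->set_t_axis_variable(md) ||
        source->set_t_axis(md))
    {
        TECA_ERROR("The metadata is missing required information")
    }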
+ */ + void set_z_axis_variable(const std::string &name, const teca_metadata &atts); + + /** Set the name of the variable and its attributes using conventions + * defined by the teca_cf_reader. Returns zero if successful and + * non-zero if the supplied metadata is missing any of the requisite + * information. + */ + int set_z_axis_variable(const teca_metadata &md); + ///@} + + /** @name t_axis_variable + * set the name of the variable to use for the coordinate axes and + * optionally associated attributes. + */ + ///@{ + /** set the name of the t_axis_variable */ + void set_t_axis_variable(const std::string &name); + + /** Set the calendar, and time units of the t_axis_variable */ + void set_calendar(const std::string &calendar, const std::string &units); + + /** Set the name of the variable and its attributes. See + * teca_array_attributes for more information. + */ + void set_t_axis_variable(const std::string &name, + const teca_metadata &atts); + + /** Set the name of the variable and its attributes using conventions + * defined by the teca_cf_reader. Returns zero if successful and + * non-zero if the supplied metadata is missing any of the requisite + * information. + */ + int set_t_axis_variable(const teca_metadata &md); + + /** Set the time axis using coordinate conventions defined by the + * teca_cf_reader. When a time axis is provided values are served up from + * the array rather than being generated. Execution control keys are also + * made use of if present. Returns zero if successful and non-zero if the + * supplied metadata is missing any of the requisite information. + */ + int set_t_axis(const teca_metadata &md); + + /** Set the time axis directly. When a time axis is provided values are + * served up from the array rather than being generated. Execution control + * keys are also made use of if present. + */ + void set_t_axis(const p_teca_variant_array &t); + ///@} + + /** @name output_metadata + * Set the output metadata directly. The provided metadata must contain + * "coordinates" as defined by the teca_cf_reader because these are + * required for mesh generation. Pipeline execution control keys as defined + * by teca_index_executive are also required. Calendaring metadata is + * recommended. A copy of the passed object is made but "variables" are + * replaced with those generated by this class, if any. As a result be sure + * to specifiy field generators before calling this method. Returns 0 if + * successful, and non-zero if the supplied metadata doesn't contain the + * expected information. No error messages are sent to the terminal. + */ + ///@{ + int set_output_metadata(const teca_metadata &md); + ///@} + + /** @name append_field_generator + * set a callback function f(x,y,z,t) that generates a field named name + * x,y,z are coordinate axes in variant arrays, t is the double precision + * time value. + */ + ///@{ void append_field_generator(const std::string &name, - const teca_array_attributes &atts, field_generator_callback &callback); + const teca_metadata &atts, field_generator_callback &callback); + ///@} + + /** @name field_generator + * Set/get the named callbacks that generate fields on the mesh. These + * should be packaged in the field_generator struct so that field name + * and attributes for I/O are provided together with the callback. 
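This doc group closes just below. As an illustration of the field generator interface it summarizes, here is a hedged sketch of registering a user defined field. The callback parameter types are an assumption (the template arguments of field_generator_callback are elided in this copy of the patch); the f(x, y, z, t) -> w convention is taken from the doc comment earlier in this header, and teca_double_array is used by analogy with the teca_char_array usage later in this patch.

    // assumed signature: the coordinate axes as variant arrays plus the time
    // value, returning a newly allocated field sized nx*ny*nz
    field_generator_callback gen = [](const const_p_teca_variant_array &x,
        const const_p_teca_variant_array &y,
        const const_p_teca_variant_array &z,
        double t) -> p_teca_variant_array
    {
        size_t nxyz = x->size()*y->size()*z->size();
        p_teca_double_array w = teca_double_array::New(nxyz);
        double *pw = w->get();
        for (size_t i = 0; i < nxyz; ++i)
            pw[i] = t;                 // placeholder: a field constant in space
        return w;
    };

    // I/O attributes for the generated variable (illustrative values)
    teca_metadata atts;
    atts.set("units", std::string("K"));
    atts.set("long_name", std::string("synthetic temperature"));

    p_teca_cartesian_mesh_source source = teca_cartesian_mesh_source::New();
    source->append_field_generator("temperature", atts, gen);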
+ */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(field_generator_t, field_generator) + ///@} protected: teca_cartesian_mesh_source(); private: + /// implements the report phase of pipeline execution teca_metadata get_output_metadata(unsigned int port, const std::vector &input_md) override; + /// implements the execute phase of pipeline execution const_p_teca_dataset execute(unsigned int port, const std::vector &input_data, const teca_metadata &request) override; + /// updates the modification state void set_modified() override; + + /// clears cached metadata in response to modification of algorithm properties void clear_cached_metadata(); private: @@ -122,11 +289,10 @@ class teca_cartesian_mesh_source : public teca_algorithm std::string y_axis_variable; std::string z_axis_variable; std::string t_axis_variable; - std::string x_axis_units; - std::string y_axis_units; - std::string z_axis_units; - std::string calendar; - std::string time_units; + teca_metadata x_axis_attributes; + teca_metadata y_axis_attributes; + teca_metadata z_axis_attributes; + teca_metadata t_axis_attributes; std::vector whole_extents; std::vector bounds; diff --git a/alg/teca_cartesian_mesh_subset.cxx b/alg/teca_cartesian_mesh_subset.cxx index e9b21991d..81837966d 100644 --- a/alg/teca_cartesian_mesh_subset.cxx +++ b/alg/teca_cartesian_mesh_subset.cxx @@ -41,13 +41,15 @@ void teca_cartesian_mesh_subset::get_properties_description( + (prefix.empty()?"teca_cartesian_mesh_subset":prefix)); opts.add_options() - TECA_POPTS_GET(vector, prefix, bounds, + TECA_POPTS_MULTI_GET(std::vector, prefix, bounds, "bounding box given by x0,x1,y0,y1,z0,z1") TECA_POPTS_GET(bool, prefix, cover_bounds, "(T)use smallest subset covering or (F)largest " "subset contained by bounds") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -55,7 +57,9 @@ void teca_cartesian_mesh_subset::get_properties_description( void teca_cartesian_mesh_subset::set_properties( const string &prefix, variables_map &opts) { - TECA_POPTS_SET(opts, vector, prefix, bounds) + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, std::vector, prefix, bounds) TECA_POPTS_SET(opts, bool, prefix, cover_bounds) } #endif @@ -85,8 +89,10 @@ teca_metadata teca_cartesian_mesh_subset::get_output_metadata( } this->extent.resize(6, 0UL); - if (teca_coordinate_util::bounds_to_extent( - this->bounds.data(), x, y, z, this->extent.data())) + if (teca_coordinate_util::bounds_to_extent(this->bounds.data(), + x, y, z, this->extent.data()) || + teca_coordinate_util::validate_extent(x->size(), + y->size(), z->size(), this->extent.data(), true)) { TECA_ERROR("Failed to convert bounds to extent") return teca_metadata(); diff --git a/alg/teca_cartesian_mesh_subset.h b/alg/teca_cartesian_mesh_subset.h index 3b2b2bf56..b4d9761ae 100644 --- a/alg/teca_cartesian_mesh_subset.h +++ b/alg/teca_cartesian_mesh_subset.h @@ -4,7 +4,7 @@ #include "teca_shared_object.h" #include "teca_algorithm.h" #include "teca_metadata.h" -#include "teca_variant_array_fwd.h" +#include "teca_variant_array.h" #include #include @@ -13,13 +13,13 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_cartesian_mesh_subset) /// applies a subset given in world coordinates to the upstream request /** -an algorithm that applies a subset specified in -world coordinates to upstream requests. the subset -is specified as bounding box of the form [x_low to x_high, -y_low to y_high, z_low to z_high]. 
The subset can be either -the smallest subset containing the bounding box or the -largest set contained by the bounding box, and is controled -by the cover_bounds property. + * an algorithm that applies a subset specified in + * world coordinates to upstream requests. the subset + * is specified as bounding box of the form [x_low to x_high, + * y_low to y_high, z_low to z_high]. The subset can be either + * the smallest subset containing the bounding box or the + * largest set contained by the bounding box, and is controled + * by the cover_bounds property. */ class teca_cartesian_mesh_subset : public teca_algorithm { @@ -34,20 +34,26 @@ class teca_cartesian_mesh_subset : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // define the bounding box of the subset - // this algorithm converts this into an - // extent into the upstream dataset. - TECA_ALGORITHM_PROPERTY(std::vector, bounds); + /** @name bounds + * define the bounding box of the subset this algorithm converts this into + * an extent into the upstream dataset. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::vector, bounds) void set_bounds(double low_x, double high_x, double low_y, double high_y, double low_z, double high_z) { this->set_bounds({low_x, high_x, low_y, high_y, low_z, high_z}); } + ///@} - // control how bounds are converted. if true - // smallest subset covering the bounding box is - // used. if false the largest subset contained - // by the bounding box is used. + /** @name cover_bounds + * control how bounds are converted. if true smallest subset covering the + * bounding box is used. if false the largest subset contained by the + * bounding box is used. + */ + ///@{ TECA_ALGORITHM_PROPERTY(bool, cover_bounds) + ///@} protected: teca_cartesian_mesh_subset(); diff --git a/alg/teca_component_area_filter.cxx b/alg/teca_component_area_filter.cxx index 2441e8d73..62773c3ed 100644 --- a/alg/teca_component_area_filter.cxx +++ b/alg/teca_component_area_filter.cxx @@ -3,7 +3,7 @@ #include "teca_variant_array.h" #include "teca_metadata.h" #include "teca_cartesian_mesh.h" -#include "teca_metadata_util.h" +#include "teca_string_util.h" #include #include @@ -82,31 +82,30 @@ void teca_component_area_filter::get_properties_description( TECA_POPTS_GET(std::string, prefix, component_variable, "name of the varibale containing connected component labeling") TECA_POPTS_GET(std::string, prefix, number_of_components_key, - "name of the key that contains the number of components" - "\"number_of_components\")") + "name of the key that contains the number of components") TECA_POPTS_GET(std::string, prefix, component_ids_key, - "name of the key that contains the list of component ids " - "\"component_ids\")") + "name of the key that contains the list of component ids") TECA_POPTS_GET(std::string, prefix, component_area_key, - "name of the key that contains the list of component areas " - "(\"component_area\")") + "name of the key that contains the list of component areas") TECA_POPTS_GET(int, prefix, mask_value, "components with area outside of the range will be replaced " - "by this label value (-1)") + "by this label value") TECA_POPTS_GET(double, prefix, low_area_threshold, "set the lower end of the range of areas to pass through. " - "components smaller than this are masked out. (-inf)") + "components smaller than this are masked out.") TECA_POPTS_GET(double, prefix, high_area_threshold, "set the higher end of the range of areas to pass through. 
" - "components larger than this are masked out. (+inf)") + "components larger than this are masked out.") TECA_POPTS_GET(std::string, prefix, variable_post_fix, "set a string that will be appended to variable names and " - "metadata keys in the filter's output (\"\")") + "metadata keys in the filter's output") TECA_POPTS_GET(int, prefix, contiguous_component_ids, "when the region label ids start at 0 and are consecutive " - "this flag enables use of an optimization (0)") + "this flag enables use of an optimization") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -114,6 +113,8 @@ void teca_component_area_filter::get_properties_description( void teca_component_area_filter::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, component_variable) TECA_POPTS_SET(opts, std::string, prefix, number_of_components_key) TECA_POPTS_SET(opts, std::string, prefix, component_ids_key) @@ -184,7 +185,7 @@ std::vector teca_component_area_filter::get_upstream_request( const std::string &var_post_fix = this->variable_post_fix; if (!var_post_fix.empty()) { - teca_metadata_util::remove_post_fix(arrays, var_post_fix); + teca_string_util::remove_post_fix(arrays, var_post_fix); } req.set("arrays", arrays); diff --git a/alg/teca_component_area_filter.h b/alg/teca_component_area_filter.h index f6c8e5a22..6ef2669c0 100644 --- a/alg/teca_component_area_filter.h +++ b/alg/teca_component_area_filter.h @@ -12,29 +12,29 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_component_area_filter) /// An algorithm that applies a mask based on connected component area /** -The filter masks the regions identified by an integer label that are outside -the range bracketed by the 'low_area_threshold' and 'high_area_threshold' -properties. These default to -inf and +inf, hence by default no regions are -masked. The mask value may be set by the 'mask_value' property which defaults -to '0'. - -The filter expects an integer field containing connected component labels. -This field is named by the 'component_variable' property. Additionally a list -of label ids and coresponding areas is expected in the dataset metadata. The -properties 'component_ids_key' and 'component_area_key' identify the latter -metadata. These default to the names used by the 'teca_2d_component_area' -algotihm, 'component_ids' and 'component_area'. - -Applying the 'teca_connected_component' algorithm followed by the -'teca_2d_component_area' algorithm is the easiest way to get valid inputs for -the 'component_area_filter'. - -The filtered coomponent ids are put in the output dataset along with the -updated lists of valid component ids and component area metadata keys. By -default the filtered data replaces the input data in the output. However, the -input data can be retained by setting the 'variable_post_fix' property, a -string that will be appended to the names of the filtered component array and -metadata keys. + * The filter masks the regions identified by an integer label that are outside + * the range bracketed by the 'low_area_threshold' and 'high_area_threshold' + * properties. These default to -inf and +inf, hence by default no regions are + * masked. The mask value may be set by the 'mask_value' property which + * defaults to '0'. + * + * The filter expects an integer field containing connected component labels. + * This field is named by the 'component_variable' property. 
Additionally a + * list of label ids and coresponding areas is expected in the dataset + * metadata. The properties 'component_ids_key' and 'component_area_key' + * identify the latter metadata. These default to the names used by the + * 'teca_2d_component_area' algotihm, 'component_ids' and 'component_area'. + * + * Applying the 'teca_connected_component' algorithm followed by the + * 'teca_2d_component_area' algorithm is the easiest way to get valid inputs + * for the 'component_area_filter'. + * + * The filtered coomponent ids are put in the output dataset along with the + * updated lists of valid component ids and component area metadata keys. By + * default the filtered data replaces the input data in the output. However, + * the input data can be retained by setting the 'variable_post_fix' property, + * a string that will be appended to the names of the filtered component array + * and metadata keys. */ class teca_component_area_filter : public teca_algorithm { @@ -51,43 +51,78 @@ class teca_component_area_filter : public teca_algorithm // set the name of the input array containing connected // component labels + /** @name component_variable + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_variable) + ///@} - // set the name of the dataset metadata key holding the number of - // components left after the filter is applied + /** @name number_of_components_key + * set the name of the dataset metadata key holding the number of + * components left after the filter is applied + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, number_of_components_key) + ///@} - // set the name of the dataset metadata key holding connected component - // label ids + /** @name component_ids_key + * set the name of the dataset metadata key holding connected component + * label ids + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_ids_key) + ///@} - // set the name of the dataset metadata key holding connected component - // areas + /** @name component_area_key + * set the name of the dataset metadata key holding connected component + * areas + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_area_key) - - // set this to be the default label id for the filtered out component - // areas. This will typically correspond to the label used for cells - // outside of the segmentation (i.e. in the background). One can use this - // property to override the mask value. The default mask value is '-1' - // which results in aquiring the mask value from input metadata key - // `background_id`. Use -2 to specify no background label. + ///@} + + /** @name mask_value + * set this to be the default label id for the filtered out component + * areas. This will typically correspond to the label used for cells + * outside of the segmentation (i.e. in the background). One can use this + * property to override the mask value. The default mask value is '-1' + * which results in aquiring the mask value from input metadata key + * `background_id`. Use -2 to specify no background label. + */ + ///@{ TECA_ALGORITHM_PROPERTY(long, mask_value) + ///@} - // set the range identifying values to area filter. - // The defaults are (-infinity, infinity]. + /** @name low_area_threshold + * set the range identifying values to area filter. The defaults are + * (-infinity, infinity]. + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, low_area_threshold) - TECA_ALGORITHM_PROPERTY(double, high_area_threshold) + ///@} - // a string to be appended to the name of the output variable. 
- // setting this to an empty string will result in the masked array - // replacing the input array in the output. default is an empty - // string "" + /** @name high_area_threshold + */ + ///@{ + TECA_ALGORITHM_PROPERTY(double, high_area_threshold) + ///@} + + /** @name variable_post_fix + * a string to be appended to the name of the output variable. setting + * this to an empty string will result in the masked array replacing the + * input array in the output. default is an empty string "" + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, variable_post_fix) + ///@} - // set this only if you know for certain that label ids - // are contiguous and start at 0. this enables use of a - // faster implementation. + /** @name contiguous_component_ids + * set this only if you know for certain that label ids are contiguous and + * start at 0. this enables use of a faster implementation. + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, contiguous_component_ids) + ///@} protected: teca_component_area_filter(); diff --git a/alg/teca_component_statistics.cxx b/alg/teca_component_statistics.cxx index a5de6f0ee..773e2f74f 100644 --- a/alg/teca_component_statistics.cxx +++ b/alg/teca_component_statistics.cxx @@ -47,6 +47,8 @@ void teca_component_statistics::get_properties_description( "list of arrays to compute statistics for") ;*/ + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -54,8 +56,7 @@ void teca_component_statistics::get_properties_description( void teca_component_statistics::set_properties( const std::string &prefix, variables_map &opts) { - (void) prefix; - (void) opts; + this->teca_algorithm::set_properties(prefix, opts); //TECA_POPTS_SET(opts, std::vector, prefix, dependent_variables) } diff --git a/alg/teca_connected_components.h b/alg/teca_connected_components.h index 0f188f7e0..693ffa1b4 100644 --- a/alg/teca_connected_components.h +++ b/alg/teca_connected_components.h @@ -12,35 +12,35 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_connected_components) /// an algorithm that computes connected component labeling /** -an algorithm that computes connected component labeling for 1D, 2D, and 3D -data. The components are computed from a binary segmentation provided on the -input. - -the input binary segmentation is labeled and stored in a variable named by the -component_variable property. the component ids are added to the output -dataset metadata in an key named 'component_ids', and the number of components -is stored in a key named 'number_of_components'. These keys facilitate further -processing as one need not scan the labeled data to get the list of label ids. - -The cells outside of the segmentation (i.e. the background) are always assigned -the label 0. The cells belonging to connected regions inside the segmentation -are labeled starting from 1 up to number_of_components - 1. - -output keys: - - number_of_components - number of component ids found. this will always be - at least 1 long as the cells outside the segmentation - are assigned the label 0. - - component_ids - a vector containing the label of each component. This is - always starts with 0, where the label 0 identifies cells - out side of the segmentation, and ranges up to - number_of_components - 1, where the labels from 1 up to - number_of_components - 1 identify connected regions of - cells inside the segmentation. - - background_id - the label used for cells outside of the segmentation, - i.e. the background. always 0. 
+ * an algorithm that computes connected component labeling for 1D, 2D, and 3D + * data. The components are computed from a binary segmentation provided on the + * input. + * + * the input binary segmentation is labeled and stored in a variable named by the + * component_variable property. the component ids are added to the output + * dataset metadata in an key named 'component_ids', and the number of components + * is stored in a key named 'number_of_components'. These keys facilitate further + * processing as one need not scan the labeled data to get the list of label ids. + * + * The cells outside of the segmentation (i.e. the background) are always assigned + * the label 0. The cells belonging to connected regions inside the segmentation + * are labeled starting from 1 up to number_of_components - 1. + * + * output keys: + * + * | name | description | + * | ---- | ----------- | + * | number_of_components | number of component ids found. this will always be | + * | | at least 1 long as the cells outside the segmentation | + * | | are assigned the label 0. | + * | component_ids | a vector containing the label of each component. This is | + * | | always starts with 0, where the label 0 identifies cells | + * | | out side of the segmentation, and ranges up to | + * | | number_of_components - 1, where the labels from 1 up to | + * | | number_of_components - 1 identify connected regions of | + * | | cells inside the segmentation. | + * | background_id | the label used for cells outside of the segmentation, | + * | | i.e. the background. always 0. | */ class teca_connected_components : public teca_algorithm { diff --git a/alg/teca_dataset_diff.cxx b/alg/teca_dataset_diff.cxx index 3905871cb..ffa008ae5 100644 --- a/alg/teca_dataset_diff.cxx +++ b/alg/teca_dataset_diff.cxx @@ -33,7 +33,7 @@ // -------------------------------------------------------------------------- teca_dataset_diff::teca_dataset_diff() - : relative_tolerance(1.0e-6), absolute_tolerance(-1.0), verbose(1) + : relative_tolerance(1.0e-6), absolute_tolerance(-1.0) { this->set_number_of_input_connections(2); this->set_number_of_output_ports(1); @@ -54,15 +54,18 @@ void teca_dataset_diff::get_properties_description( opts.add_options() TECA_POPTS_GET(double, prefix, relative_tolerance, "relative test tolerance") TECA_POPTS_GET(double, prefix, absolute_tolerance, "absolute test tolerance") - TECA_POPTS_GET(int, prefix, verbose, "print status messages as the diff runs") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } // -------------------------------------------------------------------------- void teca_dataset_diff::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, double, prefix, relative_tolerance) TECA_POPTS_SET(opts, double, prefix, absolute_tolerance) TECA_POPTS_SET(opts, int, prefix, verbose) diff --git a/alg/teca_dataset_diff.h b/alg/teca_dataset_diff.h index 57bfffbba..881b928f6 100644 --- a/alg/teca_dataset_diff.h +++ b/alg/teca_dataset_diff.h @@ -18,16 +18,14 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_dataset_diff) /// compute the element wise difference between to datasets /** -a two input algorithm that compares datasets by examining each -element of their contained arrays. a threshold is used to detect -when an element is different. a report containing the string FAIL -is issued to stderr stream when a difference is detected. this -algorithm is the core of TECA's regression test suite. 
- -by convention the first input produces the reference dataset, -and the second input produces the dataset to validate. this is -primarilly to support map-reduce implementation where after -the reduction only rank 0 has data. + * a two input algorithm that compares datasets by examining each element of their + * contained arrays. a threshold is used to detect when an element is different. a + * report containing the string FAIL is issued to stderr stream when a difference + * is detected. this algorithm is the core of TECA's regression test suite. + * + * by convention the first input produces the reference dataset, and the second + * input produces the dataset to validate. this is primarilly to support + * map-reduce implementation where after the reduction only rank 0 has data. */ class teca_dataset_diff : public teca_algorithm { @@ -41,19 +39,24 @@ class teca_dataset_diff : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // Relative tolerance below which two floating-point numbers a and b are - // considered equal. if |a - b| <= max(|a|,|b|)*tol then a is equal to b. - // the relative tolerance is used with numbers not close to zero. + /** @name relative_tolerance + * Relative tolerance below which two floating-point numbers a and b are + * considered equal. if |a - b| <= max(|a|,|b|)*tol then a is equal to b. + * the relative tolerance is used with numbers not close to zero. + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, relative_tolerance) - - // The absolute tolerance below which two floating point numbers a and b are - // considered equal. if |a - b| <= tol then a is equal to b. The absolute - // tolerance is used with numbers close to zero. + ///@} + + /** @name absolute_tolerance + * The absolute tolerance below which two floating point numbers a and b + * are considered equal. if |a - b| <= tol then a is equal to b. The + * absolute tolerance is used with numbers close to zero. + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, absolute_tolerance) + ///@} - // if set infromation about the test progress is displayed during - // the test. 
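The two tolerances documented above combine into a simple per-element test. The following self-contained sketch restates that criterion; it illustrates the documented behavior and is not the code used inside teca_dataset_diff (in particular the absolute tolerance default here is a placeholder).

    #include <algorithm>
    #include <cmath>

    // true when a and b agree to within the documented tolerances:
    //   |a - b| <= abs_tol                  for values close to zero
    //   |a - b| <= max(|a|,|b|) * rel_tol   otherwise
    bool elements_equal(double a, double b,
        double rel_tol = 1.0e-6, double abs_tol = 1.0e-12)
    {
        double diff = std::fabs(a - b);
        return (diff <= abs_tol) ||
            (diff <= std::max(std::fabs(a), std::fabs(b))*rel_tol);
    }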
- TECA_ALGORITHM_PROPERTY(int, verbose) protected: teca_dataset_diff(); @@ -107,7 +110,6 @@ class teca_dataset_diff : public teca_algorithm private: double relative_tolerance; double absolute_tolerance; - int verbose; }; #endif diff --git a/alg/teca_derived_quantity.cxx b/alg/teca_derived_quantity.cxx index 46345bf8f..4d7f68b6e 100644 --- a/alg/teca_derived_quantity.cxx +++ b/alg/teca_derived_quantity.cxx @@ -31,12 +31,14 @@ void teca_derived_quantity::get_properties_description( + (prefix.empty()?"teca_derived_quantity":prefix)); opts.add_options() - TECA_POPTS_GET(std::vector, prefix, dependent_variables, + TECA_POPTS_MULTI_GET(std::vector, prefix, dependent_variables, "list of arrays needed to compute the derived quantity") TECA_POPTS_GET(std::string, prefix, derived_variable, "name of the derived quantity") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -44,6 +46,8 @@ void teca_derived_quantity::get_properties_description( void teca_derived_quantity::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::vector, prefix, dependent_variables) TECA_POPTS_SET(opts, std::string, prefix, derived_variable) } diff --git a/alg/teca_derived_quantity.h b/alg/teca_derived_quantity.h index 922a87691..40b7510b5 100644 --- a/alg/teca_derived_quantity.h +++ b/alg/teca_derived_quantity.h @@ -3,7 +3,7 @@ #include "teca_programmable_algorithm.h" #include "teca_metadata.h" -#include "teca_dataset_fwd.h" +#include "teca_dataset.h" #include "teca_shared_object.h" #include @@ -13,14 +13,13 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_derived_quantity) /// a programmable algorithm specialized for simple array based computations /** -A programmable algorithm specialized for simple array based -computations. A user provided callable(see set execute_callback) -which operates on one or more arrays(the dependent variables) to -produce a new array (the derived quantity). The purpose of this -class is to implement the request and report phases of the pipeline -consistently for this common use case. An implementation specific -context(operation_name) differentiates between multiple instances -in the same pipeline. + * A programmable algorithm specialized for simple array based computations. A + * user provided callable(see set execute_callback) which operates on one or more + * arrays(the dependent variables) to produce a new array (the derived quantity). + * The purpose of this class is to implement the request and report phases of the + * pipeline consistently for this common use case. An implementation specific + * context(operation_name) differentiates between multiple instances in the same +pipeline. */ class teca_derived_quantity : public teca_programmable_algorithm { diff --git a/alg/teca_derived_quantity_numerics.h b/alg/teca_derived_quantity_numerics.h index a755714d2..d5f375fae 100644 --- a/alg/teca_derived_quantity_numerics.h +++ b/alg/teca_derived_quantity_numerics.h @@ -1,21 +1,22 @@ #ifndef teca_numerics_h #define teca_numerics_h +/// @file + #include "teca_mesh.h" #include #include -// this namespace contains numeric code that could be reused -// by teca_derived_quantity +/// Numeric code that could be reused by teca_derived_quantity namespace teca_derived_quantity_numerics { -// an execute function designed for use with teca_derived_quantity -// on a teca_mesh. shallow copies the input and computes the -// point-wise average of the named variables. 
-// -// for every i -// avg[i] = (v0[i] + v1[i])/2 -// +/** an execute function designed for use with teca_derived_quantity + * on a teca_mesh. shallow copies the input and computes the + * point-wise average of the named variables. + * + * for every i + * avg[i] = (v0[i] + v1[i])/2 + */ struct point_wise_average { // construct the class with two input array names, v0,v1 @@ -70,12 +71,12 @@ struct point_wise_average std::string m_avg; // output variable name }; -// an execute function designed for use with teca_derived_quantity -// on a teca_mesh. compute the point-wise difference of two variables -// -// for every i -// diff[i] = v1[i] - v0[i] -// +/** an execute function designed for use with teca_derived_quantity + * on a teca_mesh. compute the point-wise difference of two variables + * + * for every i + * diff[i] = v1[i] - v0[i] + */ struct point_wise_difference { // construct the class with two input array names, v0,v1 diff --git a/alg/teca_descriptive_statistics.cxx b/alg/teca_descriptive_statistics.cxx index 2c7794f0a..042684228 100644 --- a/alg/teca_descriptive_statistics.cxx +++ b/alg/teca_descriptive_statistics.cxx @@ -128,7 +128,7 @@ void teca_descriptive_statistics::get_properties_description( + (prefix.empty()?"teca_descriptive_statistics":prefix)); opts.add_options() - TECA_POPTS_GET(std::vector, prefix, dependent_variables, + TECA_POPTS_MULTI_GET(std::vector, prefix, dependent_variables, "list of arrays to compute statistics for") ; diff --git a/alg/teca_descriptive_statistics.h b/alg/teca_descriptive_statistics.h index b426dca64..416476c1e 100644 --- a/alg/teca_descriptive_statistics.h +++ b/alg/teca_descriptive_statistics.h @@ -12,8 +12,8 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_descriptive_statistics) /// compute descriptive statistics over a set of arrays. /** -compute the min, max, avg, median, standard deviation of a -set of named arrays. the results are returned in a table. + * compute the min, max, avg, median, standard deviation of a set of named + * arrays. the results are returned in a table. */ class teca_descriptive_statistics : public teca_algorithm { diff --git a/alg/teca_elevation_mask.cxx b/alg/teca_elevation_mask.cxx new file mode 100644 index 000000000..bc662a313 --- /dev/null +++ b/alg/teca_elevation_mask.cxx @@ -0,0 +1,384 @@ +#include "teca_elevation_mask.h" + +#include "teca_cartesian_mesh.h" +#include "teca_array_collection.h" +#include "teca_variant_array.h" +#include "teca_metadata.h" +#include "teca_array_attributes.h" + +#include "teca_dataset_source.h" +#include "teca_dataset_capture.h" +#include "teca_cartesian_mesh_regrid.h" +#include "teca_index_executive.h" + +#include +#include +#include +#include +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +//#define TECA_DEBUG + +struct teca_elevation_mask::internals_t +{ + // compute the valid value mask such that for each point the mask + // is 1 where the mesh point is above the surface of the Earth and + // 0 otherwise + template + static void mask_by_surface_elevation( + size_t nx, size_t ny, size_t nz, + mask_t * __restrict__ mask, + const elev_num_t * __restrict__ surface_elev, + const mesh_num_t * __restrict__ mesh_height) + { + size_t nxy = nx*ny; + for (size_t k = 0; k < nz; ++k) + { + const mesh_num_t * __restrict__ mesh_height_k = mesh_height + k*nxy; + mask_t * __restrict__ mask_k = mask + k*nxy; + for (size_t q = 0; q < nxy; ++q) + { + mask_k[q] = mesh_height_k[q] >= (mesh_num_t)surface_elev[q] ? 
mask_t(1) : mask_t(0); + } + } + } +}; + + +// -------------------------------------------------------------------------- +teca_elevation_mask::teca_elevation_mask() : + mesh_height_variable("zg"), surface_elevation_variable("z") +{ + this->set_number_of_input_connections(2); + this->set_number_of_output_ports(1); +} + +// -------------------------------------------------------------------------- +teca_elevation_mask::~teca_elevation_mask() +{ +} + +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_elevation_mask::get_properties_description( + const std::string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_elevation_mask":prefix)); + + opts.add_options() + + TECA_POPTS_GET(std::string, prefix, surface_elevation_variable, + "Set the name of the variable containing surface elevation" + " values in meters above mean sea level") + + TECA_POPTS_GET(std::string, prefix, mesh_height_variable, + "Set the name of the variable containing point wise mesh height" + " values in meters above mean sea level") + + TECA_POPTS_MULTI_GET(std::vector, prefix, mask_variables, + "Set the names of the variables to store the generated mask in." + " Each name is assigned a reference to the mask.") + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_elevation_mask::set_properties( + const std::string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, std::string, prefix, surface_elevation_variable) + TECA_POPTS_SET(opts, std::string, prefix, mesh_height_variable) + TECA_POPTS_SET(opts, std::vector, prefix, mask_variables) +} +#endif + +// -------------------------------------------------------------------------- +teca_metadata teca_elevation_mask::get_output_metadata( + unsigned int port, + const std::vector &input_md) +{ +#ifdef TECA_DEBUG + cerr << teca_parallel_id() + << "teca_elevation_mask::get_output_metadata" << endl; +#endif + (void)port; + + // validate runtime provided settings + unsigned int n_mask_vars = this->mask_variables.size(); + if (n_mask_vars == 0) + { + TECA_ERROR("The names of the mask_variables were not provided") + return teca_metadata(); + } + + // pass metadata from the input mesh through. + const teca_metadata &mesh_md = input_md[0]; + teca_metadata out_md(mesh_md); + + // add the mask arrays we will generate + for (unsigned int i = 0; i < n_mask_vars; ++i) + out_md.append("variables", this->mask_variables[i]); + + // insert attributes to enable this to be written by the CF writer + teca_metadata attributes; + out_md.get("attributes", attributes); + + teca_metadata mesh_height_atts; + if (attributes.get(this->mesh_height_variable, mesh_height_atts)) + { + TECA_WARNING("Failed to get mesh_height_variable \"" + << this->mesh_height_variable << "\" attrbibutes." 
+ " Writing the result will not be possible") + } + else + { + // get the centering and size from the array + unsigned int centering = 0; + mesh_height_atts.get("centering", centering); + + unsigned long size = 0; + mesh_height_atts.get("size", size); + + // construct output attributes + teca_array_attributes mask_atts( + teca_variant_array_code::get(), + centering, size, "none", "", "elevation mask"); + + // add one for each output + for (unsigned int i = 0; i < n_mask_vars; ++i) + attributes.set(this->mask_variables[i], (teca_metadata)mask_atts); + + // update the attributes collection + out_md.set("attributes", attributes); + } + + return out_md; +} + +// -------------------------------------------------------------------------- +std::vector teca_elevation_mask::get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) +{ + (void)port; + (void)input_md; + + std::vector up_reqs; + + // get the names of the arrays we need to request + if (this->mesh_height_variable.empty()) + { + TECA_ERROR("The mesh_height_variable was not specified") + return up_reqs; + } + + if (this->surface_elevation_variable.empty()) + { + TECA_ERROR("The surface_elevation_variable was not specified") + return up_reqs; + } + + // need to make the request for the surface elevation field using bounds + double req_bounds[6] = {0.0}; + if (request.get("bounds", req_bounds, 6)) + { + // bounds not specified, try to get an extent and convert to a bounds + unsigned long req_extent[6]; + if (request.get("extent", req_extent, 6)) + { + TECA_ERROR("Neither bounds nor extent were specified in the request") + return up_reqs; + } + + const teca_metadata &md = input_md[0]; + + teca_metadata coords; + p_teca_variant_array x,y; + + if (md.get("coordinates", coords) || + !(x = coords.get("x")) || !(y = coords.get("y"))) + { + TECA_ERROR("Failed to get mesh coordinates") + return up_reqs; + } + + x->get(req_extent[0], req_bounds[0]); + x->get(req_extent[1], req_bounds[1]); + y->get(req_extent[2], req_bounds[2]); + y->get(req_extent[3], req_bounds[3]); + } + + // input port 0 will source the mesh height field, and any other data + // requested by the down stream. 
copy the incoming request to preserve the + // downstream requirements and add the mesh height variable + teca_metadata req_0(request); + + std::set mesh_arrays; + if (req_0.has("arrays")) + req_0.get("arrays", mesh_arrays); + + mesh_arrays.insert(this->mesh_height_variable); + + // intercept request for our output + int n_mask_vars = this->mask_variables.size(); + for (int i = 0; i < n_mask_vars; ++i) + mesh_arrays.erase(this->mask_variables[i]); + + req_0.set("arrays", mesh_arrays); + + + // input port 1 provides the surface elevation field, request it + // preserve bounds etc + const teca_metadata &elev_md = input_md[1]; + + std::string req_key; + if (elev_md.get("index_request_key", req_key)) + { + TECA_ERROR("Metadata is missing \"index_request_key\"") + return up_reqs; + } + + // surface elevations don't change over the timescale of concern + // always request index 0 + teca_metadata req_1; + req_1.set(req_key, 0ul); + req_1.set("index_request_key", req_key); + + // request the surface elevation + std::vector elev_arrays(1, this->surface_elevation_variable); + req_1.set("arrays", elev_arrays); + + // at the bounds of interest + req_1.set("bounds", req_bounds, 6); + + // package the requests and send them up + up_reqs.push_back(req_0); + up_reqs.push_back(req_1); + + + return up_reqs; +} + +// -------------------------------------------------------------------------- +const_p_teca_dataset teca_elevation_mask::execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + cerr << teca_parallel_id() << "teca_elevation_mask::execute" << endl; +#endif + (void)port; + (void)request; + + // check for an error upstream + if ((input_data.size() != 2) || !input_data[0] || !input_data[1]) + { + TECA_ERROR("Invalid inputs detected") + return nullptr; + } + + // get the input 3D mesh + const_p_teca_cartesian_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); + + if (!in_mesh) + { + TECA_ERROR("Data to mask on input port 0 is not a" + " teca_cartesian_mesh. Got " << input_data[0]->get_class_name()) + return nullptr; + } + + // get the mesh dimensions + unsigned long extent[6]; + in_mesh->get_extent(extent); + + unsigned long nx = extent[1] - extent[0] + 1; + unsigned long ny = extent[3] - extent[2] + 1; + unsigned long nz = extent[5] - extent[4] + 1; + + // get the mesh height, this is a 3d field with the altitude for + // each mesh point + const_p_teca_variant_array mesh_height = + in_mesh->get_point_arrays()->get(this->mesh_height_variable); + + if (!mesh_height) + { + TECA_ERROR("Mesh to mask is missing the height field \"" + << this->mesh_height_variable << "\"") + return nullptr; + } + + // get the surface elevations + const_p_teca_cartesian_mesh in_elev + = std::dynamic_pointer_cast(input_data[1]); + + if (!in_elev) + { + TECA_ERROR("Data to mask on input port 0 is not a" + " teca_cartesian_mesh. Got " << input_data[0]->get_class_name()) + return nullptr; + } + + // get the surface elevation, this is a 2d field with surface altitude + // + // at each mesh point. 
regridding has been performed so that the horizontal + // coordinates are the same as the 3d mesh for which masks will be generated + const_p_teca_variant_array surface_elev = + in_elev->get_point_arrays()->get(this->surface_elevation_variable); + + if (!surface_elev) + { + TECA_ERROR("Surface elevation data has no array \"" + << this->surface_elevation_variable << "\"") + return nullptr; + } + + // compute the mask + p_teca_char_array mask = teca_char_array::New(mesh_height->size()); + char *p_mask = mask->get(); + + NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, + surface_elev.get(), + _SURF, + + const NT_SURF *p_surface_elev = + static_cast(surface_elev.get())->get(); + + NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, + mesh_height.get(), + _MESH, + + const NT_MESH *p_mesh_height = + static_cast(mesh_height.get())->get(); + + internals_t::mask_by_surface_elevation(nx, ny, nz, + p_mask, p_surface_elev, p_mesh_height); + + ) + ) + + // allocate the output mesh + p_teca_cartesian_mesh out_mesh = std::dynamic_pointer_cast + (std::const_pointer_cast(in_mesh)->new_shallow_copy()); + + // store the results under the requested names + int n_mask_vars = this->mask_variables.size(); + for (int i = 0; i < n_mask_vars; ++i) + { + out_mesh->get_point_arrays()->set(this->mask_variables[i], mask); + } + + return out_mesh; +} diff --git a/alg/teca_elevation_mask.h b/alg/teca_elevation_mask.h new file mode 100644 index 000000000..fea8a7fbf --- /dev/null +++ b/alg/teca_elevation_mask.h @@ -0,0 +1,115 @@ +#ifndef teca_elevation_mask_h +#define teca_elevation_mask_h + +#include "teca_shared_object.h" +#include "teca_algorithm.h" +#include "teca_metadata.h" + +#include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_elevation_mask) + +/** @brief + * Generates a mask indicating where mesh points with a vertical pressure + * coordinate lie above the surface of the Earth. The mask is set to 1 where + * data is above the Earth's surface and 0 otherwise. + * + * @details + * Given a 3D height field containing the altitude of each point in meters + * above mean sea level, and a 2D height field corresponding to height in + * meters above mean sea level of the surface of the Earth, generate a mask + * that is 1 where the 3D point is on or above the surface of the Earth and 0 + * where it is below. + * + * The name of the 3D height field is specified by the mesh_height_variable + * property. The name of the 2D height field conntaining elveation of the + * Earth's surface is specified by the surface_elevation_variable property. + * + * The 3D mesh height field must be provided on input 0, and the 2D surface + * height field on input 1. Use the mask_names property to name the output + * mask. If more than one name is provided each name will reference a pointer + * to the mask. Consider using names of the form X_valid in which case the + * output is compatible with the teca_valid_value_mask and will be treated + * as missing values by down stream algorithms. + * + * If the simulation does not provide the 3D height field, for simulations + * where the acceleration due to the Earth's gravity is assumed constant, + * teca_geopotential_height can generate the 3D height field. + * + * The primary use case of this algorithm is when dealing with calculations on + * 3D meshes with a vertical pressure coordinate and there is a need to + * identify and treat specially the mesh points that are below the surface of + * the Earth. There are a number of alternatives available depending on the + * data. 
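The alternatives mentioned here are enumerated in the sentences that follow. For the primary use case, a hedged wiring sketch: 3D data carrying the geopotential height field on input 0 and a surface elevation field, already regridded to the same horizontal coordinates, on input 1. The upstream stages and the generated property setter names are assumptions based on the rest of this patch rather than verbatim API.

    p_teca_elevation_mask mask = teca_elevation_mask::New();
    mask->set_input_connection(0, mesh_reader->get_output_port());    // 3D fields incl. "zg"
    mask->set_input_connection(1, surface_regrid->get_output_port()); // 2D surface elevation "z"
    mask->set_mesh_height_variable("zg");
    mask->set_surface_elevation_variable("z");

    // naming the masks X_valid makes the output compatible with the
    // teca_valid_value_mask convention described above
    mask->set_mask_variables({"ua_valid", "va_valid"});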
If your data has a _FillValue where data is below the surface then + * use teca_valid_value_mask instead of this algorithm. If your data has + * surface pressure field use teca_pressure_level_mask instead of this + * algorithm. If your dataset has surface temperature, and mean sea level + * pressure fields then use teca_surface_pressure to generate the surface + * pressure field and use teca_pressure_level_mask instead of this algorithm. + */ +class teca_elevation_mask : public teca_algorithm +{ +public: + TECA_ALGORITHM_STATIC_NEW(teca_elevation_mask) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_elevation_mask) + TECA_ALGORITHM_CLASS_NAME(teca_elevation_mask) + ~teca_elevation_mask(); + + /** @name program_options + * report/initialize to/from Boost program options objects. + */ + ///@{ + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + ///@} + + /** @name mesh_height_variable + * Set the name of the 3D height field + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, mesh_height_variable) + ///@} + + /** @name surface_elevation_variable + * Set the name of the variable containing the elevation of the Earth's + * surface. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, surface_elevation_variable) + ///@} + + /** @name mask_variables + * set the names of the variables to store the generated mask in + * each variable will contain a reference to the mask + */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(std::string, mask_variable) + ///@} + +protected: + teca_elevation_mask(); + +private: + teca_metadata get_output_metadata( + unsigned int port, + const std::vector &input_md) override; + + std::vector get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) override; + + const_p_teca_dataset execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) override; + +private: + std::string mesh_height_variable; + std::string surface_elevation_variable; + std::vector mask_variables; + struct internals_t; +}; + +#endif diff --git a/alg/teca_evaluate_expression.cxx b/alg/teca_evaluate_expression.cxx index 69f485a30..4a1948321 100644 --- a/alg/teca_evaluate_expression.cxx +++ b/alg/teca_evaluate_expression.cxx @@ -18,7 +18,7 @@ #include #endif #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #if defined(TECA_HAS_MPI) #include @@ -59,6 +59,8 @@ void teca_evaluate_expression::get_properties_description( "when set columns used in the calculation are removed from output") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -66,6 +68,8 @@ void teca_evaluate_expression::get_properties_description( void teca_evaluate_expression::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, expression) TECA_POPTS_SET(opts, std::string, prefix, result_variable) TECA_POPTS_SET(opts, int, prefix, remove_dependent_variables) diff --git a/alg/teca_evaluate_expression.h b/alg/teca_evaluate_expression.h index 91ce9b9f1..afbe546b6 100644 --- a/alg/teca_evaluate_expression.h +++ b/alg/teca_evaluate_expression.h @@ -10,23 +10,24 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_evaluate_expression) -/** -An algorithm that evaluates an expression stores the -result in a new variable. - -the expression parser supports the following operations: - +,-,*,/,%,<.<=,>,>=,==,!=,&&,||.!,? 
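The parser description continues just below. As a small illustration of the typed constants it documents, a hedged configuration sketch using only setters declared later in this header; the variable names and the upstream reader are placeholders.

    p_teca_evaluate_expression expr = teca_evaluate_expression::New();
    expr->set_input_connection(reader->get_output_port());

    // 32 bit float constants, per the 'f' type code documented here
    expr->set_expression("(wind_speed_850 >= 17.f) && (vorticity_850 > 0.f)");
    expr->set_result_variable("gale_mask");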
- -grouping in the expression is denoted in the usual -way: () - -constants in the expression are expanded to full length -arrays and can be typed. The supported types are: - d,f,L,l,i,s,c -coresponding to double,float,long long, long, int, -short and char repsectively. integer types can be -unsigned by including u after the code. -*/ +/** @brief + * An algorithm that evaluates an expression stores the + * result in a new variable. + * + * @details + * The expression parser supports the following operations: + * +,-,*,/,%,<.<=,>,>=,==,!=,&&,||.!,? + * + * Grouping in the expression is denoted in the usual + * way: () + * + * Constants in the expression are expanded to full length + * arrays and can be typed. The supported types are: + * d,f,L,l,i,s,c + * Corresponding to double,float, long long, long, int, + * short and char respectively. Integer types can be + * unsigned by including u after the code. + */ class teca_evaluate_expression : public teca_algorithm { public: @@ -40,18 +41,32 @@ class teca_evaluate_expression : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set/get the expression to evaluate + /** @name expression + * Set the expression to evaluate. + */ + ///@{ + /// Set the expression. void set_expression(const std::string &expr); + /// Get the expression. std::string get_expression() { return this->expression; } - - // set the name of the variable to store the result in - TECA_ALGORITHM_PROPERTY(std::string, result_variable); - - // when set columns used in the calculation are removed - // from the output. deault off. + ///@} + + /** @name result_variable + * set the name of the variable to store the result in + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, result_variable) + ///@} + + /** @name remove_dependent_variables + * when set columns used in the calculation are removed from the output. + * default off. + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, remove_dependent_variables) + ///@} protected: teca_evaluate_expression(); diff --git a/alg/teca_face_to_cell_centering.cxx b/alg/teca_face_to_cell_centering.cxx index 993df96c4..6e6f5c939 100644 --- a/alg/teca_face_to_cell_centering.cxx +++ b/alg/teca_face_to_cell_centering.cxx @@ -128,26 +128,26 @@ teca_face_to_cell_centering::~teca_face_to_cell_centering() void teca_face_to_cell_centering::get_properties_description( const string &prefix, options_description &global_opts) { - (void)prefix; - (void)global_opts; - /*options_description opts("Options for " + options_description opts("Options for " + (prefix.empty()?"teca_face_to_cell_centering":prefix)); - opts.add_options() + /*opts.add_options() TECA_POPTS_GET(int, prefix, mode, - "transform mode (mode_wrf_v3)") - ; + "Set the coordinate transform mode. 
The valid modes" + " are: mode_wrf_v3)") + ;*/ - global_opts.add(opts);*/ + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); } // -------------------------------------------------------------------------- void teca_face_to_cell_centering::set_properties( const string &prefix, variables_map &opts) { - (void)prefix; - (void)opts; //TECA_POPTS_SET(opts, int, prefix, mode) + this->teca_algorithm::set_properties(prefix, opts); } #endif diff --git a/alg/teca_face_to_cell_centering.h b/alg/teca_face_to_cell_centering.h index 563c9ae1f..458b7f9f0 100644 --- a/alg/teca_face_to_cell_centering.h +++ b/alg/teca_face_to_cell_centering.h @@ -10,10 +10,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_face_to_cell_centering) -/// an algorithm that transforms vertical cooridinates -/** -An algorithm that transforms vertical coordinates of a mesh. -*/ +/// An algorithm that transforms from face to cell centering class teca_face_to_cell_centering : public teca_algorithm { public: diff --git a/alg/teca_geography.h b/alg/teca_geography.h index 1e1d35401..59592018b 100644 --- a/alg/teca_geography.h +++ b/alg/teca_geography.h @@ -1,48 +1,48 @@ #ifndef teca_geography_h #define teca_geography_h +/// @file + #include #include +/// Codes for dealing with geography namespace teca_geography { -/** -get the number of cyclone basins. cyclone basin ids are -in the range 0 to number of basins - 1. +/** get the number of cyclone basins. cyclone basin ids are + * in the range 0 to number of basins - 1. */ unsigned long get_number_of_cyclone_basins(); /** -get the unique list of names describing available cyclone basins. -the list can be indexed by the ids returned by the -get_cyclone_basin/s functions. + * get the unique list of names describing available cyclone basins. + * the list can be indexed by the ids returned by the + * get_cyclone_basin/s functions. */ void get_cyclone_basin_names(std::vector &names, std::vector &long_names); -/** -load polygons describing the cyclone basins used by TECA - -upon return: - - sizes array has been appended with the size of each basin - starts array has been appended with the starting index of - each basin's coordinates - x/y_coordinates have been appended with the coordinates - ids array has been appended with the basin id - -some basins are comprised of multiple polygons because -they split over the periodic boundary. hence the ids array -is used to identify a basin. +/** load polygons describing the cyclone basins used by TECA + * + * upon return: + * + * sizes array has been appended with the size of each basin + * starts array has been appended with the starting index of + * each basin's coordinates + * x/y_coordinates have been appended with the coordinates + * ids array has been appended with the basin id + * + * some basins are comprised of multiple polygons because + * they split over the periodic boundary. hence the ids array + * is used to identify a basin. */ void get_cyclone_basins(std::vector &sizes, std::vector &starts, std::vector &x_coordinates, std::vector &y_coordinates, std::vector &ids, std::vector &names, std::vector &long_names); -/** -load a cylcone basin by name. Either the short or long name -can be used. see get_cyclone_basin_names. +/** load a cyclone basin by name. Either the short or long name + * can be used. see get_cyclone_basin_names. 
*/ int get_cyclone_basin(const std::string &rname, std::vector &sizes, std::vector &starts, @@ -50,9 +50,8 @@ int get_cyclone_basin(const std::string &rname, std::vector &ids, std::vector &names, std::vector &long_names); -/** -load a cyclone basin by it's region id. region ids must be in the range -of 0 to get_number_of_cylone_basins() - 1. +/** load a cyclone basin by it's region id. region ids must be in the range + * of 0 to get_number_of_cyclone_basins() - 1. */ int get_cyclone_basin(unsigned int rid, std::vector &sizes, std::vector &starts, diff --git a/alg/teca_geometry.h b/alg/teca_geometry.h index bb7306948..d096faff9 100644 --- a/alg/teca_geometry.h +++ b/alg/teca_geometry.h @@ -1,9 +1,12 @@ #ifndef teca_geometry_h #define teca_geometry_h +/// @file + +/// Codes dealing with computational geometry namespace teca_geometry { -// tests if a point is Left|On|Right of an infinite line. +/// tests if a point is Left|On|Right of an infinite line. template bool left(n_t e0x, n_t e0y, n_t e1x, n_t e1y, n_t px, n_t py) { @@ -14,8 +17,9 @@ bool left(n_t e0x, n_t e0y, n_t e1x, n_t e1y, n_t px, n_t py) ((e1x - e0x)*(py - e0y) - (px - e0x)*(e1y - e0y)) >= n_t(); } -// winding number test for a point in a polygon -// winding number is 0 when the point is outside. +/** Winding number test for a point in a polygon. The winding number is 0 when + * the point is outside. + */ template bool point_in_poly(n_t px, n_t py, n_t *vx, n_t *vy, unsigned long nppts) diff --git a/alg/teca_indexed_dataset_cache.cxx b/alg/teca_indexed_dataset_cache.cxx new file mode 100644 index 000000000..f907edc00 --- /dev/null +++ b/alg/teca_indexed_dataset_cache.cxx @@ -0,0 +1,351 @@ +#include "teca_indexed_dataset_cache.h" + +#include "teca_metadata.h" +#include "teca_priority_queue.h" + +#include +#include +#include +#include + +#include +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +//#define TECA_DEBUG + +struct cache_entry +{ + cache_entry() : m_data(nullptr), m_keep(1) {} + + std::mutex m_mutex; // for access to the cache and time + std::condition_variable m_cond; // use to wait for another thread to provide the data + const_p_teca_dataset m_data; // the dataset + unsigned long m_keep; // when 0 safe to delete the element +}; + +using p_cache_entry = std::shared_ptr; + +using index_t = unsigned long; +using priority_t = unsigned long; + +using data_map_t = std::map; +using use_map_t = std::map; + +using heap_t = teca_priority_queue, // to look up priorities + std::less<>, // heapify by smallest + mapped_key_t>; // location tracking container + +using p_heap_t = std::shared_ptr; + +struct teca_indexed_dataset_cache::internals_t +{ + internals_t() : m_current_time(0) + { + mapped_key_priority priority_lookup(m_time_used); + m_heap = heap_t::New(priority_lookup); + } + + std::mutex m_mutex; // for access to the following + p_heap_t m_heap; // heap with least recently used dataset at the top + use_map_t m_time_used; // the use time of each cached dataset + data_map_t m_data; // cached data + priority_t m_current_time; // the current time of use +}; + + +// -------------------------------------------------------------------------- +teca_indexed_dataset_cache::teca_indexed_dataset_cache() : + max_cache_size(0), internals(new internals_t) +{ + this->set_number_of_input_connections(1); + this->set_number_of_output_ports(1); +} + +// -------------------------------------------------------------------------- +teca_indexed_dataset_cache::~teca_indexed_dataset_cache() +{ + delete this->internals; +} + +#if 
defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_indexed_dataset_cache::get_properties_description( + const std::string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_indexed_dataset_cache":prefix)); + + opts.add_options() + + TECA_POPTS_GET(unsigned long, prefix, max_cache_size, + "Sets the maximum number of datasets to cache.") + + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_indexed_dataset_cache::set_properties( + const std::string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, unsigned long, prefix, max_cache_size) +} +#endif + +// -------------------------------------------------------------------------- +void teca_indexed_dataset_cache::clear_cache() +{ + { + std::lock_guard lock(this->internals->m_mutex); + this->internals->m_heap->clear(); + this->internals->m_time_used.clear(); + this->internals->m_data.clear(); + this->internals->m_current_time = 0; + } +} + +// -------------------------------------------------------------------------- +std::vector teca_indexed_dataset_cache::get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_indexed_dataset_cache::get_upstream_request" << std::endl; +#endif + (void)port; + (void)input_md; + + std::vector up_reqs; + + // force the user to set the cache size + if (this->max_cache_size == 0) + { + TECA_ERROR("max_cache_size is 0, you must set the" + " cache size before use.") + return up_reqs; + } + + // get the requested index + std::string request_key; + if (request.get("index_request_key", request_key)) + { + TECA_ERROR("Failed to locate the index_request_key") + return up_reqs; + } + + index_t index = 0; + if (request.get(request_key, index)) + { + TECA_ERROR("Failed to get the requested index using the" + " index_request_key \"" << request_key << "\"") + return up_reqs; + } + + { + std::lock_guard lock(this->internals->m_mutex); + + // is this index in the cache? 
+ if (this->internals->m_time_used.count(index)) + { + // yes, update the use time + this->internals->m_time_used[index] = ++this->internals->m_current_time; + this->internals->m_heap->modified(index); + + // make a note that it needs to be served one more time before + // it can be removed + p_cache_entry elem = this->internals->m_data[index]; + + { + std::lock_guard elock(elem->m_mutex); + ++elem->m_keep; + } + +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "update entry " << index + << " keep=" << elem->m_keep << std::endl; +#endif + return up_reqs; + } + + // no, not in cache + // set the use time and put in the heap + this->internals->m_time_used[index] = ++this->internals->m_current_time; + this->internals->m_heap->push(index); + + // add an empty cache enrty + this->internals->m_data[index] = std::make_shared(); + +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "add entry " << index << " " + << this->internals->m_current_time << std::endl; +#endif + } + + // generate the request for this index + up_reqs.push_back(request); + return up_reqs; +} + +// -------------------------------------------------------------------------- +const_p_teca_dataset teca_indexed_dataset_cache::execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_indexed_dataset_cache::execute" << std::endl; +#endif + (void)port; + + // get the requested index + std::string request_key; + if (request.get("index_request_key", request_key)) + { + TECA_ERROR("Failed to locate the index_request_key") + return nullptr; + } + + index_t index = 0; + if (request.get(request_key, index)) + { + TECA_ERROR("Failed to get the requested index using the" + " index_request_key \"" << request_key << "\"") + return nullptr; + } + + const_p_teca_dataset data_out; + + // get the cache element associated with the requested index + p_cache_entry elem; + { + std::lock_guard lock(this->internals->m_mutex);; + data_map_t::iterator it = this->internals->m_data.find(index); + if (it == this->internals->m_data.end()) + { + TECA_ERROR("The cache is in an invalid state") + return nullptr; + } + elem = it->second; + } + + if (input_data.size()) + { + // add new data to the cache + { + std::lock_guard elock(elem->m_mutex); + elem->m_data = input_data[0]; + --elem->m_keep; + } + // notify other threads that may be waiting for this data + elem->m_cond.notify_all(); +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "add data " << index + << " keep=" << elem->m_keep << std::endl; +#endif + } + else + { + // fetch existing data from the cache + if (!elem->m_data) + { + // data is not yet ready, it will be provided by another thread + std::unique_lock elock(elem->m_mutex); + if (!elem->m_data) + { + // data is not ready wait for another thread to provide + elem->m_cond.wait(elock, [&]{ return bool(elem->m_data); }); + --elem->m_keep; + } + } + else + { + // data is ready + std::lock_guard elock(elem->m_mutex); + --elem->m_keep; + } +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "use data " << index + << " keep=" << elem->m_keep << std::endl; +#endif + } + + // return the dataset + data_out = elem->m_data; + + // enforce the max cache size + { + std::lock_guard lock(this->internals->m_mutex); + unsigned long n_cached = this->internals->m_time_used.size(); + if (n_cached > this->max_cache_size) + { +#ifdef TECA_DEBUG + std::cerr << "cache too large " << n_cached << std::endl; + 
this->internals->m_heap->to_stream(std::cerr, false); +#endif + // might have to save some elements if they haven't been served yet + std::vector save; + save.reserve(n_cached); + + unsigned long n_to_rm = n_cached - this->max_cache_size; + + // make one pass over the cache in lru order, or stop if we find + // enough elements that can be deleted + for (unsigned long i = 0; n_to_rm && (i < n_cached); ++i) + { + index_t idx = this->internals->m_heap->pop(); + + p_cache_entry elem = this->internals->m_data[idx]; + + // have all requests for the data been served? + unsigned long keep = 0; + { + std::lock_guard elock(elem->m_mutex); + keep = elem->m_keep; + } + if (keep) + { + // no, delete later + save.push_back(idx); +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "save " + << idx << " keep=" << keep << std::endl; +#endif + } + else + { + // yes, delete now + this->internals->m_data.erase(idx); + this->internals->m_time_used.erase(idx); + --n_to_rm; +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "evict " + << idx << std::endl; +#endif + } + } + + // put elements we couldn't remove because they haven't been + // served yet back on the heap + unsigned long n = save.size(); + for (unsigned long i = 0; i < n; ++i) + { + this->internals->m_heap->push(save[i]); + } + } + } + + return data_out; +} diff --git a/alg/teca_indexed_dataset_cache.h b/alg/teca_indexed_dataset_cache.h new file mode 100644 index 000000000..d7863c7d6 --- /dev/null +++ b/alg/teca_indexed_dataset_cache.h @@ -0,0 +1,65 @@ +#ifndef teca_indexed_dataset_cache_h +#define teca_indexed_dataset_cache_h + +#include "teca_shared_object.h" +#include "teca_algorithm.h" +#include "teca_metadata.h" + +#include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_indexed_dataset_cache) + +/// Caches N datasets such that repeated requests for the same dataset are served from the cache +/** + * A cache storing up to N datasets. Datasets are identified using their + * request index. Repeated requests for the same dataset (ie same index) are + * served from the cache. When more than N unique datasets have been requested + * the cache is modified such that the least recently used dataset is replaced. + */ +class teca_indexed_dataset_cache : public teca_algorithm +{ +public: + TECA_ALGORITHM_STATIC_NEW(teca_indexed_dataset_cache) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_indexed_dataset_cache) + TECA_ALGORITHM_CLASS_NAME(teca_indexed_dataset_cache) + ~teca_indexed_dataset_cache(); + + // report/initialize to/from Boost program options + // objects. + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + + /** @name max_cache_size + * Set the max number of datasets to cache. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(unsigned long, max_cache_size) + ///@} + + /// clear any cached data. 
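A hedged usage sketch of the cache declared here; the surrounding reader and consumer stages and the cache size of 32 are illustrative assumptions, not part of this patch.

    // illustrative only -- not from the patch
    p_teca_indexed_dataset_cache cache = teca_indexed_dataset_cache::New();
    cache->set_input_connection(reader->get_output_port());
    cache->set_max_cache_size(32); // must be set to a non-zero value before use
    consumer->set_input_connection(cache->get_output_port());
    // the first request for a given index is forwarded upstream; subsequent
    // requests for the same index are served from the cache until the entry
    // is evicted as the least recently used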
+ void clear_cache(); + +protected: + teca_indexed_dataset_cache(); + +private: + + std::vector get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) override; + + const_p_teca_dataset execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) override; + +private: + unsigned long max_cache_size; + + struct internals_t; + internals_t *internals; +}; + +#endif diff --git a/alg/teca_integrated_vapor_transport.cxx b/alg/teca_integrated_vapor_transport.cxx index 39f2fd5f2..01405eaa1 100644 --- a/alg/teca_integrated_vapor_transport.cxx +++ b/alg/teca_integrated_vapor_transport.cxx @@ -156,15 +156,17 @@ void teca_integrated_vapor_transport::get_properties_description( opts.add_options() TECA_POPTS_GET(std::string, prefix, wind_u_variable, - "name of the variable containg the lon component of the wind vector (ua)") + "name of the variable containg the lon component of the wind vector") TECA_POPTS_GET(std::string, prefix, wind_v_variable, - "name of the variable containg the lat component of the wind vector (va)") - TECA_POPTS_GET(std::string, prefix, specific_humidty_variable, - "name of the variable containg the specific humidity (hus)") + "name of the variable containg the lat component of the wind vector") + TECA_POPTS_GET(std::string, prefix, specific_humidity_variable, + "name of the variable containg the specific humidity") TECA_POPTS_GET(double, prefix, fill_value, - "the value of the NetCDF _FillValue attribute (1e20)") + "the value of the NetCDF _FillValue attribute") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -172,6 +174,8 @@ void teca_integrated_vapor_transport::get_properties_description( void teca_integrated_vapor_transport::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, wind_u_variable) TECA_POPTS_SET(opts, std::string, prefix, wind_v_variable) TECA_POPTS_SET(opts, std::string, prefix, specific_humidity_variable) @@ -419,5 +423,22 @@ const_p_teca_dataset teca_integrated_vapor_transport::execute( ) ) + // pass 2D arrays through. + p_teca_array_collection in_arrays = + std::const_pointer_cast(in_mesh->get_point_arrays()); + + p_teca_array_collection out_arrays = out_mesh->get_point_arrays(); + + int n_arrays = in_arrays->size(); + for (int i = 0; i < n_arrays; ++i) + { + p_teca_variant_array array = in_arrays->get(i); + if (array->size() == nxy) + { + // pass the array. + out_arrays->append(in_arrays->get_name(i), array); + } + } + return out_mesh; } diff --git a/alg/teca_integrated_vapor_transport.h b/alg/teca_integrated_vapor_transport.h index 44bd896a4..4ce7649a7 100644 --- a/alg/teca_integrated_vapor_transport.h +++ b/alg/teca_integrated_vapor_transport.h @@ -10,19 +10,21 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_integrated_vapor_transport) -/// an algorithm that computes integrated vapor transport (IVT) +/// An algorithm that computes integrated vapor transport (IVT) /** -Compute integrated vaport transport (IVT) from wind vector and -specific humidity. - -IVT = - \frac{1}{g} \int_{p_0}^{p_1} \vec{v} q dp - -where q is the specific humidity, and \vec{v} = (u, v) are the -longitudinal and latitudinal components of wind. - -This calculation is an instance of a vertical reduction where -a 3D mesh is transformed into a 2D one. -*/ + * Compute integrated vapor transport (IVT) from wind vector and + * specific humidity. 
+ * + * \f[ + * IVT = \frac{1}{g} \int_{p_{sfc}}^{p_{top}} \vec{v} q dp + * \f] + * + * where q is the specific humidity, and \f$\vec{v} = (u, v)\f$ are the + * longitudinal and latitudinal components of wind. + * + * This calculation is an instance of a vertical reduction where + * a 3D mesh is transformed into a 2D one. + */ class teca_integrated_vapor_transport : public teca_vertical_reduction { public: @@ -31,35 +33,59 @@ class teca_integrated_vapor_transport : public teca_vertical_reduction TECA_ALGORITHM_CLASS_NAME(teca_integrated_vapor_transport) ~teca_integrated_vapor_transport(); - // report/initialize to/from Boost program options - // objects. + /** @name program_options + * report/initialize to/from Boost program options objects. + */ + ///@{ TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() + ///@} - // set the name of the varaiable that contains the longitudinal - // component of the wind vector ("ua") + /** @name wind_u_variable + * set the name of the varaiable that contains the longitudinal component + * of the wind vector ("ua") + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, wind_u_variable) + ///@} - // set the name of the varaiable that contains the latitudinal - // component of the wind vector ("va") + /** @name wind_v_variable + * set the name of the varaiable that contains the latitudinal component of + * the wind vector ("va") + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, wind_v_variable) - - // set the name of the variable that contains the specific - // humidity ("hus") - TECA_ALGORITHM_PROPERTY(std::string, - specific_humidity_variable) - - // set the name of the varaiable that contains the longitudinal - // component of the ivt vector ("ivt_u") + ///@} + + /** @name specific_humidity_variable + * set the name of the variable that contains the specific humidity ("hus") + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, specific_humidity_variable) + ///@} + + /** @name ivt_u_variable + * set the name of the varaiable that contains the longitudinal component + * of the ivt vector ("ivt_u") + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, ivt_u_variable) + ///@} - // set the name of the varaiable that contains the latitudinal - // component of the ivt vector ("ivt_v") + /** @name ivt_v_variable + * set the name of the varaiable that contains the latitudinal component of + * the ivt vector ("ivt_v") + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, ivt_v_variable) + ///@} - // set the _fillValue attribute for the output data. - // default 1.0e20 + /** @name fill_value + * set the _fillValue attribute for the output data. 
default 1.0e20 + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, fill_value) + ///@} protected: teca_integrated_vapor_transport(); diff --git a/alg/teca_integrated_water_vapor.cxx b/alg/teca_integrated_water_vapor.cxx new file mode 100644 index 000000000..481dfc690 --- /dev/null +++ b/alg/teca_integrated_water_vapor.cxx @@ -0,0 +1,362 @@ +#include "teca_integrated_water_vapor.h" + +#include "teca_cartesian_mesh.h" +#include "teca_array_collection.h" +#include "teca_variant_array.h" +#include "teca_metadata.h" +#include "teca_coordinate_util.h" + +#include +#include +#include +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +using std::string; +using std::vector; +using std::cerr; +using std::endl; +using std::cos; + +//#define TECA_DEBUG + +namespace { +template +void cartesian_iwv(unsigned long nx, unsigned long ny, unsigned long nz, + const coord_t *plev, const num_t *q, num_t *iwv) +{ + unsigned long nxy = nx*ny; + + // initialize the result + memset(iwv, 0, nxy*sizeof(num_t)); + + // work an x-y slice at a time + unsigned long nzm1 = nz - 1; + for (unsigned long k = 0; k < nzm1; ++k) + { + // dp over the slice + num_t h2 = num_t(0.5) * (plev[k+1] - plev[k]); + + // the current two x-y-planes of data + unsigned long knxy = k*nxy; + const num_t *q_k0 = q + knxy; + const num_t *q_k1 = q_k0 + nxy; + + // accumulate this plane of data using trapazoid rule + for (unsigned long i = 0; i < nxy; ++i) + { + iwv[i] += h2 * (q_k0[i] + q_k1[i]); + } + } + + // check the sign, in this way we can handle both increasing and decreasing + // pressure coordinates + num_t s = plev[1] - plev[0] < num_t(0) ? num_t(-1) : num_t(1); + + // scale by -1/g + num_t m1g = s/num_t(9.80665); + for (unsigned long i = 0; i < nxy; ++i) + iwv[i] *= m1g; +} + +template +void cartesian_iwv(unsigned long nx, unsigned long ny, unsigned long nz, + const coord_t *plev, const num_t *q, const char *q_valid, num_t *iwv) +{ + unsigned long nxy = nx*ny; + + // initialize the result + memset(iwv, 0, nxy*sizeof(num_t)); + + // work an x-y slice at a time + unsigned long nzm1 = nz - 1; + for (unsigned long k = 0; k < nzm1; ++k) + { + // dp over the slice + num_t h2 = num_t(0.5) * (plev[k+1] - plev[k]); + + // the current two x-y-planes of data + unsigned long knxy = k*nxy; + const num_t *q_k0 = q + knxy; + const num_t *q_k1 = q_k0 + nxy; + + const char *q_valid_k0 = q_valid + knxy; + const char *q_valid_k1 = q_valid_k0 + nxy; + + // accumulate this plane of data using trapazoid rule + for (unsigned long i = 0; i < nxy; ++i) + { + iwv[i] += ((q_valid_k0[i] && q_valid_k1[i]) ? + h2 * (q_k0[i] + q_k1[i]) : num_t(0)); + } + } + + // check the sign, in this way we can handle both increasing and decreasing + // pressure coordinates + num_t s = plev[1] - plev[0] < num_t(0) ? 
num_t(-1) : num_t(1); + + // scale by -1/g + num_t m1g = s/num_t(9.80665); + for (unsigned long i = 0; i < nxy; ++i) + iwv[i] *= m1g; +} +} + +// -------------------------------------------------------------------------- +teca_integrated_water_vapor::teca_integrated_water_vapor() : + specific_humidity_variable("Q"), iwv_variable("IWV"), + fill_value(1.0e20) +{ + this->set_number_of_input_connections(1); + this->set_number_of_output_ports(1); +} + +// -------------------------------------------------------------------------- +teca_integrated_water_vapor::~teca_integrated_water_vapor() +{} + +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_integrated_water_vapor::get_properties_description( + const string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_integrated_water_vapor":prefix)); + + opts.add_options() + TECA_POPTS_GET(std::string, prefix, specific_humidity_variable, + "name of the variable containg the specific humidity") + TECA_POPTS_GET(double, prefix, fill_value, + "the value of the NetCDF _FillValue attribute") + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_integrated_water_vapor::set_properties( + const string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, std::string, prefix, specific_humidity_variable) + TECA_POPTS_SET(opts, double, prefix, fill_value) +} +#endif + +// -------------------------------------------------------------------------- +teca_metadata teca_integrated_water_vapor::get_output_metadata( + unsigned int port, + const std::vector &input_md) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_integrated_water_vapor::get_output_metadata" << std::endl; +#endif + (void)port; + + // set things up in the first pass, and don't modify in subsequent passes + // due to threading concerns + + if (this->get_number_of_derived_variables() == 0) + { + // the base class will handle dealing with the transformation of + // mesh dimensions and reporting the array we produce, but we have + // to determine the data type and tell the name of the produced array. 
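Stated as a worked equation, the cartesian_iwv kernels above accumulate the column integral with the trapezoid rule; this is an editorial restatement, assuming q in kg/kg and p in Pa so the result is in kg m^{-2}:

    IWV \approx \frac{s}{g} \sum_{k=0}^{n_z - 2} \frac{q_k + q_{k+1}}{2}\,(p_{k+1} - p_k),
    \qquad s = \mathrm{sign}(p_1 - p_0), \quad g = 9.80665\ \mathrm{m\,s^{-2}}

where the sign factor s makes the result positive whether the pressure levels are stored in ascending or descending order.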
+ const teca_metadata &md = input_md[0]; + + teca_metadata attributes; + if (md.get("attributes", attributes)) + { + TECA_ERROR("Failed to determine output data type " + "because attributes are missing") + return teca_metadata(); + } + + teca_metadata hus_atts; + if (attributes.get(this->specific_humidity_variable, hus_atts)) + { + TECA_ERROR("Failed to determine output data type " + "because attributes for \"" << this->specific_humidity_variable + << "\" are missing") + return teca_metadata(); + } + + int type_code = 0; + if (hus_atts.get("type_code", type_code)) + { + TECA_ERROR("Failed to determine output data type " + "because attributes for \"" << this->specific_humidity_variable + << "\" are missing a \"type_code\"") + return teca_metadata(); + } + + teca_array_attributes iwv_atts( + type_code, teca_array_attributes::point_centering, + 0, "kg m^{-2}", "integrated water vapor", + "the vertically integrated water vapor", + 1, this->fill_value); + + + // install name and attributes of the output variables in the base class + this->append_derived_variable(this->iwv_variable); + this->append_derived_variable_attribute(iwv_atts); + } + + if (this->get_number_of_dependent_variables() == 0) + { + // install the names of the input variables in the base class + this->append_dependent_variable(this->specific_humidity_variable); + } + + // invoke the base class method, which does the work of transforming + // the mesh and reporting the variables and their attributes. + return teca_vertical_reduction::get_output_metadata(port, input_md); +} + +// -------------------------------------------------------------------------- +std::vector teca_integrated_water_vapor::get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) +{ + // invoke the base class method + return teca_vertical_reduction::get_upstream_request(port, input_md, request); +} + +// -------------------------------------------------------------------------- +const_p_teca_dataset teca_integrated_water_vapor::execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_integrated_water_vapor::execute" << std::endl; +#endif + (void)port; + + // get the input mesh + const_p_teca_cartesian_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); + + if (!in_mesh) + { + TECA_ERROR("Failed to compute IWV because a cartesian mesh is required.") + return nullptr; + } + + // get the input dimensions + unsigned long extent[6] = {0}; + if (in_mesh->get_extent(extent)) + { + TECA_ERROR("Failed to compute IWV because mesh extent is missing.") + return nullptr; + } + + unsigned long nx = extent[1] - extent[0] + 1; + unsigned long ny = extent[3] - extent[2] + 1; + unsigned long nz = extent[5] - extent[4] + 1; + + // get the pressure coordinates + const_p_teca_variant_array p = in_mesh->get_z_coordinates(); + if (!p) + { + TECA_ERROR("Failed to compute IWV because pressure coordinates are missing") + return nullptr; + } + + if (p->size() < 2) + { + TECA_ERROR("Failed to compute IWV because z dimensions " + << p->size() << " < 2 as required by the integration method") + return nullptr; + } + + // gather the input arrays + const_p_teca_variant_array q = + in_mesh->get_point_arrays()->get(this->specific_humidity_variable); + + if (!q) + { + TECA_ERROR("Failed to compute IWV because specific humidity \"" + << this->specific_humidity_variable << "\" is missing") + 
return nullptr; + } + + const_p_teca_variant_array q_valid = + in_mesh->get_point_arrays()->get(this->specific_humidity_variable + "_valid"); + + // the base class will construct the output mesh + p_teca_cartesian_mesh out_mesh + = std::dynamic_pointer_cast( + std::const_pointer_cast( + teca_vertical_reduction::execute(port, input_data, request))); + + if (!out_mesh) + { + TECA_ERROR("Failed to compute IWV because the output mesh was " + "not constructed") + return nullptr; + } + + // allocate the output arrays + unsigned long nxy = nx*ny; + p_teca_variant_array iwv = q->new_instance(nxy); + + // store the result + out_mesh->get_point_arrays()->set(this->iwv_variable, iwv); + + // calculate IWV + NESTED_TEMPLATE_DISPATCH_FP(const teca_variant_array_impl, + p.get(), _COORDS, + + const NT_COORDS *p_p = static_cast(p.get())->get(); + + NESTED_TEMPLATE_DISPATCH_FP(teca_variant_array_impl, + iwv.get(), _DATA, + + NT_DATA *p_iwv = static_cast(iwv.get())->get(); + + const NT_DATA *p_q = static_cast(q.get())->get(); + + const char *p_q_valid = nullptr; + if (q_valid) + { + using TT_MASK = teca_char_array; + + p_q_valid = dynamic_cast(q_valid.get())->get(); + + ::cartesian_iwv(nx, ny, nz, p_p, p_q, p_q_valid, p_iwv); + } + else + { + ::cartesian_iwv(nx, ny, nz, p_p, p_q, p_iwv); + } + ) + ) + + // pass 2D arrays through. + p_teca_array_collection in_arrays = + std::const_pointer_cast(in_mesh->get_point_arrays()); + + p_teca_array_collection out_arrays = out_mesh->get_point_arrays(); + + int n_arrays = in_arrays->size(); + for (int i = 0; i < n_arrays; ++i) + { + p_teca_variant_array array = in_arrays->get(i); + if (array->size() == nxy) + { + // pass the array. + out_arrays->append(in_arrays->get_name(i), array); + } + } + + return out_mesh; +} diff --git a/alg/teca_integrated_water_vapor.h b/alg/teca_integrated_water_vapor.h new file mode 100644 index 000000000..3070e6a49 --- /dev/null +++ b/alg/teca_integrated_water_vapor.h @@ -0,0 +1,85 @@ +#ifndef teca_integrated_water_vapor_h +#define teca_integrated_water_vapor_h + +#include "teca_shared_object.h" +#include "teca_vertical_reduction.h" +#include "teca_metadata.h" + +#include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_integrated_water_vapor) + +/// An algorithm that computes integrated water vapor (IWV) +/** + * Compute integrated vaport transport (IWV) from the specific humidity. + * + * \f[ + * IWV = \frac{1}{g} \int_{p_{sfc}}^{p_{top}} q dp + * \f] + * + * where q is the specific humidity. + * + * This calculation is an instance of a vertical reduction where + * a 3D mesh is transformed into a 2D one. + */ +class teca_integrated_water_vapor : public teca_vertical_reduction +{ +public: + TECA_ALGORITHM_STATIC_NEW(teca_integrated_water_vapor) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_integrated_water_vapor) + TECA_ALGORITHM_CLASS_NAME(teca_integrated_water_vapor) + ~teca_integrated_water_vapor(); + + // report/initialize to/from Boost program options + // objects. + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + + /** @name specific_humidity_variable + * set the name of the variable that contains the specific humidity ("hus") + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, specific_humidity_variable) + ///@} + + /** @name iwv_variable + * set the name of the varaiable that contains the integrated water vapor + * ("iwv"). + */ + ///@{ + TECA_ALGORITHM_PROPERTY(std::string, iwv_variable) + ///@} + + /** @name fill_value + * set the _fillValue attribute for the output data. 
default 1.0e20 + */ + ///@{ + TECA_ALGORITHM_PROPERTY(double, fill_value) + ///@} + +protected: + teca_integrated_water_vapor(); + +private: + teca_metadata get_output_metadata( + unsigned int port, + const std::vector &input_md) override; + + std::vector get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) override; + + const_p_teca_dataset execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) override; + +private: + std::string specific_humidity_variable; + std::string iwv_variable; + double fill_value; +}; + +#endif diff --git a/alg/teca_l2_norm.cxx b/alg/teca_l2_norm.cxx index 9d66dbdd0..df2aed92f 100644 --- a/alg/teca_l2_norm.cxx +++ b/alg/teca_l2_norm.cxx @@ -1,6 +1,6 @@ #include "teca_l2_norm.h" -#include "teca_cartesian_mesh.h" +#include "teca_mesh.h" #include "teca_array_collection.h" #include "teca_variant_array.h" #include "teca_metadata.h" @@ -92,6 +92,8 @@ void teca_l2_norm::get_properties_description( "array to store the computed norm in") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -99,6 +101,8 @@ void teca_l2_norm::get_properties_description( void teca_l2_norm::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, component_0_variable) TECA_POPTS_SET(opts, std::string, prefix, component_1_variable) TECA_POPTS_SET(opts, std::string, prefix, component_2_variable) @@ -279,12 +283,12 @@ const_p_teca_dataset teca_l2_norm::execute( (void)port; // get the input mesh - const_p_teca_cartesian_mesh in_mesh - = std::dynamic_pointer_cast(input_data[0]); + const_p_teca_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); if (!in_mesh) { - TECA_ERROR("Failed to compute l2 norm. dataset is not a teca_cartesian_mesh") + TECA_ERROR("Failed to compute l2 norm. dataset is not a teca_mesh") return nullptr; } @@ -355,11 +359,10 @@ const_p_teca_dataset teca_l2_norm::execute( // create the output mesh, pass everything through, and // add the l2 norm array - p_teca_cartesian_mesh out_mesh = teca_cartesian_mesh::New(); - - out_mesh->shallow_copy(std::const_pointer_cast(in_mesh)); + p_teca_mesh out_mesh = std::static_pointer_cast + (std::const_pointer_cast(in_mesh)->new_shallow_copy()); - out_mesh->get_point_arrays()->append( + out_mesh->get_point_arrays()->set( this->get_l2_norm_variable(request), l2_norm); return out_mesh; diff --git a/alg/teca_l2_norm.h b/alg/teca_l2_norm.h index f67e23581..5a67eceb0 100644 --- a/alg/teca_l2_norm.h +++ b/alg/teca_l2_norm.h @@ -10,10 +10,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_l2_norm) -/// an algorithm that computes L2 norm -/** -Compute L2 norm -*/ +/// An algorithm that computes L2 norm class teca_l2_norm : public teca_algorithm { public: @@ -27,19 +24,43 @@ class teca_l2_norm : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the arrays that contain the vector components - // to compute norm from + /** @name component_0_variable + * Set the arrays that contain the vector components to compute the norm + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_0_variable) + ///@} + + /** @name component_1_variable + * Set the arrays that contain the vector components to compute the norm + * from. 
+ */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_1_variable) + ///@} + + /** @name component_2_variable + * Set the arrays that contain the vector components to compute the norm + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_2_variable) + ///@} - // set the name of the array to store the result in. - // the default is "l2_norm" + /** @name l2_norm_variable + * set the name of the array to store the result in. the default is + * "l2_norm" + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, l2_norm_variable) + ///@} protected: teca_l2_norm(); + // helpers to get the variable names from either the incoming + // request or the class member variable. std::string get_component_0_variable(const teca_metadata &request); std::string get_component_1_variable(const teca_metadata &request); std::string get_component_2_variable(const teca_metadata &request); diff --git a/alg/teca_laplacian.cxx b/alg/teca_laplacian.cxx index 43c481e44..9d9966dd3 100644 --- a/alg/teca_laplacian.cxx +++ b/alg/teca_laplacian.cxx @@ -44,7 +44,7 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, // delta lon squared as a function of latitude num_t d_lon = (lon[1] - lon[0]) * deg_to_rad() * earth_radius(); // tan(lat) - num_t *tan_lat = static_cast(malloc(n_bytes)); + num_t *tan_lat = static_cast(malloc(n_bytes)); for (unsigned long j = 0; j < n_lat; ++j) { delta_lon_sq[j] = pow(d_lon * cos(lat[j] * deg_to_rad()),2); @@ -65,7 +65,7 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, { // set the current row in the u/v/w arrays unsigned long jj = j*n_lon; - /* + /* * The following f_* variables describe the field * f in a grid oriented fashion: * @@ -74,12 +74,12 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, * f_ijm f_ji f_ijp * * f_imjm f_imj f_imjp - * + * * The 'j' direction represents longitude, the - * 'i' direciton represents latitude. + * 'i' direciton represents latitude. * * Note: The laplacian represented here uses the chain - * rule to separate the (1/cos(lat)*d(cos(lat)*df/dlat)/dlat + * rule to separate the (1/cos(lat)*d(cos(lat)*df/dlat)/dlat * term into two terms. * */ @@ -94,15 +94,15 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, // set the pointer index for the output field w // ... this is index i,j num_t *ww = w + jj; - // create a dummy variable for u**2 + // create a dummy variable for u**2 num_t dlon_sq = delta_lon_sq[j]; for (unsigned long i = 1; i < max_i; ++i) { // calculate the laplacian in spherical coordinates, assuming // constant radius R. - ww[i] = (f_imj[i] - num_t(2)*f_ij[i] + f_ipj[i])/dlat_sq - - tan_lat[j]*(f_ipj[i]-f_imj[i])/dlat + + ww[i] = (f_imj[i] - num_t(2)*f_ij[i] + f_ipj[i])/dlat_sq - + tan_lat[j]*(f_ipj[i]-f_imj[i])/dlat + (f_ijm[i] - num_t(2)*f_ij[i] + f_ijp[i])/dlon_sq; } } @@ -125,13 +125,13 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, // set the pointer index for the output field w // ... this is index i,j num_t *ww = w + jj; - // create a dummy variable for u**2 + // create a dummy variable for u**2 num_t dlon_sq = delta_lon_sq[j]; // calculate the laplacian in spherical coordinates, assuming // constant radius R. 
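For reference, the stencil in this hunk appears to discretize the constant-radius spherical Laplacian with the chain rule applied to the latitude term; this is an editorial reconstruction, not text from the patch:

    \nabla^2 f = \frac{1}{R^2}\left[\frac{\partial^2 f}{\partial \phi^2}
        - \tan\phi\,\frac{\partial f}{\partial \phi}
        + \frac{1}{\cos^2\phi}\,\frac{\partial^2 f}{\partial \lambda^2}\right]

with latitude \phi and longitude \lambda; the factors of the Earth radius R and \cos\phi are folded into dlat and delta_lon_sq in the code.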
- ww[0] = (f_imj[0] - num_t(2)*f_ij[0] + f_ipj[0])/dlat_sq - - tan_lat[j]*(f_ipj[0]-f_imj[0])/dlat + + ww[0] = (f_imj[0] - num_t(2)*f_ij[0] + f_ipj[0])/dlat_sq - + tan_lat[j]*(f_ipj[0]-f_imj[0])/dlat + (f_ijm[0] - num_t(2)*f_ij[0] + f_ijp[0])/dlon_sq; } @@ -152,13 +152,13 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, // set the pointer index for the output field w // ... this is index i,j num_t *ww = w + jj + max_i; - // create a dummy variable for u**2 + // create a dummy variable for u**2 num_t dlon_sq = delta_lon_sq[j]; // calculate the laplacian in spherical coordinates, assuming // constant radius R. - ww[0] = (f_imj[0] - num_t(2)*f_ij[0] + f_ipj[0])/dlat_sq - - tan_lat[j]*(f_ipj[0]-f_imj[0])/dlat + + ww[0] = (f_imj[0] - num_t(2)*f_ij[0] + f_ipj[0])/dlat_sq - + tan_lat[j]*(f_ipj[0]-f_imj[0])/dlat + (f_ijm[0] - num_t(2)*f_ij[0] + f_ijp[0])/dlon_sq; } } @@ -193,7 +193,7 @@ void laplacian(num_t *w, const pt_t *lon, const pt_t *lat, // -------------------------------------------------------------------------- teca_laplacian::teca_laplacian() : - component_0_variable(), + component_0_variable(), laplacian_variable("laplacian") { this->set_number_of_input_connections(1); @@ -219,6 +219,8 @@ void teca_laplacian::get_properties_description( "array to store the computed laplacian in") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -226,6 +228,8 @@ void teca_laplacian::get_properties_description( void teca_laplacian::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, component_0_variable) TECA_POPTS_SET(opts, std::string, prefix, laplacian_variable) } diff --git a/alg/teca_laplacian.h b/alg/teca_laplacian.h index 247e00bd4..35e623d39 100644 --- a/alg/teca_laplacian.h +++ b/alg/teca_laplacian.h @@ -10,10 +10,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_laplacian) -/// an algorithm that computes laplacian -/** -Compute laplacian from a vector field. -*/ +/// An algorithm that computes the Laplacian from a vector field. class teca_laplacian : public teca_algorithm { public: @@ -27,14 +24,29 @@ class teca_laplacian : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the arrays that contain the vector components - // to compute laplacian from + /** @name component_0_variable + * Set the arrays that contain the vector components to compute laplacian + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_0_variable) + ///@} + + /** @name component_1_variable + * Set the arrays that contain the vector components to compute laplacian + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_1_variable) + ///@} - // set the name of the array to store the result in. - // the default is "laplacian" + /** @name laplacian_variable + * Set the name of the array to store the result in. the default is + * "laplacian". 
+ */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, laplacian_variable) + ///@} protected: teca_laplacian(); diff --git a/alg/teca_latitude_damper.cxx b/alg/teca_latitude_damper.cxx index 34478dcfd..0a4804a1e 100644 --- a/alg/teca_latitude_damper.cxx +++ b/alg/teca_latitude_damper.cxx @@ -3,7 +3,7 @@ #include "teca_variant_array.h" #include "teca_metadata.h" #include "teca_cartesian_mesh.h" -#include "teca_metadata_util.h" +#include "teca_string_util.h" #include #include @@ -74,27 +74,31 @@ void teca_latitude_damper::get_properties_description( { options_description opts("Options for " + (prefix.empty()?"teca_latitude_damper":prefix)); - + opts.add_options() TECA_POPTS_GET(double, prefix, center, "set the center (mu) for the gaussian filter") TECA_POPTS_GET(double, prefix, half_width_at_half_max, "set the value of the half width at half maximum (HWHM) " "to calculate sigma from: sigma = HWHM/std::sqrt(2.0*std::log(2.0))") - TECA_POPTS_GET(std::vector, prefix, damped_variables, + TECA_POPTS_MULTI_GET(std::vector, prefix, damped_variables, "set the variables that will be damped by the inverted " "gaussian filter") TECA_POPTS_GET(std::string, prefix, variable_post_fix, "set the post-fix that will be attached to the variables " "that will be saved in the output") ; - + + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } // -------------------------------------------------------------------------- void teca_latitude_damper::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, double, prefix, center) TECA_POPTS_SET(opts, double, prefix, half_width_at_half_max) TECA_POPTS_SET(opts, std::vector, prefix, damped_variables) @@ -213,14 +217,14 @@ std::vector teca_latitude_damper::get_upstream_request( arrays.insert(damped_vars.begin(), damped_vars.end()); - // Cleaning off the postfix for arrays passed in the pipeline. + // Cleaning off the postfix for arrays passed in the pipeline. // For ex a down stream could request "foo_damped" then we'd // need to request "foo". also remove "foo_damped" from the // request. const std::string &var_post_fix = this->variable_post_fix; if (!var_post_fix.empty()) { - teca_metadata_util::remove_post_fix(arrays, var_post_fix); + teca_string_util::remove_post_fix(arrays, var_post_fix); } req.set("arrays", arrays); diff --git a/alg/teca_latitude_damper.h b/alg/teca_latitude_damper.h index 9cab2b7ff..908b6cc22 100644 --- a/alg/teca_latitude_damper.h +++ b/alg/teca_latitude_damper.h @@ -10,21 +10,24 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_latitude_damper) +/// Inverted Gaussian damper for scalar fields. /** -damps the specified scalar field(s) using an inverted Gaussian centered on a -given latitude with a half width specified in degrees latitude. The paramters -defining the Gaussian (center, half width at half max) can be specified by the -user directly or by down stream algorithm via the following keys in the request. - -request keys: - - teca_latitude_damper::damped_variables - teca_latitude_damper::half_width_at_half_max - teca_latitude_damper::center - -note that user specified values take precedence over request keys. When using -request keys be sure to include the variable post-fix. -*/ + * Damps the specified scalar field(s) using an inverted Gaussian centered on a + * given latitude with a half width specified in degrees latitude. 
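Read literally, the description above implies a per-point damping factor of one minus a Gaussian in latitude. A minimal sketch under that assumption follows; the 1 - exp(...) form is an assumption on my part, while the HWHM-to-sigma conversion matches the option text in teca_latitude_damper.cxx.

    #include <cmath>

    // illustrative only -- not from the patch
    double damping_factor(double lat, double center, double hwhm)
    {
        double sigma = hwhm / std::sqrt(2.0 * std::log(2.0));
        double d = (lat - center) / sigma;
        return 1.0 - std::exp(-0.5 * d * d);
    }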
The + * parameters defining the Gaussian (center, half width at half max) can be + * specified by the user directly or by down stream algorithm via the + * following keys in the request. + * + * request keys: + * + * teca_latitude_damper::damped_variables + * teca_latitude_damper::half_width_at_half_max + * teca_latitude_damper::center + * + * @note + * User specified values take precedence over request keys. When + * using request keys be sure to include the variable post-fix. + */ class teca_latitude_damper : public teca_algorithm { public: @@ -38,7 +41,7 @@ class teca_latitude_damper : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the center of the Gaussian in units of degress latitude. + // set the center of the Gaussian in units of degrees latitude. // default is 0.0 deg lat TECA_ALGORITHM_PROPERTY(double, center) diff --git a/alg/teca_mask.h b/alg/teca_mask.h index 6c7dcb84d..02b6072e8 100644 --- a/alg/teca_mask.h +++ b/alg/teca_mask.h @@ -1,6 +1,8 @@ #ifndef teca_mask_h #define teca_mask_h +/// @file + #include "teca_shared_object.h" #include "teca_algorithm.h" #include "teca_metadata.h" @@ -11,9 +13,8 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_mask) /// an algorithm that masks a range of values -/** -An algorithm to mask a range of values in an array. Values -in the range are replaced with the mask value. +/** An algorithm to mask a range of values in an array. Values + * in the range are replaced with the mask value. */ class teca_mask : public teca_algorithm { diff --git a/alg/teca_normalize_coordinates.cxx b/alg/teca_normalize_coordinates.cxx index a9544c7ae..a4f946816 100644 --- a/alg/teca_normalize_coordinates.cxx +++ b/alg/teca_normalize_coordinates.cxx @@ -5,6 +5,7 @@ #include "teca_variant_array.h" #include "teca_metadata.h" #include "teca_coordinate_util.h" +#include "teca_metadata_util.h" #include #include @@ -16,35 +17,80 @@ #include #endif -using std::cerr; -using std::endl; - //#define TECA_DEBUG -struct teca_normalize_coordinates::internals_t +struct internals { - internals_t() {} - ~internals_t() {} - - static - p_teca_variant_array normalize_axis(const const_p_teca_variant_array &x); - - static - void normalize_extent(p_teca_variant_array out_x, - p_teca_variant_array out_y, p_teca_variant_array out_z, - unsigned long *whole_extent, unsigned long *extent_in, - unsigned long *extent_out); - - static - void normalize_variables(bool normalize_x, - bool normalize_y, bool normalize_z, unsigned long *extent, - p_teca_array_collection data); + // check and flip the axis. templated on comparison type std::less puts in + // ascending order, std::greater puts in descending order. + template typename compare_t> + static int reorder(p_teca_variant_array &x_out, + const const_p_teca_variant_array &x, bool &do_reorder); + + // transforms coordinates from [-180, 180] to [0, 360]. + template + static data_t periodic_shift_x(data_t x); + + // transforms coordinates from [0, 360] to [-180, 180]. 
+ template + static data_t inv_periodic_shift_x(data_t x); + + template + static void periodic_shift_x(coord_t *pxo, + unsigned long *pmap, const coord_t *px, unsigned long nx); + + template + static void inv_periodic_shift_x(unsigned long *pmap, + const coord_t *px, unsigned long nx); + + static int inv_periodic_shift_x( + p_teca_unsigned_long_array &map, + const const_p_teca_variant_array &x); + + static int periodic_shift_x(p_teca_variant_array &out_x, + p_teca_unsigned_long_array &shift_map, + const const_p_teca_variant_array &in_x, + bool &shifted_x); + + static int periodic_shift_x(p_teca_array_collection data, + const teca_metadata &attributes, + const const_p_teca_unsigned_long_array &shift_map, + const unsigned long *extent_in, + const unsigned long *extent_out); + + // put the y-axis in ascending order if it is not. if a transformation was + // applied reordered_y is set. + static int ascending_order_y( + p_teca_variant_array &out_y, const const_p_teca_variant_array &in_y, + bool &reorder_y); + + // apply corresponding transformation that put the -y-axis in ascending + // order to all data arrays + static int ascending_order_y(p_teca_array_collection data, + const teca_metadata &attributes, const unsigned long *extent); + + + template + struct indirect_less; }; +template +struct internals::indirect_less +{ + indirect_less(data_t *data) : m_data(data) {} + + bool operator()(const unsigned long &l, const unsigned long &r) + { + return m_data[l] < m_data[r]; + } + + data_t *m_data; +}; // -------------------------------------------------------------------------- -p_teca_variant_array teca_normalize_coordinates::internals_t::normalize_axis( - const const_p_teca_variant_array &x) +template typename compare_t> +int internals::reorder(p_teca_variant_array &x_out, + const const_p_teca_variant_array &x, bool &do_reorder) { unsigned long nx = x->size(); unsigned long x1 = nx - 1; @@ -52,190 +98,343 @@ p_teca_variant_array teca_normalize_coordinates::internals_t::normalize_axis( NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, x.get(), _C, - // detect coordinate axis in descending order, reorder it in ascending - // order. for instance an // input of x = (90 30 -30 -90) is transformed - // to x = (-90 -30 30 90) const NT_C *px = dynamic_cast(x.get())->get(); - if (px[x1] < px[0]) - { - p_teca_variant_array xo = x->new_instance(nx); - NT_C *pxo = static_cast*>(xo.get())->get(); - pxo += x1; - for (unsigned long i = 0; i < nx; ++i) - pxo[-i] = px[i]; + // if comp(x0, x1) reverse the axis. 
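A worked example, echoing the example removed from the old comment block:

    // editorial illustration: with compare_t = std::less an input of
    //   x = (90, 30, -30, -90)
    // sets do_reorder and produces
    //   x_out = (-90, -30, 30, 90);
    // with compare_t = std::greater an ascending axis is flipped to descending.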
+ // when comp is less than the output will be ascending + // when comp is greater than the output will be descending + compare_t compare; + do_reorder = compare(px[x1], px[0]); - return xo; - } + if (!do_reorder) + return 0; + + p_teca_variant_array xo = x->new_instance(nx); + NT_C *pxo = static_cast*>(xo.get())->get(); + + pxo += x1; + for (unsigned long i = 0; i < nx; ++i) + pxo[-i] = px[i]; + + x_out = xo; + + return 0; ) - return nullptr; + + TECA_ERROR("Unsupported coordinate type " << x->get_class_name()) + return -1; } // -------------------------------------------------------------------------- -void teca_normalize_coordinates::internals_t::normalize_extent( - p_teca_variant_array out_x, p_teca_variant_array out_y, - p_teca_variant_array out_z, unsigned long *whole_extent, - unsigned long *extent_in, unsigned long *extent_out) +template +data_t internals::periodic_shift_x(data_t x) { -#if defined(TECA_DEBUG) - cerr << "out=[" << out_x << ", " << out_y << ", " << out_z << "]" << endl - << "whole_extent=[" << whole_extent[0] << ", " << whole_extent[1] << ", " - << whole_extent[2] << ", " << whole_extent[3] << ", " << whole_extent[4] - << ", " << whole_extent[5] << "]" << endl << "extent_in=[" << extent_in[0] - << ", " << extent_in[1] << ", " << extent_in[2] << ", " << extent_in[3] - << ", " << extent_in[4] << ", " << extent_in[5] << "]" << endl; -#endif + if (x < data_t(0)) + return x + data_t(360); + return x; +} - memcpy(extent_out, extent_in, 6*sizeof(unsigned long)); +// -------------------------------------------------------------------------- +template +data_t internals::inv_periodic_shift_x(data_t x) +{ + if (x > data_t(180)) + return x - data_t(360); + return x; +} - // detect coordinate axes in descending order, transform the incoming - // extents from ascending order coordinates back to original descending - // order coordinate system so the upstream gets the correct extent - if (out_x) - { - unsigned long wnx = whole_extent[1] - whole_extent[0]; - extent_out[0] = wnx - extent_in[1]; - extent_out[1] = wnx - extent_in[0]; - } +// -------------------------------------------------------------------------- +template +void internals::periodic_shift_x(coord_t *pxo, + unsigned long *pmap, const coord_t *px, unsigned long nx) +{ + coord_t *tmp = (coord_t*)malloc(nx*sizeof(coord_t)); - if (out_y) - { - unsigned long wny = whole_extent[3] - whole_extent[2]; - extent_out[2] = wny - extent_in[3]; - extent_out[3] = wny - extent_in[2]; - } + // apply the periodic shift, this will leave the axis out of order + for (unsigned long i = 0; i < nx; ++i) + tmp[i] = periodic_shift_x(px[i]); - if (out_z) - { - unsigned long wnz = whole_extent[5] - whole_extent[4]; - extent_out[4] = wnz - extent_in[5]; - extent_out[5] = wnz - extent_in[4]; - } + // construct the map the puts the axis back into order. 
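A small worked example of the shift-and-sort performed here (editorial, not from the patch):

    // e.g. for an ascending x-axis in [-180, 180]:
    //   px   = { -90,   0,  90, 180 }
    //   tmp  = { 270,   0,  90, 180 }   after adding 360 to the negative values
    //   pmap = {   1,   2,   3,   0 }   indices that order tmp ascending
    //   pxo  = {   0,  90, 180, 270 }   pxo[i] = tmp[pmap[i]]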
+ for (unsigned long i = 0; i < nx; ++i) + pmap[i] = i; -#if defined(TECA_DEBUG) - cerr << "extent_out=[" << extent_out[0] << ", " << extent_out[1] << ", " - << extent_out[2] << ", " << extent_out[3] << ", " << extent_out[4] - << ", " << extent_out[5] << "]" << endl; -#endif + indirect_less comp(tmp); + std::sort(pmap, pmap + nx, comp); + + // reoder the periodic shifted values + for (unsigned long i = 0; i < nx; ++i) + pxo[i] = tmp[pmap[i]]; + + free(tmp); } +// -------------------------------------------------------------------------- +template +void internals::inv_periodic_shift_x(unsigned long *pmap, + const coord_t *px, unsigned long nx) +{ + coord_t *tmp = (coord_t*)malloc(nx*sizeof(coord_t)); + + // apply the periodic shift, this will leave the axis out of order + for (unsigned long i = 0; i < nx; ++i) + tmp[i] = inv_periodic_shift_x(px[i]); + + // construct the map that the puts the axis back into order. + for (unsigned long i = 0; i < nx; ++i) + pmap[i] = i; + + indirect_less comp(tmp); + std::sort(pmap, pmap + nx, comp); + + free(tmp); +} // -------------------------------------------------------------------------- -void teca_normalize_coordinates::internals_t::normalize_variables( - bool normalize_x, bool normalize_y, bool normalize_z, - unsigned long *extent, p_teca_array_collection data) +int internals::inv_periodic_shift_x(p_teca_unsigned_long_array &map, + const const_p_teca_variant_array &x) { - unsigned long nx = extent[1] - extent[0] + 1; - unsigned long ny = extent[3] - extent[2] + 1; - unsigned long nz = extent[5] - extent[4] + 1; + unsigned long nx = x->size(); + + NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, + x.get(), _C, + + const NT_C *px = dynamic_cast(x.get())->get(); + + map = teca_unsigned_long_array::New(nx); + unsigned long *pmap = map->get(); - unsigned long nxy = nx*ny; - unsigned long nxyz = nxy*nz; + inv_periodic_shift_x(pmap, px, nx); + return 0; + ) + + TECA_ERROR("Unsupported coordinate type " << x->get_class_name()) + return -1; +} + +// -------------------------------------------------------------------------- +int internals::periodic_shift_x(p_teca_variant_array &x_out, + p_teca_unsigned_long_array &map, const const_p_teca_variant_array &x, + bool &shifted_x) +{ +// ignore warning about unsigned integer types. these will never need +// the periodic shift and the code will ignore them. +#pragma GCC diagnostic push +#pragma GCC diagnostic ignored "-Wtype-limits" + unsigned long nx = x->size(); unsigned long x1 = nx - 1; - unsigned long y1 = ny - 1; - unsigned long z1 = nz - 1; - unsigned int n_arrays = data->size(); + NESTED_TEMPLATE_DISPATCH(const teca_variant_array_impl, + x.get(), _C, - // for any coodinate axes that have been transformed from descending order - // into ascending order, apply the same transform to the scalar data arrays - if (normalize_x) - { - for (unsigned int l = 0; l < n_arrays; ++l) + const NT_C *px = dynamic_cast(x.get())->get(); + + // check that the shift is needed. 
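+ // the shift is only needed for data stored on [-180, 180]. if the
+ // smallest x coordinate is not negative the data is already on
+ // [0, 360] and is passed through unchanged.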
+ shifted_x = (px[0] < NT_C(0)); + + if (!shifted_x) + return 0; + + // this approach requires that coordinates are in ascending + // order + if (px[x1] < px[0]) { - p_teca_variant_array a = data->get(l); - p_teca_variant_array ao = a->new_instance(nxyz); - NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, - a.get(), _A, - NT_A *pa = static_cast(a.get())->get(); - NT_A *pao = static_cast(ao.get())->get(); - for (unsigned long k = 0; k < nz; ++k) - { - unsigned long kk = k*nxy; - for (unsigned long j = 0; j < ny; ++j) - { - unsigned long jj = kk + j*nx; + TECA_ERROR("A periodic shift can only be apllied to" + " coordinates in ascending order") + return -1; + } - NT_A *par = pa + jj; - NT_A *paor = pao + jj + x1; + // in its current form this approach handles coordinates in + // -180 to 180. + if ((px[0] < NT_C(-180)) || (px[x1] > NT_C(180))) + { + TECA_ERROR("Invalid x-axis coordinate range [" + << px[0] << " , " << px[x1] << "] coordinates in the" + " range [-180.0, 180] are required") + return -1; + } - for (unsigned long i = 0; i < nx; ++i) - paor[-i] = par[i]; - } - } - ) - data->set(l, ao); + // if 2 coordinate points touch the periodic boundary remnove 1 so the + // output does not have an extranious data point at the boundary. + if (teca_coordinate_util::equal(px[0], NT_C(-180)) && + teca_coordinate_util::equal(px[nx-1], NT_C(180))) + { + nx -= 1; } - } - if (normalize_y) + p_teca_variant_array xo = x->new_instance(nx); + NT_C *pxo = static_cast*> + (xo.get())->get(); + + map = teca_unsigned_long_array::New(nx); + unsigned long *pmap = map->get(); + + periodic_shift_x(pxo, pmap, px, nx); + + x_out = xo; + + return 0; + ) + + TECA_ERROR("Unsupported coordinate type " << x->get_class_name()) + return -1; +#pragma GCC diagnostic pop +} + +// -------------------------------------------------------------------------- +int internals::ascending_order_y( + p_teca_variant_array &out_y, const const_p_teca_variant_array &in_y, + bool &reorder_y) +{ + if (reorder(out_y, in_y, reorder_y)) + return -1; + + return 0; +} + +// -------------------------------------------------------------------------- +int internals::periodic_shift_x(p_teca_array_collection data, + const teca_metadata &attributes, + const const_p_teca_unsigned_long_array &shift_map, + const unsigned long *extent_in, + const unsigned long *extent_out) +{ + // apply periodic shift in the x-direction + const unsigned long *pmap = shift_map->get(); + + unsigned int n_arrays = data->size(); + for (unsigned int l = 0; l < n_arrays; ++l) { - unsigned int n_arrays = data->size(); - for (unsigned int l = 0; l < n_arrays; ++l) + // get the extent of the input/output array + const std::string &array_name = data->get_name(l); + teca_metadata array_attributes; + if (attributes.get(array_name, array_attributes)) { - p_teca_variant_array a = data->get(l); - p_teca_variant_array ao = a->new_instance(nxyz); - NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, - a.get(), _A, - NT_A *pa = static_cast(a.get())->get(); - NT_A *pao = static_cast(ao.get())->get(); - for (unsigned long k = 0; k < nz; ++k) + TECA_ERROR("Failed to get the attributes for \"" + << array_name << "\"") + return -1; + } + + unsigned long array_extent_in[6] = {0ul}; + teca_metadata_util::get_array_extent(array_attributes, + extent_in, array_extent_in); + + unsigned long array_extent_out[6] = {0ul}; + teca_metadata_util::get_array_extent(array_attributes, + extent_out, array_extent_out); + + // input and output arrays may be different size if there was a duplicated + // coordinate 
point on the periodic boundary + unsigned long nxi = array_extent_in[1] - array_extent_in[0] + 1; + unsigned long nyi = array_extent_in[3] - array_extent_in[2] + 1; + unsigned long nxyi = nxi*nyi; + + unsigned long nxo = array_extent_out[1] - array_extent_out[0] + 1; + unsigned long nyo = array_extent_out[3] - array_extent_out[2] + 1; + unsigned long nzo = array_extent_out[5] - array_extent_out[4] + 1; + unsigned long nxyo = nxo*nyo; + unsigned long nxyzo = nxyo*nzo; + + p_teca_variant_array a = data->get(l); + + p_teca_variant_array ao = a->new_instance(nxyzo); + NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, + a.get(), _A, + NT_A *pa = static_cast(a.get())->get(); + NT_A *pao = static_cast(ao.get())->get(); + for (unsigned long k = 0; k < nzo; ++k) + { + unsigned long kki = k*nxyi; + unsigned long kko = k*nxyo; + for (unsigned long j = 0; j < nyo; ++j) { - unsigned long kk = k*nxy; - for (unsigned long j = 0; j < ny; ++j) + unsigned long jji = kki + j*nxi; + unsigned long jjo = kko + j*nxo; + + NT_A *par = pa + jji; + NT_A *paor = pao + jjo; + + for (unsigned long i = 0; i < nxo; ++i) { - unsigned long jj = kk + j*nx; - unsigned long jjo = kk + (y1 - j)*nx; - NT_A *par = pa + jj; - NT_A *paor = pao + jjo; - for (unsigned long i = 0; i < nx; ++i) - paor[i] = par[i]; + paor[i] = par[pmap[i]]; } } - ) - data->set(l, ao); - } + } + ) + + data->set(l, ao); } - if (normalize_z) + return 0; +} + +// -------------------------------------------------------------------------- +int internals::ascending_order_y(p_teca_array_collection data, + const teca_metadata &attributes, const unsigned long *mesh_extent) +{ + // for any coodinate axes that have been transformed from descending order + // into ascending order, apply the same transform to the scalar data arrays + unsigned int n_arrays = data->size(); + for (unsigned int l = 0; l < n_arrays; ++l) { - for (unsigned int l = 0; l < n_arrays; ++l) - { - p_teca_variant_array a = data->get(l); - p_teca_variant_array ao = a->new_instance(nxyz); - NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, - a.get(), _A, - NT_A *pa = static_cast(a.get())->get(); - NT_A *pao = static_cast(ao.get())->get(); - for (unsigned long k = 0; k < nz; ++k) - { - unsigned long kk = k*nxy; - unsigned long kko = (z1 - k)*nxy; - for (unsigned long j = 0; j < ny; ++j) - { - unsigned long jnx = j*nx; - unsigned long jj = kk + jnx; - unsigned long jjo = kko + jnx; + const std::string &array_name = data->get_name(l); - NT_A *par = pa + jj; - NT_A *paor = pao + jjo; + // get the extent of the array + unsigned long array_extent[6] = {0ul}; - for (unsigned long i = 0; i < nx; ++i) - paor[i] = par[i]; - } - } - ) - data->set(l, ao); + teca_metadata array_attributes; + if (attributes.get(array_name, array_attributes)) + { + TECA_ERROR("Failed to get attributes for array \"" + << array_name << "\"") + return -1; } + + teca_metadata_util::get_array_extent(array_attributes, + mesh_extent, array_extent); + + unsigned long nx = array_extent[1] - array_extent[0] + 1; + unsigned long ny = array_extent[3] - array_extent[2] + 1; + unsigned long nz = array_extent[5] - array_extent[4] + 1; + + unsigned long nxy = nx*ny; + unsigned long nxyz = nxy*nz; + + unsigned long y1 = ny - 1; + + // apply the transform + p_teca_variant_array a = data->get(l); + p_teca_variant_array ao = a->new_instance(nxyz); + NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, + a.get(), _A, + NT_A *pa = static_cast(a.get())->get(); + NT_A *pao = static_cast(ao.get())->get(); + for (unsigned long k = 0; k < nz; ++k) + { + 
unsigned long kk = k*nxy; + for (unsigned long j = 0; j < ny; ++j) + { + unsigned long jj = kk + j*nx; + unsigned long jjo = kk + (y1 - j)*nx; + NT_A *par = pa + jj; + NT_A *paor = pao + jjo; + for (unsigned long i = 0; i < nx; ++i) + paor[i] = par[i]; + } + } + ) + data->set(l, ao); } + + return 0; } + + // -------------------------------------------------------------------------- -teca_normalize_coordinates::teca_normalize_coordinates() : internals(nullptr) +teca_normalize_coordinates::teca_normalize_coordinates() : + enable_periodic_shift_x(0), enable_y_axis_ascending(1) { - this->internals = new teca_normalize_coordinates::internals_t; - this->set_number_of_input_connections(1); this->set_number_of_output_ports(1); } @@ -243,20 +442,37 @@ teca_normalize_coordinates::teca_normalize_coordinates() : internals(nullptr) // -------------------------------------------------------------------------- teca_normalize_coordinates::~teca_normalize_coordinates() { - delete this->internals; } #if defined(TECA_HAS_BOOST) // -------------------------------------------------------------------------- void teca_normalize_coordinates::get_properties_description( - const std::string &/*prefix*/, options_description &/*global_opts*/) + const std::string &prefix, options_description &global_opts) { + options_description opts("Options for " + + (prefix.empty()?"teca_normalize_coordinates":prefix)); + + opts.add_options() + TECA_POPTS_GET(int, prefix, enable_periodic_shift_x, + "Enables application of periodic shift in the x-direction.") + TECA_POPTS_GET(int, prefix, enable_y_axis_ascending, + "Enables transformtion the ensures the y-axis is in" + " ascending order.") + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); } // -------------------------------------------------------------------------- void teca_normalize_coordinates::set_properties( - const std::string &/*prefix*/, variables_map &/*opts*/) + const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, int, prefix, enable_periodic_shift_x) + TECA_POPTS_SET(opts, int, prefix, enable_y_axis_ascending) } #endif @@ -265,8 +481,8 @@ teca_metadata teca_normalize_coordinates::get_output_metadata( unsigned int port, const std::vector &input_md) { #ifdef TECA_DEBUG - cerr << teca_parallel_id() - << "teca_normalize_coordinates::get_output_metadata" << endl; + std::cerr << teca_parallel_id() + << "teca_normalize_coordinates::get_output_metadata" << std::endl; #endif (void)port; @@ -287,20 +503,68 @@ teca_metadata teca_normalize_coordinates::get_output_metadata( return teca_metadata(); } - // check for and transform coordinate axes from descending order - // to ascending order - p_teca_variant_array out_x, out_y, out_z; - if ((out_x = this->internals->normalize_axis(in_x))) + // ensure x-axis is in 0 to 360 + bool shifted_x = false; + p_teca_variant_array out_x; + p_teca_unsigned_long_array shift_map; + if (this->enable_periodic_shift_x && + internals::periodic_shift_x(out_x, shift_map, in_x, shifted_x)) + { + TECA_ERROR("Failed to apply periodic shift to the x-axis") + return teca_metadata(); + } + + // ensure y-axis ascending + bool reordered_y = false; + p_teca_variant_array out_y; + if (this->enable_y_axis_ascending && + internals::ascending_order_y(out_y, in_y, reordered_y)) + { + TECA_ERROR("Failed to put the y-axis in ascending order") + return teca_metadata(); + } + + // pass normalized coordinates + if (out_x) + { coords.set("x", out_x); - 
if ((out_y = this->internals->normalize_axis(in_y))) - coords.set("y", out_y); + // update the whole extent in case the coordinate axis touches the periodic boundary + if (out_x->size() != in_x->size()) + { + unsigned long whole_extent[6]; + if (out_md.get("whole_extent", whole_extent, 6)) + { + TECA_ERROR("Failed to get the input whole_extent") + return teca_metadata(); + } + whole_extent[1] -= 1; + out_md.set("whole_extent", whole_extent); + } + } - if ((out_z = this->internals->normalize_axis(in_z))) - coords.set("z", out_z); + if (out_y) + coords.set("y", out_y); - if (out_x || out_y || out_z) + if (out_x || out_y) + { + double bounds[6] = {0.0}; + teca_coordinate_util::get_cartesian_mesh_bounds( + out_x ? out_x : in_x, out_y ? out_y : in_y, in_z, + bounds); out_md.set("coordinates", coords); + out_md.set("bounds", bounds); + } + + if ((this->verbose > 1) && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + if (reordered_y) + TECA_STATUS("The y-axis will be transformed to be in ascending order.") + + if (shifted_x) + TECA_STATUS("The x-axis will be transformed from [-180, 180] to [0, 360].") + } return out_md; } @@ -310,6 +574,10 @@ std::vector teca_normalize_coordinates::get_upstream_request( unsigned int port, const std::vector &input_md, const teca_metadata &request) { +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_normalize_coordinates::get_upstream_request" << std::endl; +#endif (void)port; std::vector up_reqs; @@ -327,28 +595,50 @@ std::vector teca_normalize_coordinates::get_upstream_request( return up_reqs; } - p_teca_variant_array in_x, in_y, in_z; + p_teca_variant_array in_x, in_y, z; if (!(in_x = coords.get("x")) || !(in_y = coords.get("y")) - || !(in_z = coords.get("z"))) + || !(z = coords.get("z"))) { TECA_ERROR("metadata is missing coordinate arrays") return up_reqs; } - // now convert the original coordinate axes into the - // normalized system. this isn't cached for thread safety - p_teca_variant_array out_x, out_y, out_z; - out_x = this->internals->normalize_axis(in_x); - out_y = this->internals->normalize_axis(in_y); - out_z = this->internals->normalize_axis(in_z); + // ensure x-axis is in 0 to 360 + bool shifted_x = false; + p_teca_variant_array out_x; + p_teca_unsigned_long_array shift_map; + if (this->enable_periodic_shift_x && + internals::periodic_shift_x(out_x, shift_map, in_x, shifted_x)) + { + TECA_ERROR("Failed to apply periodic shift to the x-axis") + return up_reqs; + } + + // compute the inverse map + p_teca_unsigned_long_array inv_shift_map; + if (shifted_x && internals::inv_periodic_shift_x(inv_shift_map, out_x)) + { + TECA_ERROR("Failed to compute the inverse shifty map") + return up_reqs; + } - // normalized system is the same as the original, pass the request up - if (!out_x && !out_y && !out_z) + // ensure y-axis ascending + bool reordered_y = false; + p_teca_variant_array out_y; + if (this->enable_y_axis_ascending && + internals::ascending_order_y(out_y, in_y, reordered_y)) { - up_reqs.push_back(request); + TECA_ERROR("Failed to put the y-axis in ascending order") return up_reqs; } + // get the transformed bounds + const_p_teca_variant_array x = out_x ? out_x : in_x; + const_p_teca_variant_array y = out_y ? 
out_y : in_y; + + double bounds[6] = {0.0}; + teca_coordinate_util::get_cartesian_mesh_bounds(x, y, z, bounds); + // get the original extent unsigned long whole_extent[6] = {0}; if (input_md[0].get("whole_extent", whole_extent, 6)) @@ -359,35 +649,122 @@ std::vector teca_normalize_coordinates::get_upstream_request( // get the extent that is being requested unsigned long extent_in[6] = {0}; - unsigned long extent_out[6] = {0}; - double bounds[6] = {0.0}; - if (req.get("bounds", bounds, 6)) + double req_bounds[6] = {0.0}; + if (req.get("bounds", req_bounds, 6)) { - // bounds key not present, check for extent key - // if not present use whole_extent + // bounds key not present, check for extent key if not present use + // whole_extent if (request.get("extent", extent_in, 6)) + { + // correct in case we removed a duplicated point at the periodic + // boundary + if (out_x && (in_x->size() != out_x->size())) + whole_extent[1] -= 1; + memcpy(extent_in, whole_extent, 6*sizeof(unsigned long)); + } + + // convert extent to bounds + x->get(extent_in[0], req_bounds[0]); + x->get(extent_in[1], req_bounds[1]); + y->get(extent_in[2], req_bounds[2]); + y->get(extent_in[3], req_bounds[3]); + z->get(extent_in[4], req_bounds[4]); + z->get(extent_in[5], req_bounds[5]); } else { - // bounds key was present, convert the bounds to an - // an extent that covers them. - if (teca_coordinate_util::bounds_to_extent(bounds, - (out_x ? out_x : in_x), (out_y ? out_y : in_y), - (out_z ? out_z : in_z), extent_in)) - { - TECA_ERROR("invalid bounds requested.") - return up_reqs; - } - // remove the bounds request, which will force the reader to // use the given extent req.remove("bounds"); } - // apply the trsnaform if needed - this->internals->normalize_extent(out_x, out_y, out_z, - whole_extent, extent_in, extent_out); + // validate the requested bounds + if (!teca_coordinate_util::same_orientation(bounds, req_bounds) || + !teca_coordinate_util::covers(bounds, req_bounds)) + { + TECA_ERROR("Invalid request. The requested bounds [" + << req_bounds[0] << ", " << req_bounds[1] << ", " + << req_bounds[2] << ", " << req_bounds[3] << ", " + << req_bounds[4] << ", " << req_bounds[5] + << "] is not covered by the available bounds [" + << bounds[0] << ", " << bounds[1] << ", " + << bounds[2] << ", " << bounds[3] << ", " + << bounds[4] << ", " << bounds[5] << "]") + return up_reqs; + } + + // transform the bounds + double tfm_bounds[6]; + memcpy(tfm_bounds, req_bounds, 6*sizeof(double)); + + if (shifted_x) + { + // if a bounds request crosses the periodic boundary + // then it needs to be split into 2 requests. Eg: a request + // for [90, 270] becomes [-180, -90], [90, 180]. + // If this comes up a lot we could implement as follows: + // issue both requests here and merge the data in execute. + + if (((req_bounds[0] < 180.0) && (req_bounds[1] > 180.0)) || + teca_coordinate_util::equal(req_bounds[0], 180.0) || + teca_coordinate_util::equal(req_bounds[1], 180.0)) + { + // crosses periodic boundary (TODO handle subseting) + unsigned long x1 = in_x->size() - 1; + in_x->get(0, tfm_bounds[0]); + in_x->get(x1, tfm_bounds[1]); + + TECA_WARNING("The requested x-axis bounds" + " [" << req_bounds[0] << ", " << req_bounds[1] << "] cross a" + " periodic boundary. Subsetting across a periodic boundary is" + " not fully implemented. 
Requesting the entire x-axis [" + << tfm_bounds[0] << ", " << tfm_bounds[1] << "]") + } + else + { + tfm_bounds[0] = internals::inv_periodic_shift_x(tfm_bounds[0]); + tfm_bounds[1] = internals::inv_periodic_shift_x(tfm_bounds[1]); + } + } + + if (reordered_y) + { + std::swap(tfm_bounds[2], tfm_bounds[3]); + } + + // convert the transformed bounds to an + // an extent that covers them in the upstream coordinate system + unsigned long extent_out[6]; + memcpy(extent_out, extent_in, 6*sizeof(unsigned long)); + + if (teca_coordinate_util::bounds_to_extent(tfm_bounds, + in_x, in_y, z, extent_out) || + teca_coordinate_util::validate_extent(in_x->size(), + in_y->size(), z->size(), extent_out, true)) + { + TECA_ERROR("invalid bounds requested.") + return up_reqs; + } + +#ifdef TECA_DEBUG + std::cerr << "req_bounds = [" << req_bounds[0] + << ", " << req_bounds[1] << ", " << req_bounds[2] + << ", " << req_bounds[3] << ", " << req_bounds[4] + << ", " << req_bounds[5] << "]" << std::endl + << "tfm_bounds = [" << tfm_bounds[0] + << ", " << tfm_bounds[1] << ", " << tfm_bounds[2] + << ", " << tfm_bounds[3] << ", " << tfm_bounds[4] + << ", " << tfm_bounds[5] << "]" << std::endl + << "extent_in = [" << extent_in[0] + << ", " << extent_in[1] << ", " << extent_in[2] + << ", " << extent_in[3] << ", " << extent_in[4] + << ", " << extent_in[5] << "]" << std::endl + << "extent_out = [" << extent_out[0] + << ", " << extent_out[1] << ", " << extent_out[2] + << ", " << extent_out[3] << ", " << extent_out[4] + << ", " << extent_out[5] << "]" << std::endl; +#endif // send the request up req.set("extent", extent_out, 6); @@ -402,7 +779,8 @@ const_p_teca_dataset teca_normalize_coordinates::execute(unsigned int port, const teca_metadata &request) { #ifdef TECA_DEBUG - cerr << teca_parallel_id() << "teca_normalize_coordinates::execute" << endl; + std::cerr << teca_parallel_id() + << "teca_normalize_coordinates::execute" << std::endl; #endif (void)port; (void)request; @@ -413,7 +791,7 @@ const_p_teca_dataset teca_normalize_coordinates::execute(unsigned int port, if (!in_mesh) { - TECA_ERROR("Failed to compute l2 norm. 
dataset is not a teca_cartesian_mesh") + TECA_ERROR("The input dataset is not a teca_cartesian_mesh") return nullptr; } @@ -426,37 +804,98 @@ const_p_teca_dataset teca_normalize_coordinates::execute(unsigned int port, const_p_teca_variant_array in_y = in_mesh->get_y_coordinates(); const_p_teca_variant_array in_z = in_mesh->get_z_coordinates(); - // transform the axes to ascending order if needed - p_teca_variant_array out_x, out_y, out_z; - if ((out_x = this->internals->normalize_axis(in_x))) + // get the extent + unsigned long extent_in[6]; + in_mesh->get_extent(extent_in); + + unsigned long extent_out[6]; + memcpy(extent_out, extent_in, 6*sizeof(unsigned long)); + + // ensure x-axis is in 0 to 360 + bool shifted_x = false; + p_teca_variant_array out_x; + p_teca_unsigned_long_array shift_map; + if (this->enable_periodic_shift_x && + internals::periodic_shift_x(out_x, shift_map, in_x, shifted_x)) { - std::string var; - in_mesh->get_x_coordinate_variable(var); - out_mesh->set_x_coordinates(var, out_x); + TECA_ERROR("Failed to apply periodic shift to the x-axis") + return nullptr; } - if ((out_y = this->internals->normalize_axis(in_y))) + teca_metadata attributes; + + if (shifted_x) { + in_mesh->get_attributes(attributes); + + if (this->verbose && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_STATUS("The x-axis will be transformed from [-180, 180] to [0, 360].") + } + std::string var; - in_mesh->get_y_coordinate_variable(var); - out_mesh->set_y_coordinates(var, out_y); + in_mesh->get_x_coordinate_variable(var); + out_mesh->set_x_coordinates(var, out_x); + + // correct extent in case the coordinate axis touches the periodic boundary + if (out_x && (out_x->size() != in_x->size())) + { + if (teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_WARNING("The coordinate and data on the periodic boundary" + " at x = +/- 180 is duplicated.") + } + + extent_out[1] -= 1; + out_mesh->set_extent(extent_out); + + unsigned long whole_extent[6]; + in_mesh->get_whole_extent(whole_extent); + whole_extent[1] -= 1; + + out_mesh->set_whole_extent(whole_extent); + } + + if (internals::periodic_shift_x(out_mesh->get_point_arrays(), + attributes, shift_map, extent_in, extent_out)) + { + TECA_ERROR("Failed to apply periodic shift in the x direction") + return nullptr; + } } - if ((out_z = this->internals->normalize_axis(in_z))) + // ensure y-axis ascending + bool reordered_y = false; + p_teca_variant_array out_y; + if (this->enable_y_axis_ascending && + internals::ascending_order_y(out_y, in_y, reordered_y)) { - std::string var; - in_mesh->get_z_coordinate_variable(var); - out_mesh->set_z_coordinates(var, out_z); + TECA_ERROR("Failed to put the y-axis in ascending order") + return nullptr; } - // apply the same set of transforms to the data - if (out_x || out_y || out_z) + if (reordered_y) { - unsigned long extent[6]; - in_mesh->get_extent(extent); + if (attributes.empty()) + in_mesh->get_attributes(attributes); + + if (this->verbose && + teca_mpi_util::mpi_rank_0(this->get_communicator())) + { + TECA_STATUS("The y-axis will be transformed to be in ascending order.") + } - this->internals->normalize_variables(out_x.get(), - out_y.get(), out_z.get(), extent, out_mesh->get_point_arrays()); + std::string var; + in_mesh->get_y_coordinate_variable(var); + out_mesh->set_y_coordinates(var, out_y); + + if (internals::ascending_order_y(out_mesh->get_point_arrays(), + attributes, extent_out)) + { + TECA_ERROR("Failed to put point arrays into ascending order") + return nullptr; + } } return 
out_mesh;
diff --git a/alg/teca_normalize_coordinates.h b/alg/teca_normalize_coordinates.h
index 87d071603..265a269ab 100644
--- a/alg/teca_normalize_coordinates.h
+++ b/alg/teca_normalize_coordinates.h
@@ -10,12 +10,27 @@
TECA_SHARED_OBJECT_FORWARD_DECL(teca_normalize_coordinates)
-/// an algorithm to ensure that coordinates are in ascending order
-/**
-Transformations of coordinates and data to/from ascending order
-are made as data and information pass up and down stream through
-the algorithm.
-*/
+/** @brief
+ * An algorithm to ensure that Cartesian mesh coordinates follow conventions
+ *
+ * @details
+ * When enabled, transformations of coordinates and data are applied such that
+ * Cartesian meshes follow these conventions:
+ *
+ * 1. the x-axis coordinates are in the range of 0 to 360.
+ * 2. the y-axis coordinates are in ascending order.
+ *
+ * These transformations are automatically applied and can be enabled or
+ * disabled as needed. The properties enable_periodic_shift_x and
+ * enable_y_axis_ascending provide a way to enable/disable the transforms.
+ *
+ * Subset requests are not implemented when the periodic shift is enabled. When
+ * a request is made for data that crosses the periodic boundary, the request
+ * is modified to request the entire x-axis.
+ *
+ * If the data point on the periodic boundary is duplicated, the data at 180 is
+ * dropped and a warning is issued.
+ */
class teca_normalize_coordinates : public teca_algorithm
{
public:
@@ -29,6 +44,30 @@ class teca_normalize_coordinates : public teca_algorithm
TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION()
TECA_SET_ALGORITHM_PROPERTIES()
+ /** @name enable_periodic_shift_x
+ * If set, this enables an automatic transformation of the x-axis
+ * coordinates and data from [-180, 180] to [0, 360]. When enabled, the
+ * transformation is applied if the lowest x coordinate is less than 0 and
+ * skipped otherwise.
+ */
+ ///@{
+ TECA_ALGORITHM_PROPERTY(int, enable_periodic_shift_x)
+ ///@}
+
+ /** @name enable_y_axis_ascending
+ * If set, this enables an automatic transformation of the y-axis
+ * coordinates and data from descending to ascending order. The
+ * transformation is applied if the lowest y coordinate is greater than the
+ * highest y coordinate and skipped otherwise. Many TECA algorithms are written
+ * to process data with y-axis coordinates in ascending order, thus the
+ * transform is enabled by default. Setting this to 0 disables the
+ * transform for cases where it is desirable to pass data through
+ * unmodified.
+ */
+ ///@{
+ TECA_ALGORITHM_PROPERTY(int, enable_y_axis_ascending)
+ ///@}
+
protected:
teca_normalize_coordinates();
@@ -45,8 +84,8 @@ class teca_normalize_coordinates : public teca_algorithm
const teca_metadata &request) override;
private:
- struct internals_t;
- internals_t *internals;
+ int enable_periodic_shift_x;
+ int enable_y_axis_ascending;
};
#endif
diff --git a/alg/teca_parser.h b/alg/teca_parser.h
index 540d8db28..7e1703b0e 100644
--- a/alg/teca_parser.h
+++ b/alg/teca_parser.h
@@ -1,6 +1,8 @@
#ifndef teca_parser_h
#define teca_parser_h
+/// @file
+
#include "teca_common.h"
#include
@@ -42,14 +44,14 @@
<< "\" requires " << _nreq << " operands, given " \
<< _ngive << ". ", _expr, _pos)
+/// Codes dealing with expression parsing.
namespace teca_parser
{
-/**
-class that recognizes and extracts tokens during parsing.
-given a pointer (first argument) the methods return the -number of chars in the token, or 0 when the pointer doesn't -point to a valid token, and copies the token into the buffer -(second argument). +/** Recognizes and extracts tokens during parsing. + * given a pointer (first argument) the methods return the + * number of chars in the token, or 0 when the pointer doesn't + * point to a valid token, and copies the token into the buffer + * (second argument). */ class tokenizer { @@ -64,13 +66,12 @@ class tokenizer static unsigned int get_operator_precedence(char *op); }; -/** -convert infix expression to postfix. returns the postfix form -of the expression in a string allocated with malloc. caller to -free the string. return nullptr if there is an error. - -template types implement detection of classes of syntactical -tokens. groups, constants, variables, and operators. +/** Convert infix expression to postfix. returns the postfix form + * of the expression in a string allocated with malloc. caller to + * free the string. return nullptr if there is an error. + * + * template types implement detection of classes of syntactical + * tokens. groups, constants, variables, and operators. */ template char *infix_to_postfix(const char *iexpr, std::set *variables) @@ -191,15 +192,14 @@ char *infix_to_postfix(const char *iexpr, std::set *variables) return rpnexpr; } -/** -evaluate a postfix expression. returns non zero if an error occurred. -the result of the evaluted expression is returned in iexpr_result. - -template types define the intermediate types used in the calculation. -arg_t would likely be the const form of work_t. resolvers for constants, -variables, and operators are passed. The purpose of the resolvers is -to identify token class and implement variable lookup, and operator -evaluation. +/** evaluate a postfix expression. returns non zero if an error occurred. + * the result of the evaluated expression is returned in iexpr_result. + * + * template types define the intermediate types used in the calculation. + * arg_t would likely be the const form of work_t. resolvers for constants, + * variables, and operators are passed. The purpose of the resolvers is + * to identify token class and implement variable lookup, and operator + * evaluation. 
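+ * e.g. an infix expression such as (a + b) * c is first converted to
+ * postfix form by infix_to_postfix and the postfix form is then
+ * evaluated here using the supplied resolvers.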
*/ template diff --git a/alg/teca_rename_variables.cxx b/alg/teca_rename_variables.cxx new file mode 100644 index 000000000..16c95d9eb --- /dev/null +++ b/alg/teca_rename_variables.cxx @@ -0,0 +1,225 @@ +#include "teca_rename_variables.h" + +#include "teca_mesh.h" +#include "teca_array_collection.h" +#include "teca_variant_array.h" +#include "teca_metadata.h" +#include "teca_array_attributes.h" + +#include +#include +#include +#include +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +using std::string; +using std::vector; +using std::set; +using std::cerr; +using std::endl; + +//#define TECA_DEBUG + +// -------------------------------------------------------------------------- +teca_rename_variables::teca_rename_variables() : + original_variable_names(), new_variable_names() +{ + this->set_number_of_input_connections(1); + this->set_number_of_output_ports(1); +} + +// -------------------------------------------------------------------------- +teca_rename_variables::~teca_rename_variables() +{} + +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_rename_variables::get_properties_description( + const string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_rename_variables":prefix)); + + opts.add_options() + TECA_POPTS_MULTI_GET(std::vector, prefix, original_variable_names, + "Sets the list of original_variable_names to rename.") + TECA_POPTS_MULTI_GET(std::vector, prefix, new_variable_names, + "Sets the list of new names, one for each variable to rename.") + ; + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_rename_variables::set_properties( + const string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, std::vector, prefix, original_variable_names) + TECA_POPTS_SET(opts, std::vector, prefix, new_variable_names) + +} +#endif + +// -------------------------------------------------------------------------- +teca_metadata teca_rename_variables::get_output_metadata( + unsigned int port, + const std::vector &input_md) +{ +#ifdef TECA_DEBUG + cerr << teca_parallel_id() + << "teca_rename_variables::get_output_metadata" << endl; +#endif + (void)port; + + // validate the user provided values. 
+ if (this->original_variable_names.size() != this->new_variable_names.size()) + { + TECA_ERROR("Each variable to rename must have a " + " corresponding output_variable_name.") + return teca_metadata(); + } + + teca_metadata out_md(input_md[0]); + + // update the list of original_variable_names to reflect the new names + std::set out_vars; + if (out_md.get("variables", out_vars)) + { + TECA_ERROR("Failed to get the list of variables") + return teca_metadata(); + } + + unsigned long n_vars = this->original_variable_names.size(); + for (unsigned long i = 0; i < n_vars; ++i) + { + std::set::iterator it = out_vars.find(this->original_variable_names[i]); + if (it == out_vars.end()) + { + TECA_ERROR("No such variable \"" << this->original_variable_names[i] + << "\" to rename") + return teca_metadata(); + } + + out_vars.erase(it); + out_vars.insert(this->new_variable_names[i]); + } + + // update the list of attributes to reflect the new names + teca_metadata attributes; + if (out_md.get("attributes", attributes)) + { + TECA_ERROR("Failed to get attributes") + return teca_metadata(); + } + + for (unsigned long i = 0; i < n_vars; ++i) + { + const std::string &var_name = this->original_variable_names[i]; + + teca_metadata atts; + if (attributes.get(var_name, atts)) + { + TECA_ERROR("Failed to get attributes for \"" << var_name << "\"") + return teca_metadata(); + } + + attributes.remove(var_name); + + attributes.set(this->new_variable_names[i], atts); + } + + out_md.set("attributes", attributes); + + return out_md; +} + +// -------------------------------------------------------------------------- +std::vector teca_rename_variables::get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) +{ + (void)port; + (void)input_md; + + vector up_reqs; + + // copy the incoming request to preserve the downstream requirements. + // replace renamed original_variable_names with their original name + teca_metadata req(request); + + std::set arrays; + if (req.has("arrays")) + req.get("arrays", arrays); + + unsigned long n_vars = this->new_variable_names.size(); + for (unsigned long i = 0; i < n_vars; ++i) + { + std::set::iterator it = arrays.find(this->new_variable_names[i]); + if (it != arrays.end()) + { + arrays.erase(it); + arrays.insert(this->original_variable_names[i]); + } + + } + + req.set("arrays", arrays); + up_reqs.push_back(req); + + return up_reqs; +} + +// -------------------------------------------------------------------------- +const_p_teca_dataset teca_rename_variables::execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + cerr << teca_parallel_id() << "teca_rename_variables::execute" << endl; +#endif + (void)port; + (void)request; + + // get the input mesh + const_p_teca_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); + + if (!in_mesh) + { + TECA_ERROR("The input dataset is not a teca_mesh") + return nullptr; + } + + // create the output mesh, pass everything through. 
+ p_teca_mesh out_mesh = std::static_pointer_cast + (std::const_pointer_cast(in_mesh)->new_shallow_copy()); + + + // rename the arrays if they are found + p_teca_array_collection arrays = out_mesh->get_point_arrays(); + + unsigned long n_vars = this->original_variable_names.size(); + for (unsigned long i = 0; i < n_vars; ++i) + { + const std::string var_name = this->original_variable_names[i]; + + p_teca_variant_array array = arrays->get(var_name); + if (array) + { + arrays->remove(var_name); + arrays->set(this->new_variable_names[i], array); + } + } + + return out_mesh; +} diff --git a/alg/teca_rename_variables.h b/alg/teca_rename_variables.h new file mode 100644 index 000000000..24ebb7103 --- /dev/null +++ b/alg/teca_rename_variables.h @@ -0,0 +1,68 @@ +#ifndef teca_rename_variables_h +#define teca_rename_variables_h + +#include "teca_shared_object.h" +#include "teca_algorithm.h" +#include "teca_metadata.h" + +#include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_rename_variables) + +/// An algorithm that renames variables. +class teca_rename_variables : public teca_algorithm +{ +public: + TECA_ALGORITHM_STATIC_NEW(teca_rename_variables) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_rename_variables) + TECA_ALGORITHM_CLASS_NAME(teca_rename_variables) + ~teca_rename_variables(); + + // report/initialize to/from Boost program options + // objects. + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + + /** @name original_variable_names + * Set the list of variables to rename. For each variable to rename a new + * name must be specified at the same index in the new_variable_names + * list. The two lists must be the same length. + */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(std::string, original_variable_name) + ///@} + + /** @name new_variable_names + * Set the names of the renamed variables. The new names are applied to the + * list of variables to rename in the same order and the two lists must be + * the same length. 
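+ * e.g. (illustrative) original_variable_names = {"prw"} paired with
+ * new_variable_names = {"precipitable_water"} renames the array "prw"
+ * to "precipitable_water".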
+ */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(std::string, new_variable_name) + ///@} + +protected: + teca_rename_variables(); + +private: + teca_metadata get_output_metadata( + unsigned int port, + const std::vector &input_md) override; + + std::vector get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) override; + + const_p_teca_dataset execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) override; + +private: + std::vector original_variable_names; + std::vector new_variable_names; +}; + +#endif diff --git a/alg/teca_saffir_simpson.h b/alg/teca_saffir_simpson.h index 89a73c168..618f44827 100644 --- a/alg/teca_saffir_simpson.h +++ b/alg/teca_saffir_simpson.h @@ -1,44 +1,51 @@ #ifndef teca_saffir_simpson #define teca_saffir_simpson +/// @file + #include +/// Codes dealing with the Saffir-Simpson scale namespace teca_saffir_simpson { -// Saffir-Simpson scale prescribes the following limits: -// CAT wind km/h -// -1: 0- 63 : Tropical depression -// 0: 63-119 : Tropical storm -// 1: 119-153 km/h -// 2: 154-177 km/h -// 3: 178-208 km/h -// 4: 209-251 km/h -// 5: 252 km/h or higher +/** Saffir-Simpson scale prescribes the following limits: + * CAT wind km/h + * -1: 0- 63 : Tropical depression + * 0: 63-119 : Tropical storm + * 1: 119-153 km/h + * 2: 154-177 km/h + * 3: 178-208 km/h + * 4: 209-251 km/h + * 5: 252 km/h or higher + */ constexpr double low_wind_bound_kmph[] = {0.0, 63.0, 119.0, 154.0, 178.0, 209.0, 252.0}; -// get the high bound for the given class of storm +/// get the high bound for the given class of storm constexpr double high_wind_bound_kmph[] = {63.0, 119.0, 154.0, 178.0, 209.0, 252.0, std::numeric_limits::max()}; +/// get the lower bound for the given class of storm template constexpr n_t get_lower_bound_kmph(int c) { return low_wind_bound_kmph[++c]; } +/// get the higher bound for the given class of storm template constexpr n_t get_upper_bound_kmph(int c) { return high_wind_bound_kmph[++c]; } -// given wind speed in km/hr return Saffir-Simpson category -// NOTE: there is some ambiguity in the above as -// it's defined using integers. we are not converting -// to integer here. -// get the low bound for the given class of storm +/** given wind speed in km/hr return Saffir-Simpson category + * NOTE: there is some ambiguity in the above as + * it's defined using integers. we are not converting + * to integer here. + * get the low bound for the given class of storm + */ template int classify_kmph(n_t w) { @@ -62,25 +69,26 @@ int classify_kmph(n_t w) return 5; } -// get the low bound for the given class of storm +/// get the low bound for the given class of storm template constexpr n_t get_lower_bound_mps(int c) { return get_lower_bound_kmph(c)/n_t(3.6); } -// get the high bound for the given class of storm +/// get the high bound for the given class of storm template constexpr n_t get_upper_bound_mps(int c) { return get_upper_bound_kmph(c)/n_t(3.6); } -// given wind speed in km/hr return Saffir-Simpson category -// NOTE: there is some ambiguity in the above as -// it's defined using integers. we are not converting -// to integer here. -// get the low bound for the given class of storm +/** given wind speed in km/hr return Saffir-Simpson category + * NOTE: there is some ambiguity in the above as + * it's defined using integers. we are not converting + * to integer here. 
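+ * e.g. a wind speed of 36 m/s is roughly 130 km/h, which falls in the
+ * 119-153 km/h band and is classified as category 1.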
+ * get the low bound for the given class of storm + */ template int classify_mps(n_t w) { diff --git a/alg/teca_temporal_average.cxx b/alg/teca_simple_moving_average.cxx similarity index 84% rename from alg/teca_temporal_average.cxx rename to alg/teca_simple_moving_average.cxx index 3e19f32c9..3e4e4eb8f 100644 --- a/alg/teca_temporal_average.cxx +++ b/alg/teca_simple_moving_average.cxx @@ -1,4 +1,4 @@ -#include "teca_temporal_average.h" +#include "teca_simple_moving_average.h" #include "teca_mesh.h" #include "teca_array_collection.h" @@ -21,7 +21,7 @@ using std::endl; //#define TECA_DEBUG // -------------------------------------------------------------------------- -teca_temporal_average::teca_temporal_average() +teca_simple_moving_average::teca_simple_moving_average() : filter_width(3), filter_type(backward) { this->set_number_of_input_connections(1); @@ -29,16 +29,16 @@ teca_temporal_average::teca_temporal_average() } // -------------------------------------------------------------------------- -teca_temporal_average::~teca_temporal_average() +teca_simple_moving_average::~teca_simple_moving_average() {} #if defined(TECA_HAS_BOOST) // -------------------------------------------------------------------------- -void teca_temporal_average::get_properties_description( +void teca_simple_moving_average::get_properties_description( const string &prefix, options_description &global_opts) { options_description opts("Options for " - + (prefix.empty()?"teca_temporal_average":prefix)); + + (prefix.empty()?"teca_simple_moving_average":prefix)); opts.add_options() TECA_POPTS_GET(unsigned int, prefix, filter_width, @@ -47,20 +47,24 @@ void teca_temporal_average::get_properties_description( "use a backward(0), forward(1) or centered(2) stencil") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } // -------------------------------------------------------------------------- -void teca_temporal_average::set_properties( +void teca_simple_moving_average::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, unsigned int, prefix, filter_width) TECA_POPTS_SET(opts, int, prefix, filter_type) } #endif // -------------------------------------------------------------------------- -std::vector teca_temporal_average::get_upstream_request( +std::vector teca_simple_moving_average::get_upstream_request( unsigned int port, const std::vector &input_md, const teca_metadata &request) @@ -80,7 +84,7 @@ std::vector teca_temporal_average::get_upstream_request( break; } cerr << teca_parallel_id() - << "teca_temporal_average::get_upstream_request filter_type=" + << "teca_simple_moving_average::get_upstream_request filter_type=" << type << endl; #endif (void) port; @@ -128,38 +132,42 @@ std::vector teca_temporal_average::get_upstream_request( TECA_ERROR("Invalid \"filter_type\" " << this->filter_type) return up_reqs; } + first = std::max(0l, first); + last = std::min(num_steps - 1, last); + // make a request for each time that will be used in the + // average for (long i = first; i <= last; ++i) { - // make a request for each time that will be used in the - // average - if ((i >= 0) && (i < num_steps)) - { + teca_metadata up_req(request); + up_req.set("time_step", i); + up_reqs.push_back(up_req); + } + #ifdef TECA_DEBUG - cerr << teca_parallel_id() - << "request time_step " << i << endl; + cerr << teca_parallel_id() << "processing " << active_step + << " request " << first << " - " << last << endl; 
#endif - teca_metadata up_req(request); - up_req.set("time_step", i); - up_reqs.push_back(up_req); - } - } return up_reqs; } // -------------------------------------------------------------------------- -const_p_teca_dataset teca_temporal_average::execute( +const_p_teca_dataset teca_simple_moving_average::execute( unsigned int port, const std::vector &input_data, const teca_metadata &request) { #ifdef TECA_DEBUG cerr << teca_parallel_id() - << "teca_temporal_average::execute" << endl; + << "teca_simple_moving_average::execute" << endl; #endif (void)port; + // nothing to do + if ((input_data.size() < 1) || !input_data[0]) + return nullptr; + // create output and copy metadata, coordinates, etc p_teca_mesh out_mesh = std::dynamic_pointer_cast(input_data[0]->new_instance()); diff --git a/alg/teca_temporal_average.h b/alg/teca_simple_moving_average.h similarity index 62% rename from alg/teca_temporal_average.h rename to alg/teca_simple_moving_average.h index ca00c5c40..5b2f82d63 100644 --- a/alg/teca_temporal_average.h +++ b/alg/teca_simple_moving_average.h @@ -1,5 +1,5 @@ -#ifndef teca_temporal_average_h -#define teca_temporal_average_h +#ifndef teca_simple_moving_average_h +#define teca_simple_moving_average_h #include "teca_shared_object.h" #include "teca_algorithm.h" @@ -8,7 +8,7 @@ #include #include -TECA_SHARED_OBJECT_FORWARD_DECL(teca_temporal_average) +TECA_SHARED_OBJECT_FORWARD_DECL(teca_simple_moving_average) /// an algorithm that averages data in time /** @@ -16,33 +16,41 @@ an algorithm that averages data in time. filter_width controls the number of time steps to average over. all arrays in the input data are processed. */ -class teca_temporal_average : public teca_algorithm +class teca_simple_moving_average : public teca_algorithm { public: - TECA_ALGORITHM_STATIC_NEW(teca_temporal_average) - TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_temporal_average) - TECA_ALGORITHM_CLASS_NAME(teca_temporal_average) - ~teca_temporal_average(); + TECA_ALGORITHM_STATIC_NEW(teca_simple_moving_average) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_simple_moving_average) + TECA_ALGORITHM_CLASS_NAME(teca_simple_moving_average) + ~teca_simple_moving_average(); // report/initialize to/from Boost program options // objects. TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the number of steps to average. should be odd. + /** @name filter_width + * set the number of steps to average. should be odd. 
+ */ + ///@{ TECA_ALGORITHM_PROPERTY(unsigned int, filter_width) + ///@} - // select the filter stencil, default is backward + /** @name filter_type + * select the filter stencil, default is backward + */ + ///@{ enum { backward, centered, forward }; TECA_ALGORITHM_PROPERTY(int, filter_type) + ///@} protected: - teca_temporal_average(); + teca_simple_moving_average(); private: std::vector get_upstream_request( diff --git a/alg/teca_table_calendar.cxx b/alg/teca_table_calendar.cxx index 79768f323..57f5ef945 100644 --- a/alg/teca_table_calendar.cxx +++ b/alg/teca_table_calendar.cxx @@ -16,7 +16,7 @@ #include #endif #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #if defined(TECA_HAS_MPI) #include @@ -73,6 +73,8 @@ void teca_table_calendar::get_properties_description( "prepended to all output column names") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -80,6 +82,8 @@ void teca_table_calendar::get_properties_description( void teca_table_calendar::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, units) TECA_POPTS_SET(opts, std::string, prefix, calendar) TECA_POPTS_SET(opts, std::string, prefix, time_column) @@ -270,7 +274,7 @@ const_p_teca_dataset teca_table_calendar::execute( int curr_minute = 0; double curr_second = 0; - if (calcalcs::date(curr_time[i], &curr_year, &curr_month, + if (teca_calcalcs::date(curr_time[i], &curr_year, &curr_month, &curr_day, &curr_hour, &curr_minute, &curr_second, units.c_str(), calendar.c_str())) { diff --git a/alg/teca_table_calendar.h b/alg/teca_table_calendar.h index 3f58ec4c5..fbc0cd494 100644 --- a/alg/teca_table_calendar.h +++ b/alg/teca_table_calendar.h @@ -10,21 +10,24 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_calendar) -/// an algorithm that transforms NetCDF CF-2 time -/// variable into an absolute date. -/** -Transform NetCDF CF-2 time variable into an absolute -date. By default the "time" column is used, but this -can be over road by set_active_column methods. the -table must have temporal metadata containing base date -and calendar units following the CF-2 convention. -the output table will contain year,month,day,hours, -minutes columns. - -NOTE: this should be used in serial, as the udunits -package loads an xml file in each instance. The -CalCalcs package also has thread safety issues. -*/ +/** @brief + * An algorithm that transforms NetCDF CF-2 time + * variable into an absolute date. + * + * @details + * Transform NetCDF CF-2 time variable into an absolute + * date. By default the "time" column is used, but this + * can be over road by set_active_column methods. the + * table must have temporal metadata containing base date + * and calendar units following the CF-2 convention. + * the output table will contain year,month,day,hours, + * minutes columns. + * + * @note + * This should be used in serial, as the UDUNITS + * package loads an XML file in each instance. The + * CalCalcs package also has thread safety issues. 
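+ *
+ * e.g. with calendar "standard" and units "days since 2000-01-01", a time
+ * value of 180.5 converts to year 2000, month 6, day 29, hour 12.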
+ */ class teca_table_calendar : public teca_algorithm { public: diff --git a/alg/teca_table_reduce.h b/alg/teca_table_reduce.h index 2740494d6..6add595c6 100644 --- a/alg/teca_table_reduce.h +++ b/alg/teca_table_reduce.h @@ -2,7 +2,7 @@ #define teca_table_reduce_h #include "teca_shared_object.h" -#include "teca_dataset_fwd.h" +#include "teca_dataset.h" #include "teca_metadata.h" #include "teca_index_reduce.h" @@ -11,12 +11,11 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_reduce) -// a reduction on tabular data over time steps +/// A reduction on tabular data over time steps. /** -a reduction on tabular data over time steps. -tabular data from each time step is collected and -concatenated into a big table. -*/ + * Tabular data from each time step is collected and + * concatenated into a big table. + */ class teca_table_reduce : public teca_index_reduce { public: diff --git a/alg/teca_table_region_mask.cxx b/alg/teca_table_region_mask.cxx index 1b5b9bed9..75bbc37a8 100644 --- a/alg/teca_table_region_mask.cxx +++ b/alg/teca_table_region_mask.cxx @@ -17,7 +17,7 @@ #include #endif #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #if defined(TECA_HAS_MPI) #include @@ -49,11 +49,11 @@ void teca_table_region_mask::get_properties_description( opts.add_options() TECA_POPTS_GET(std::string, prefix, x_coordinate_column, - "name of the column containing x cooridnates. default \"lon\"") + "name of the column containing x cooridnates.") TECA_POPTS_GET(std::string, prefix, y_coordinate_column, - "name of the column containing y cooridnates. default \"lat\"") + "name of the column containing y cooridnates.") TECA_POPTS_GET(std::string, prefix, result_column, - "name of the column to store the mask in. default \"region_mask\"") + "name of the column to store the mask in.") TECA_POPTS_MULTI_GET(std::vector, prefix, region_sizes, "the number of points in each region") TECA_POPTS_MULTI_GET(std::vector, prefix, region_x_coordinates, @@ -62,6 +62,8 @@ void teca_table_region_mask::get_properties_description( "list of y coordinates describing the regions") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -69,6 +71,8 @@ void teca_table_region_mask::get_properties_description( void teca_table_region_mask::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, x_coordinate_column) TECA_POPTS_SET(opts, std::string, prefix, y_coordinate_column) TECA_POPTS_SET(opts, std::string, prefix, result_column) diff --git a/alg/teca_table_region_mask.h b/alg/teca_table_region_mask.h index 3b3f7dafc..434bfdce6 100644 --- a/alg/teca_table_region_mask.h +++ b/alg/teca_table_region_mask.h @@ -10,13 +10,16 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_region_mask) -/** - an algorithm that identifies rows in the table that are -inside the list of regions provided. a new column, called -the mask column is created. It has 1's if the row is in -the set of regions, otherwise 0's. The invert property -can be used to invert the result. -*/ +/** @brief + * An algorithm that identifies rows in the table that are + * inside the list of regions provided. + * + * @details + * A new column, called the mask column is created. + * It has 1's if the row is in the set of regions, + * otherwise 0's. The invert property + * can be used to invert the result. 
+ */ class teca_table_region_mask : public teca_algorithm { public: @@ -37,7 +40,7 @@ class teca_table_region_mask : public teca_algorithm // set the name of the column to store the mask in // the mask is a column of 1 and 0 indicating if the - // row satsifies the criteria or not. the default is + // row satisfies the criteria or not. the default is // "region_mask" TECA_ALGORITHM_PROPERTY(std::string, result_column); diff --git a/alg/teca_table_remove_rows.cxx b/alg/teca_table_remove_rows.cxx index 986023cc4..6840f8641 100644 --- a/alg/teca_table_remove_rows.cxx +++ b/alg/teca_table_remove_rows.cxx @@ -17,7 +17,7 @@ #include #endif #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #if defined(TECA_HAS_MPI) #include @@ -56,6 +56,8 @@ void teca_table_remove_rows::get_properties_description( "when set columns used in the calculation are removed from output") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -63,6 +65,8 @@ void teca_table_remove_rows::get_properties_description( void teca_table_remove_rows::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, mask_expression) TECA_POPTS_SET(opts, int, prefix, remove_dependent_variables) } diff --git a/alg/teca_table_remove_rows.h b/alg/teca_table_remove_rows.h index 543b9eada..882f3b259 100644 --- a/alg/teca_table_remove_rows.h +++ b/alg/teca_table_remove_rows.h @@ -10,23 +10,24 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_remove_rows) -/** -an algorithm that removes rows from a table where -a given expression evaluates to true. - -the expression parser supports the following operations: - +,-,*,/,%,<.<=,>,>=,==,!=,&&,||.!,? - -grouping in the expression is denoted in the usual -way: () - -constants in the expression are expanded to full length -arrays and can be typed. The supported types are: - d,f,L,l,i,s,c -coresponding to double,float,long long, long, int, -short and char repsectively. integer types can be -unsigned by including u after the code. -*/ +/** @brief + * An algorithm that removes rows from a table where + * a given expression evaluates to true. + * + * @details + * The expression parser supports the following operations: + * +,-,*,/,%,<.<=,>,>=,==,!=,&&,||.!,? + * + * Grouping in the expression is denoted in the usual + * way: () + * + * Constants in the expression are expanded to full length + * arrays and can be typed. The supported types are: + * d,f,L,l,i,s,c + * Corresponding to double,float, long long, long, int, + * short and char respectively. Integer types can be + * unsigned by including u after the code. + */ class teca_table_remove_rows : public teca_algorithm { public: @@ -40,17 +41,27 @@ class teca_table_remove_rows : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the expression to use to determine which rows - // are removed. rows are removed where the expression - // evaluates true. + /** @name mask_expression + * set the expression to use to determine which rows are removed. rows are + * removed where the expression evaluates true. + */ + ///@{ + /// Set the mask expression void set_mask_expression(const std::string &expr); + /// Get the mask expression std::string get_mask_expression() { return this->mask_expression; } + ///@} - // when set columns used in the calculation are removed - // from the output. deault off. 
+ /** @name remove_dependent_variables + * when set columns used in the calculation are removed from the output. + * default off. + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, remove_dependent_variables) + ///@} + protected: teca_table_remove_rows(); diff --git a/alg/teca_table_sort.cxx b/alg/teca_table_sort.cxx index e85daabbb..ef8fae195 100644 --- a/alg/teca_table_sort.cxx +++ b/alg/teca_table_sort.cxx @@ -76,6 +76,8 @@ void teca_table_sort::get_properties_description( "if set a stable sort will be used") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -83,6 +85,8 @@ void teca_table_sort::get_properties_description( void teca_table_sort::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, index_column) TECA_POPTS_SET(opts, int, prefix, index_column_id) TECA_POPTS_SET(opts, int, prefix, stable_sort) diff --git a/alg/teca_table_to_stream.cxx b/alg/teca_table_to_stream.cxx index 58b15a108..f9ee2cc84 100644 --- a/alg/teca_table_to_stream.cxx +++ b/alg/teca_table_to_stream.cxx @@ -54,6 +54,9 @@ void teca_table_to_stream::get_properties_description( TECA_POPTS_GET(std::string, prefix, stream, "name of stream to send output to. stderr, stdout") ; + + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -61,6 +64,8 @@ void teca_table_to_stream::get_properties_description( void teca_table_to_stream::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, header) TECA_POPTS_SET(opts, std::string, prefix, footer) TECA_POPTS_SET(opts, std::string, prefix, stream) @@ -91,6 +96,25 @@ void teca_table_to_stream::set_stream(const std::string &s) } } +// -------------------------------------------------------------------------- +std::string teca_table_to_stream::get_stream() +{ + if (this->stream == &std::cerr) + { + return "stderr"; + } + else if (this->stream == &std::cout) + { + return "stdout"; + } + else if (!this->stream) + { + return "null"; + } + + return "unknown"; +} + // -------------------------------------------------------------------------- void teca_table_to_stream::set_stream_to_stderr() { diff --git a/alg/teca_table_to_stream.h b/alg/teca_table_to_stream.h index c2fcd631c..c88c6d747 100644 --- a/alg/teca_table_to_stream.h +++ b/alg/teca_table_to_stream.h @@ -11,8 +11,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_to_stream) -/// an algorithm that serializes a table to a c++ stream object. -/// This is primarilly useful for debugging. +/// An algorithm that serializes a table to a C++ stream object. 
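The recurring two-line additions in the .cxx hunks above route each algorithm's Boost program_options handling through the teca_algorithm base class, presumably so that properties shared by all algorithms (such as verbose, which this patch removes from teca_valid_value_mask) are reported and set under the same prefix. A schematic of the pattern, using a hypothetical teca_example class with a single string property:

void teca_example::get_properties_description(
    const std::string &prefix, options_description &global_opts)
{
    options_description opts("Options for "
        + (prefix.empty()?"teca_example":prefix));

    opts.add_options()
        TECA_POPTS_GET(std::string, prefix, some_variable,
            "name of the array to process")
        ;

    // forward to the base class so shared properties are also reported
    this->teca_algorithm::get_properties_description(prefix, opts);

    global_opts.add(opts);
}

void teca_example::set_properties(
    const std::string &prefix, variables_map &opts)
{
    // let the base class consume its properties first
    this->teca_algorithm::set_properties(prefix, opts);

    TECA_POPTS_SET(opts, std::string, prefix, some_variable)
}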
class teca_table_to_stream : public teca_algorithm { public: @@ -40,6 +39,9 @@ class teca_table_to_stream : public teca_algorithm void set_stream_to_stderr(); void set_stream_to_stdout(); + // get the stream name + std::string get_stream(); + protected: teca_table_to_stream(); diff --git a/alg/teca_tc_candidates.cxx b/alg/teca_tc_candidates.cxx index 76ac71657..b08eede71 100644 --- a/alg/teca_tc_candidates.cxx +++ b/alg/teca_tc_candidates.cxx @@ -4,7 +4,6 @@ #include "teca_variant_array.h" #include "teca_table.h" #include "teca_database.h" -#include "teca_calendar.h" #include "teca_coordinate_util.h" #include "gfdl_tc_candidates.h" @@ -71,34 +70,36 @@ void teca_tc_candidates::get_properties_description( "name of core temperature variable") TECA_POPTS_GET(double, prefix, max_core_radius, "maximum number of degrees latitude separation between " - "vorticity max and pressure min defining a storm (2.0)") + "vorticity max and pressure min defining a storm") TECA_POPTS_GET(double, prefix, min_vorticity_850mb, - "minimum vorticty to be considered a tropical storm (1.6e-4)") + "minimum vorticty to be considered a tropical storm") TECA_POPTS_GET(double, prefix, vorticity_850mb_window, "size of the search window in degrees. storms core must have a " - "local vorticity max centered on this window (7.74446)") + "local vorticity max centered on this window") TECA_POPTS_GET(double, prefix, max_pressure_delta, - "maximum pressure change within specified radius (400.0)") + "maximum pressure change within specified radius") TECA_POPTS_GET(double, prefix, max_pressure_radius, - "radius in degrees over which max pressure change is computed (5.0)") + "radius in degrees over which max pressure change is computed") TECA_POPTS_GET(double, prefix, max_core_temperature_delta, - "maximum core temperature change over the specified radius (0.8)") + "maximum core temperature change over the specified radius") TECA_POPTS_GET(double, prefix, max_core_temperature_radius, - "radius in degrees over which max core temperature change is computed (5.0)") + "radius in degrees over which max core temperature change is computed") TECA_POPTS_GET(double, prefix, max_thickness_delta, - "maximum thickness change over the specified radius (50.0)") + "maximum thickness change over the specified radius") TECA_POPTS_GET(double, prefix, max_thickness_radius, - "radius in degrees over with max thickness change is comuted (4.0)") + "radius in degrees over with max thickness change is comuted") TECA_POPTS_GET(double, prefix, search_lat_low, - "lowest latitude in degrees to search for storms (-80.0)") + "lowest latitude in degrees to search for storms") TECA_POPTS_GET(double, prefix, search_lat_high, - "highest latitude in degrees to search for storms (80.0)") + "highest latitude in degrees to search for storms") TECA_POPTS_GET(double, prefix, search_lon_low, - "lowest longitude in degrees to search for stroms (1)") + "lowest longitude in degrees to search for stroms") TECA_POPTS_GET(double, prefix, search_lon_high, - "highest longitude in degrees to search for storms (0)") + "highest longitude in degrees to search for storms") ; + this->teca_algorithm::get_properties_description(prefix, opts); + opts.add(ard_opts); } @@ -106,6 +107,8 @@ void teca_tc_candidates::get_properties_description( void teca_tc_candidates::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, surface_wind_speed_variable) TECA_POPTS_SET(opts, std::string, 
prefix, vorticity_850mb_variable) TECA_POPTS_SET(opts, std::string, prefix, sea_level_pressure_variable) @@ -453,8 +456,9 @@ const_p_teca_dataset teca_tc_candidates::execute(unsigned int port, cerr << std::endl; #endif seconds_t dt(t1 - t0); - TECA_STATUS("teca_tc_candidates step=" << time_step - << " t=" << time_offset << ", dt=" << dt.count() << " sec") + + TECA_STATUS("At step " << time_step << " time " << time_offset << " " + << n_candidates << " candidates detected in " << dt.count() << " seconds") return out_table; } diff --git a/alg/teca_tc_candidates.h b/alg/teca_tc_candidates.h index 85b1dcdcb..7c45c50a5 100644 --- a/alg/teca_tc_candidates.h +++ b/alg/teca_tc_candidates.h @@ -10,41 +10,42 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_tc_candidates) +/// GFDL tropical storms detection algorithm. /** -GFDL tropical storms detection algorithm -for more information see -"Seasonal forecasting of tropical storms using coupled GCM integrations" - - --- INPUT - Gwind - wind speed at 850 mb - Gvort - vorticity_850mb at 850 mb - Gtbar - mean core_temperature for warm core layer - Gpsl - sea level sea_level_pressure - Gthick - thickness of 200 to 1000 mb layer - Grlon - longitudes - Grlat - latitudes - iyear - year - imon - month - iday - day of month - ihour - hour - iucy - unit for output - - --- OUTPUT - --- record # 1 - num0 - day - imon0 - month - iyear - year - number - number of cyclones found - --- records # 2...number+1 - idex, jdex - (i,j) index of cyclone - svort_max - max vorticity_850mb - swind_max - max wind - spsl_min - min sea level sea_level_pressure - svort_lon, svort_lat - longitude & latitude of max vorticity_850mb - spsl_lon, spsl_lat - longitude & latitude of min slp - stemperature_lon, stemperature_lat - longitude & latitude of warm core - sthick_lon, sthick_lat - longitude & latitude of max thickness -*/ + * For more information see + * "Seasonal forecasting of tropical storms using coupled GCM integrations" + * + * --- INPUT + * Gwind - wind speed at 850 mb + * Gvort - vorticity_850mb at 850 mb + * Gtbar - mean core_temperature for warm core layer + * Gpsl - sea level sea_level_pressure + * Gthick - thickness of 200 to 1000 mb layer + * Grlon - longitudes + * Grlat - latitudes + * iyear - year + * imon - month + * iday - day of month + * ihour - hour + * iucy - unit for output + * + * --- OUTPUT + * --- record # 1 + * num0 - day + * imon0 - month + * iyear - year + * number - number of cyclones found + * --- records # 2...number+1 + * idex, jdex - (i,j) index of cyclone + * svort_max - max vorticity_850mb + * swind_max - max wind + * spsl_min - min sea level sea_level_pressure + * svort_lon, svort_lat - longitude & latitude of max vorticity_850mb + * spsl_lon, spsl_lat - longitude & latitude of min slp + * stemperature_lon, stemperature_lat - longitude & latitude of warm + * core + * sthick_lon, sthick_lat - longitude & latitude of max thickness + */ class teca_tc_candidates : public teca_algorithm { public: @@ -85,19 +86,19 @@ class teca_tc_candidates : public teca_algorithm TECA_ALGORITHM_PROPERTY(double, max_thickness_radius) // set/get the bounding box to search for storms - // in units of degreees lat,lon + // in units of degrees lat,lon TECA_ALGORITHM_PROPERTY(double, search_lat_low) TECA_ALGORITHM_PROPERTY(double, search_lat_high) TECA_ALGORITHM_PROPERTY(double, search_lon_low) TECA_ALGORITHM_PROPERTY(double, search_lon_high) // set/get the number of iterations to search for the - // storm local minimum. 
raising this paramter might increase - // detections but the detector will run slowerd. default is + // storm local minimum. raising this parameter might increase + // detections but the detector will run slower. default is // 50. TECA_ALGORITHM_PROPERTY(int, minimizer_iterations) - // send humand readable representation to the + // send human readable representation to the // stream virtual void to_stream(std::ostream &os) const override; diff --git a/alg/teca_tc_classify.cxx b/alg/teca_tc_classify.cxx index 42ceca00e..503c58100 100644 --- a/alg/teca_tc_classify.cxx +++ b/alg/teca_tc_classify.cxx @@ -17,7 +17,7 @@ #include #endif #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #if defined(TECA_HAS_MPI) #include @@ -81,6 +81,8 @@ void teca_tc_classify::get_properties_description( "each region. if not provided names are generated from ids") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -88,6 +90,8 @@ void teca_tc_classify::get_properties_description( void teca_tc_classify::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, track_id_column) TECA_POPTS_SET(opts, std::string, prefix, time_column) TECA_POPTS_SET(opts, std::string, prefix, surface_wind_column) diff --git a/alg/teca_tc_classify.h b/alg/teca_tc_classify.h index efec9e852..1f2ae884a 100644 --- a/alg/teca_tc_classify.h +++ b/alg/teca_tc_classify.h @@ -12,12 +12,12 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_tc_classify) /// an algorithm that classifies storms using Saphire-Simpson scale /** -An algorithm that classifies storms using Saphire-Simpson scale -a column containing the classification is added to the output - -An algorithm that sorts the storms by geographic region -and category. tyhe output is a table where regions is -mapped to columns and category is mapped to rows. + * An algorithm that classifies storms using Saphire-Simpson scale a column + * containing the classification is added to the output + * + * An algorithm that sorts the storms by geographic region and category. tyhe + * output is a table where regions is mapped to columns and category is mapped to +rows. 
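Classification on the Saffir-Simpson scale keys off peak sustained surface wind. A minimal sketch using the commonly quoted transition speeds in m/s; the exact thresholds TECA applies may differ, and the 17 m/s tropical storm floor is borrowed from the min_wind_speed default noted later in this patch.

// returns -1 below tropical storm strength, 0 for a tropical storm,
// 1..5 for hurricane categories. thresholds are approximate m/s values.
int saffir_simpson_category(double wind_ms)
{
    if (wind_ms >= 70.0) return 5;
    if (wind_ms >= 58.0) return 4;
    if (wind_ms >= 50.0) return 3;
    if (wind_ms >= 43.0) return 2;
    if (wind_ms >= 33.0) return 1;
    if (wind_ms >= 17.0) return 0;   // cf. the min_wind_speed tracking criterion
    return -1;
}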
*/ class teca_tc_classify : public teca_algorithm { diff --git a/alg/teca_tc_trajectory.cxx b/alg/teca_tc_trajectory.cxx index 61889b7a3..a6b274c11 100644 --- a/alg/teca_tc_trajectory.cxx +++ b/alg/teca_tc_trajectory.cxx @@ -38,10 +38,12 @@ int teca_tc_trajectory(var_t r_crit, var_t wind_crit, double n_wind_crit, const int *storm_uid, const coord_t *d_lon, const coord_t *d_lat, const var_t *wind_max, const var_t *vort_max, const var_t *psl, const int *have_twc, const int *have_thick, const var_t *twc_max, - const var_t *thick_max, unsigned long n_rows, p_teca_table track_table) + const var_t *thick_max, unsigned long n_rows, p_teca_table track_table, + unsigned long &n_tracks) { const coord_t DEG_TO_RAD = M_PI/180.0; unsigned long track_id = 0; + n_tracks = 0; // convert from dsegrees to radians unsigned long nbytes = n_rows*sizeof(coord_t); @@ -218,6 +220,8 @@ int teca_tc_trajectory(var_t r_crit, var_t wind_crit, double n_wind_crit, free(r_lat); free(available); + n_tracks = track_id + 1; + return 0; } }; @@ -248,16 +252,18 @@ void teca_tc_trajectory::get_properties_description( opts.add_options() TECA_POPTS_GET(double, prefix, max_daily_distance, - "max distance a storm can move on the same track in single day (1600 km)") + "max distance a storm can move on the same track in single day") TECA_POPTS_GET(double, prefix, min_wind_speed, - "minimum wind speed to be worthy of tracking (17.0 ms^-1)") + "minimum wind speed to be worthy of tracking") TECA_POPTS_GET(double, prefix, min_wind_duration, "minimum number of, not necessarily consecutive, days thickness, " - "core temp, and wind speed criteria must be satisfied (2.0 days)") + "core temp, and wind speed criteria must be satisfied") TECA_POPTS_GET(unsigned long, prefix, step_interval, - "number of time steps between valid candidate data. (1 step)") + "number of time steps between valid candidate data.") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -265,6 +271,8 @@ void teca_tc_trajectory::get_properties_description( void teca_tc_trajectory::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, double, prefix, max_daily_distance) TECA_POPTS_SET(opts, double, prefix, min_wind_speed) TECA_POPTS_SET(opts, double, prefix, min_wind_duration) @@ -405,7 +413,18 @@ const_p_teca_dataset teca_tc_trajectory::execute( } unsigned long n_rows = candidates->get_number_of_rows(); + + // check that there are some candidates to work with. 
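The max_daily_distance criterion described in the options above needs a distance between candidate positions on consecutive days. A standalone sketch of that check using the haversine formula; the spherical Earth radius and the exact distance formula the tracker uses are assumptions.

#include <cmath>

// great circle distance in km between two (lat, lon) points given in degrees,
// assuming a spherical Earth of radius 6371 km.
double haversine_km(double lat0, double lon0, double lat1, double lon1)
{
    const double deg_to_rad = M_PI/180.0;
    const double earth_radius_km = 6371.0;

    double phi0 = lat0*deg_to_rad;
    double phi1 = lat1*deg_to_rad;
    double dphi = (lat1 - lat0)*deg_to_rad;
    double dlam = (lon1 - lon0)*deg_to_rad;

    double a = std::sin(dphi/2.0)*std::sin(dphi/2.0)
        + std::cos(phi0)*std::cos(phi1)*std::sin(dlam/2.0)*std::sin(dlam/2.0);

    return 2.0*earth_radius_km*std::asin(std::sqrt(a));
}

// a candidate can extend an existing track only if it moved no farther than
// max_daily_distance (1600 km by default) since the previous day.
bool can_extend_track(double lat0, double lon0, double lat1, double lon1,
    double max_daily_distance_km)
{
    return haversine_km(lat0, lon0, lat1, lon1) <= max_daily_distance_km;
}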
+ if (n_rows < 1) + { + TECA_ERROR("Failed to form TC tracks because there were no candiates") + return nullptr; + } + + unsigned long n_tracks = 0; + std::chrono::high_resolution_clock::time_point t0, t1; + t0 = std::chrono::high_resolution_clock::now(); NESTED_TEMPLATE_DISPATCH_FP(const teca_variant_array_impl, lon.get(), _COORD, @@ -445,24 +464,25 @@ const_p_teca_dataset teca_tc_trajectory::execute( dynamic_cast(thick_max.get())->get(); // invoke the track finder - t0 = std::chrono::high_resolution_clock::now(); if (internal::teca_tc_trajectory( static_cast(this->max_daily_distance), static_cast(this->min_wind_speed), this->min_wind_duration, this->step_interval, p_step, p_time, p_storm_id, p_lon, p_lat, p_wind_max, p_vort_max, p_psl_min, p_have_twc, p_have_thick, - p_twc_max, p_thick_max, n_rows, storm_tracks)) + p_twc_max, p_thick_max, n_rows, storm_tracks, n_tracks)) { - TECA_ERROR("GFDL TC trajectory analysis encountered an error") + TECA_ERROR("Failed to form tracks") return nullptr; } - t1 = std::chrono::high_resolution_clock::now(); ) ) + t1 = std::chrono::high_resolution_clock::now(); seconds_t dt(t1 - t0); - TECA_STATUS("teca_tc_trajectory n_candidates=" << n_rows << ", n_tracks=" - << storm_tracks->get_number_of_rows() << ", dt=" << dt.count() << " sec") + + TECA_STATUS("Formed " << n_tracks << " tracks comprised of " + << storm_tracks->get_number_of_rows() << " of the " << n_rows + << " avilable candidates in " << dt.count() << " seconds") return storm_tracks; } diff --git a/alg/teca_tc_trajectory.h b/alg/teca_tc_trajectory.h index 2154cc881..26c487e6a 100644 --- a/alg/teca_tc_trajectory.h +++ b/alg/teca_tc_trajectory.h @@ -11,28 +11,25 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_tc_trajectory) /// GFDL tropical storms trajectory tracking algorithm -/** -GFDL tropical storms trajectory tracking algorithm - -for more information see -"Seasonal forecasting of tropical storms using coupled GCM integrations" - -computes trajectories from table of detections. trajectories -are stored in a table. - -the trajectory computation makes use of the following paramteters: - -max_daily_distance (1600 km) - event must be within this distance on the - following day to be considered as part of the trajectory. - -min_wind_speed (17 m/s) - 850 mb wind sped must be above this value. - -min_wind_duration (2 days) - criteria must be satisfied for this many days to be - a candidate -*/ +/** for more information see + * "Seasonal forecasting of tropical storms using coupled GCM integrations" + * + * computes trajectories from table of detections. trajectories + * are stored in a table. + * + * the trajectory computation makes use of the following paramteters: + * + * max_daily_distance (1600 km) + * event must be within this distance on the + * following day to be considered as part of the trajectory. + * + * min_wind_speed (17 m/s) + * 850 mb wind sped must be above this value. 
+ * + * min_wind_duration (2 days) + * criteria must be satisfied for this many days to be + * a candidate + */ class teca_tc_trajectory : public teca_algorithm { public: diff --git a/alg/teca_tc_wind_radii.cxx b/alg/teca_tc_wind_radii.cxx index 20ba6713c..de14e7c00 100644 --- a/alg/teca_tc_wind_radii.cxx +++ b/alg/teca_tc_wind_radii.cxx @@ -596,6 +596,8 @@ void teca_tc_wind_radii::get_properties_description(const std::string &prefix, "the average wind speed over the interval is used.") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -603,6 +605,8 @@ void teca_tc_wind_radii::get_properties_description(const std::string &prefix, void teca_tc_wind_radii::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, storm_id_column) TECA_POPTS_SET(opts, std::string, prefix, storm_x_coordinate_column) TECA_POPTS_SET(opts, std::string, prefix, storm_y_coordinate_column) diff --git a/alg/teca_tc_wind_radii.h b/alg/teca_tc_wind_radii.h index 6b9befc38..d44b0282d 100644 --- a/alg/teca_tc_wind_radii.h +++ b/alg/teca_tc_wind_radii.h @@ -12,15 +12,14 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_tc_wind_radii) /// computes wind radius at the specified coordinates /** -Compute storm size and adds it to the table. There are two inputs, -the first serves up tables of storms to compute the storm radius -for. One must set the names of the columns that contain storm ids, -x-coordnates, y-coordinates, and time coordinate. For each event -the wind radius is computed. Computations are parallelized over -storm id. The second input serves up wind velocity data most likely -this will be from a NetCDF CF2 simulation dataset. By default -radius is computed at the transitions on the Saffir-Simpson -scale. + * Compute storm size and adds it to the table. There are two inputs, the first + * serves up tables of storms to compute the storm radius for. One must set the + * names of the columns that contain storm ids, x-coordnates, y-coordinates, + * and time coordinate. For each event the wind radius is computed. + * Computations are parallelized over storm id. The second input serves up wind + * velocity data most likely this will be from a NetCDF CF2 simulation dataset. + * By default radius is computed at the transitions on the Saffir-Simpson + * scale. 
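The wind radii computation outlined above reduces the wind field around each storm center to a one dimensional radial profile and then looks for where that profile crosses each critical speed. A simplified sketch of the binning and the crossing search; the bin spacing, the handling of the radius of maximum wind, and the lack of interpolation at the crossing are all simplifying assumptions.

#include <algorithm>
#include <cstddef>
#include <vector>

// build a radial wind profile from point samples (distance from the storm
// center in degrees, wind speed in m/s). profile_max selects PROFILE_MAX
// behavior, otherwise the bin average is used (PROFILE_AVERAGE).
std::vector<double> radial_profile(const std::vector<double> &dist,
    const std::vector<double> &wind, double search_radius,
    int n_bins, bool profile_max)
{
    std::vector<double> prof(n_bins, 0.0);
    std::vector<int> count(n_bins, 0);
    double dr = search_radius/n_bins;

    for (size_t i = 0; i < dist.size(); ++i)
    {
        if (dist[i] >= search_radius)
            continue;
        int b = static_cast<int>(dist[i]/dr);
        if (profile_max)
            prof[b] = std::max(prof[b], wind[i]);
        else
            prof[b] += wind[i];
        ++count[b];
    }

    if (!profile_max)
        for (int b = 0; b < n_bins; ++b)
            if (count[b])
                prof[b] /= count[b];

    return prof;
}

// radius (bin center) where the profile first falls below the critical speed
// outward of the radius of maximum wind; -1 if it never does.
double wind_radius(const std::vector<double> &prof, double dr, double crit)
{
    size_t peak = std::max_element(prof.begin(), prof.end()) - prof.begin();
    for (size_t b = peak; b < prof.size(); ++b)
        if (prof[b] < crit)
            return (b + 0.5)*dr;
    return -1.0;
}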
*/ class teca_tc_wind_radii : public teca_algorithm { @@ -35,59 +34,110 @@ class teca_tc_wind_radii : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the name of the column that defines the track ids - // if set the specified column is coppied into the output - // metadata and accessed with the key event_id + /** @name storm_id_column + * set the name of the column that defines the track ids if set the + * specified column is coppied into the output metadata and accessed with + * the key event_id + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, storm_id_column) - - // set the name of the columns that define the event position - // if set the columns are coppied into the output metadata - // and accessed with the keys storm_x_coordinate, storm_y_coordinate + ///@} + + /** @name storm_x_coordinate_column + * set the name of the columns that define the event position if set the + * columns are coppied into the output metadata and accessed with the keys + * storm_x_coordinate, storm_y_coordinate + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, storm_x_coordinate_column) + ///@} + + /** @name storm_y_coordinate_column + * set the name of the columns that define the event position if set the + * columns are coppied into the output metadata and accessed with the keys + * storm_x_coordinate, storm_y_coordinate + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, storm_y_coordinate_column) + ///@} - // set the name of the column containing peak instantanious - // surface wind speed + /** @name storm_wind_speed_column + * set the name of the column containing peak instantanious surface wind + * speed + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, storm_wind_speed_column) - - // set the name of the column that defines the event time - // if set the specified column is coppied into the output - // metadata and accessed with the key event_time + ///@} + + /** @name storm_time_column + * set the name of the column that defines the event time if set the + * specified column is coppied into the output metadata and accessed with + * the key event_time + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, storm_time_column) + ///@} // set the name of the wind variable components + /** @name wind_u_variable + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, wind_u_variable) + ///@} + + /** @name wind_v_variable + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, wind_v_variable) + ///@} - // set the radius in degrees of latitude to sample the wind - // field + /** @name search_radius + * set the radius in degrees of latitude to sample the wind field + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, search_radius) - - // set the radius in degrees of latitude beyond which to - // terminate the search for peak wind speed. if the peak - // lies beyond this distance search is terminated and a - // warning is displayed. + ///@} + + /** @name core_radius + * set the radius in degrees of latitude beyond which to terminate the + * search for peak wind speed. if the peak lies beyond this distance search + * is terminated and a warning is displayed. + */ + ///@{ TECA_ALGORITHM_PROPERTY(double, core_radius) + ///@} - // number of bins to discetize by in the radial direction + /** @name number_of_radial_bins + * number of bins to discetize by in the radial direction + */ + ///@{ TECA_ALGORITHM_PROPERTY(int, number_of_radial_bins) + ///@} - // set the wind speeds (in m/s) to find the radius of. 
the - // defualt values are the transition speeds of the Saffir-Simpson - // scale. + /** @name critical_wind_speed + * set the wind speeds (in m/s) to find the radius of. the defualt values + * are the transition speeds of the Saffir-Simpson scale. + */ + ///@{ TECA_ALGORITHM_VECTOR_PROPERTY(double, critical_wind_speed) - - // set the profile type. PROFILE_MAX uses the maximum - // wind speed on each interval of the discretization, while - // PROFILE_AVERAGE uses the average on each interval + ///@} + + /** @name profile_type + * Set the profile type. PROFILE_MAX uses the maximum wind speed on each + * interval of the discretization, while PROFILE_AVERAGE uses the average + * on each interval + */ + ///@{ + /// Profile types enum {PROFILE_MAX = 0, PROFILE_AVERAGE = 1}; - TECA_ALGORITHM_PROPERTY(int, profile_type); + TECA_ALGORITHM_PROPERTY(int, profile_type) + ///@} - // override the input connections because we are going to - // take the first input and use it to generate metadata. - // the second input then becomes the only one the pipeline - // knows about. + /** override the input connections because we are going to take the first + * input and use it to generate metadata. the second input then becomes + * the only one the pipeline knows about. + */ void set_input_connection(unsigned int id, const teca_algorithm_output_port &port) override; diff --git a/alg/teca_temporal_reduction.py b/alg/teca_temporal_reduction.py index 034d551f2..005f9125f 100644 --- a/alg/teca_temporal_reduction.py +++ b/alg/teca_temporal_reduction.py @@ -1,7 +1,7 @@ import sys import numpy as np - +# @cond class teca_temporal_reduction_internals: class time_point: """ @@ -181,7 +181,7 @@ def __next__(self): sm = self.month t0 = '%04d-%02d-01 00:00:00' % (sy, sm) - i0 = coordinate_util.time_step_of(self.t, True, True, + i0 = coordinate_util.time_step_of(self.t, False, True, self.calendar, self.units, t0) @@ -259,7 +259,7 @@ def __next__(self): month = self.month t0 = '%04d-%02d-01 00:00:00' % (self.year, self.month) - i0 = coordinate_util.time_step_of(self.t, True, True, + i0 = coordinate_util.time_step_of(self.t, False, True, self.calendar, self.units, t0) @@ -350,7 +350,7 @@ def __next__(self): t0 = '%04d-%02d-%02d 00:00:00' % \ (self.year, self.month, self.day) - i0 = coordinate_util.time_step_of(self.t, True, True, + i0 = coordinate_util.time_step_of(self.t, False, True, self.calendar, self.units, t0) @@ -531,6 +531,7 @@ def New(op_name): reduction_operator.maximum() raise RuntimeError('Invalid operator %s' % (op_name)) +# @endcond class teca_temporal_reduction(teca_threaded_python_algorithm): diff --git a/alg/teca_unpack_data.cxx b/alg/teca_unpack_data.cxx new file mode 100644 index 000000000..5972070f0 --- /dev/null +++ b/alg/teca_unpack_data.cxx @@ -0,0 +1,363 @@ +#include "teca_unpack_data.h" + +#include "teca_cartesian_mesh.h" +#include "teca_array_collection.h" +#include "teca_variant_array.h" +#include "teca_metadata.h" +#include "teca_array_attributes.h" + +#include +#include +#include +#include +#include + +#if defined(TECA_HAS_BOOST) +#include +#endif + +//#define TECA_DEBUG + +namespace +{ +template +void transform(output_t * __restrict__ p_out, input_t * __restrict__ p_in, + size_t n, output_t scale, output_t offset) +{ + for (size_t i = 0; i < n; ++i) + p_out[i] = p_in[i] * scale + offset; +} + +template +void transform(output_t * __restrict__ p_out, input_t * __restrict__ p_in, + mask_t * __restrict__ p_mask, size_t n, output_t scale, output_t offset, + output_t fill) +{ + for (size_t i = 0; i < 
n; ++i) + p_out[i] = (p_mask[i] ? p_in[i] * scale + offset : fill); +} +} + + +// -------------------------------------------------------------------------- +teca_unpack_data::teca_unpack_data() : + output_data_type(teca_variant_array_code::get()) +{ + this->set_number_of_input_connections(1); + this->set_number_of_output_ports(1); +} + +// -------------------------------------------------------------------------- +teca_unpack_data::~teca_unpack_data() +{} + +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_unpack_data::get_properties_description( + const std::string &prefix, options_description &global_opts) +{ + options_description opts("Options for " + + (prefix.empty()?"teca_unpack_data":prefix)); + + opts.add_options() + TECA_POPTS_GET(int, prefix, output_data_type, + "Sets the type of the transformed data to either single or double" + " precision floating point. Use 11 for single precision and 12 for" + " double precision.") + TECA_POPTS_GET(int, prefix, verbose, "Enables verbose output") + ; + + + this->teca_algorithm::get_properties_description(prefix, opts); + + global_opts.add(opts); +} + +// -------------------------------------------------------------------------- +void teca_unpack_data::set_properties( + const std::string &prefix, variables_map &opts) +{ + this->teca_algorithm::set_properties(prefix, opts); + + TECA_POPTS_SET(opts, int, prefix, output_data_type) + TECA_POPTS_SET(opts, int, prefix, verbose) +} +#endif + +// -------------------------------------------------------------------------- +int teca_unpack_data::validate_output_data_type(int val) +{ + // validate the output type + if ((val != ((int)teca_variant_array_code::get())) && + (val != ((int)teca_variant_array_code::get()))) + { + TECA_ERROR("Invlaid output data type " << val << ". Use " + << teca_variant_array_code::get() + << " to select double precision output and " + << teca_variant_array_code::get() + << " to select single precision output") + return -1; + } + return 0; +} + +// -------------------------------------------------------------------------- +teca_metadata teca_unpack_data::get_output_metadata( + unsigned int port, + const std::vector &input_md) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() + << "teca_unpack_data::get_output_metadata" << endl; +#endif + (void)port; + + // for each array on the input look for the presence of scale_factor and + // add_offset if both attributes are present then modify the output data + // type. + teca_metadata out_md(input_md[0]); + + std::vector variables; + if (out_md.get("variables", variables)) + { + TECA_ERROR("Failed to get the list of variables") + return teca_metadata(); + } + + teca_metadata attributes; + if (out_md.get("attributes", attributes)) + { + TECA_ERROR("Failed to get the array attributes") + return teca_metadata(); + } + + size_t n_vars = variables.size(); + for (size_t i = 0; i < n_vars; ++i) + { + const std::string &array_name = variables[i]; + + teca_metadata array_atts; + if (attributes.get(array_name, array_atts)) + { + // this could be reported as an error or a warning but unless this + // becomes problematic quietly ignore it + continue; + } + + // if both scale_factor and add_offset attributes are present then + // the data will be transformed. Update the output type. 
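Taken on its own, the element-wise transform implemented by the two ::transform overloads above is the NetCDF packed-data convention, with the fill value substituted wherever the valid value mask is zero. A standalone sketch with concrete types:

#include <cstdint>
#include <vector>

// unpack NetCDF packed data: out = in * scale_factor + add_offset.
// elements flagged invalid by the mask receive the fill value instead.
std::vector<float> unpack(const std::vector<int16_t> &in,
    const std::vector<char> &mask, float scale_factor, float add_offset,
    float fill_value)
{
    std::vector<float> out(in.size());
    for (size_t i = 0; i < in.size(); ++i)
        out[i] = mask[i] ? in[i]*scale_factor + add_offset : fill_value;
    return out;
}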
+ if (array_atts.has("scale_factor") && array_atts.has("add_offset")) + { + array_atts.set("type_code", this->output_data_type); + + array_atts.remove("scale_factor"); + array_atts.remove("add_offset"); + + if (array_atts.has("_FillValue") || array_atts.has("missing_value")) + { + array_atts.remove("_FillValue"); + array_atts.remove("missing_value"); + + if (this->output_data_type == ((int)teca_variant_array_code::get())) + array_atts.set("_FillValue", 1e20); + else if (this->output_data_type == ((int)teca_variant_array_code::get())) + array_atts.set("_FillValue", 1e20f); + } + + attributes.set(array_name, array_atts); + } + } + + out_md.set("attributes", attributes); + return out_md; +} + +// -------------------------------------------------------------------------- +std::vector teca_unpack_data::get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) +{ + (void)port; + + std::vector up_reqs; + + // copy the incoming request to preserve the downstream + // requirements and add the arrays we need + teca_metadata req(request); + + // get the list of variable available. we need to see if + // the valid value mask is available and if so request it + const teca_metadata &md = input_md[0]; + + std::set variables; + if (md.get("variables", variables)) + { + TECA_ERROR("Metadata issue. variables is missing") + return up_reqs; + } + + teca_metadata attributes; + if (md.get("attributes", attributes)) + { + TECA_ERROR("Failed to get the array attributes") + return up_reqs; + } + + // add the dependent variables into the requested arrays + std::set arrays_up; + if (req.has("arrays")) + req.get("arrays", arrays_up); + + std::vector arrays_in(arrays_up.begin(), arrays_up.end()); + int n_arrays = arrays_in.size(); + for (int i = 0; i < n_arrays; ++i) + { + const std::string &array_name = arrays_in[i]; + + teca_metadata array_atts; + if (attributes.get(array_name, array_atts)) + { + // this could be reported as an error or a warning but unless this + // becomes problematic quietly ignore it + continue; + } + + // if both scale_factor and add_offset attributes are present then + // the data will be transformed. Update the output type. + if (array_atts.has("scale_factor") && array_atts.has("add_offset") && + (array_atts.has("_FillValue") || array_atts.has("missing_value"))) + { + // request the valid value mask if they are available. 
+ std::string mask_var = array_name + "_valid"; + if (variables.count(mask_var)) + arrays_up.insert(mask_var); + } + } + + // update the request + req.set("arrays", arrays_up); + + // send it up + up_reqs.push_back(req); + return up_reqs; +} + +// -------------------------------------------------------------------------- +const_p_teca_dataset teca_unpack_data::execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) +{ +#ifdef TECA_DEBUG + std::cerr << teca_parallel_id() << "teca_unpack_data::execute" << endl; +#endif + (void)port; + (void)request; + + // get the input mesh + const_p_teca_mesh in_mesh + = std::dynamic_pointer_cast(input_data[0]); + + if (!in_mesh) + { + TECA_ERROR("Input dataset is not a teca_mesh") + return nullptr; + } + + p_teca_mesh out_mesh = + std::static_pointer_cast(in_mesh->new_instance()); + + out_mesh->shallow_copy(std::const_pointer_cast(in_mesh)); + + teca_metadata attributes; + if (out_mesh->get_attributes(attributes)) + { + TECA_ERROR("Failed to get attributes") + return nullptr; + } + + // for each array + p_teca_array_collection point_arrays = out_mesh->get_point_arrays(); + int n_arrays = point_arrays->size(); + for (int i = 0; i < n_arrays; ++i) + { + const std::string &array_name = point_arrays->get_name(i); + + // skip valid value masks + size_t len = array_name.size(); + if ((len > 6) && (strcmp("_valid", array_name.c_str() + len - 6) == 0)) + continue; + + // check if this array is to be transformed + teca_metadata array_atts; + double scale = 0.0; + double offset = 0.0; + if (attributes.get(array_name, array_atts) || + array_atts.get("scale_factor", scale) || + array_atts.get("add_offset", offset)) + continue; + + // check for valid value mask + std::string mask_name = array_name + "_valid"; + p_teca_variant_array mask = point_arrays->get(mask_name); + + // get the input + p_teca_variant_array in_array = point_arrays->get(i); + + // allocate the output + p_teca_variant_array out_array = + teca_variant_array_factory::New(this->output_data_type); + if (!out_array) + { + TECA_ERROR("Failed to allocate the output array") + return nullptr; + } + + unsigned long n_elem = in_array->size(); + out_array->resize(n_elem); + + // transform arrays + NESTED_TEMPLATE_DISPATCH(teca_variant_array_impl, + in_array.get(), + _IN, + NT_IN *p_in = dynamic_cast(in_array.get())->get(); + NESTED_TEMPLATE_DISPATCH_FP(teca_variant_array_impl, + out_array.get(), + _OUT, + NT_OUT *p_out = dynamic_cast(out_array.get())->get(); + + if (mask) + { + NESTED_TEMPLATE_DISPATCH_I(teca_variant_array_impl, + mask.get(), + _MASK, + NT_MASK *p_mask = dynamic_cast(mask.get())->get(); + ::transform(p_out, p_in, p_mask, + n_elem, NT_OUT(scale), NT_OUT(offset), NT_OUT(1e20)); + ) + + } + else + { + ::transform(p_out, p_in, n_elem, NT_OUT(scale), NT_OUT(offset)); + } + ) + ) + + // poass to the output + point_arrays->set(i, out_array); + + // update the metadata + array_atts.set("type_code", this->output_data_type); + attributes.set(array_name, array_atts); + + if (this->verbose) + { + TECA_STATUS("Unpacked \"" << array_name << "\" scale_factor = " + << scale << " add_offset = " << offset) + } + } + + return out_mesh; +} diff --git a/alg/teca_unpack_data.h b/alg/teca_unpack_data.h new file mode 100644 index 000000000..373535f2a --- /dev/null +++ b/alg/teca_unpack_data.h @@ -0,0 +1,84 @@ +#ifndef teca_unpack_data_h +#define teca_unpack_data_h + +#include "teca_shared_object.h" +#include "teca_algorithm.h" +#include "teca_metadata.h" +#include 
"teca_variant_array.h" + +#include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_unpack_data) + +/// an algorithm that unpacks NetCDF packed values +/** + * Applies a data transform according to the NetCDF attribute conventions for + * packed data values. + * https://www.unidata.ucar.edu/software/netcdf/docs/attribute_conventions.html + * + * Variables in the input dataset are scanned for the presence + * of the `scale_factor` and `add_offset` attributes. When both are present + * an element wise transformation is applied such that + * + * out[i] = scale_factor * in[i] + add_offset + * + * The input array is expected to be an integer type while the type of the output + * array may be either float or double. Valid value masks may be necessary for + * correct results, see `teca_valid_value_mask`. +*/ +class teca_unpack_data : public teca_algorithm +{ +public: + TECA_ALGORITHM_STATIC_NEW(teca_unpack_data) + TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_unpack_data) + TECA_ALGORITHM_CLASS_NAME(teca_unpack_data) + ~teca_unpack_data(); + + // report/initialize to/from Boost program options + // objects. + TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() + TECA_SET_ALGORITHM_PROPERTIES() + + /** @name output_data_type + * set the output data type. use teca_variant_array_code::get() to get + * the numeric code corresponding to the data type T. The default output + * data type is single precision floating point. + */ + ///@{ + TECA_ALGORITHM_PROPERTY_V(int, output_data_type) + + /// set the output data type to double precision floating point + void set_output_data_type_to_float() + { this->set_output_data_type(teca_variant_array_code::get()); } + + /// set the output data type to single precision floating point + void set_output_data_type_to_double() + { this->set_output_data_type(teca_variant_array_code::get()); } + ///@} + +protected: + teca_unpack_data(); + +private: + teca_metadata get_output_metadata( + unsigned int port, + const std::vector &input_md) override; + + std::vector get_upstream_request( + unsigned int port, + const std::vector &input_md, + const teca_metadata &request) override; + + const_p_teca_dataset execute( + unsigned int port, + const std::vector &input_data, + const teca_metadata &request) override; + + int validate_output_data_type(int val); + +private: + int output_data_type; +}; + +#endif diff --git a/alg/teca_valid_value_mask.cxx b/alg/teca_valid_value_mask.cxx index c9240efec..90cbddbfe 100644 --- a/alg/teca_valid_value_mask.cxx +++ b/alg/teca_valid_value_mask.cxx @@ -37,7 +37,7 @@ bool is_mask_array(const std::string &array) // -------------------------------------------------------------------------- teca_valid_value_mask::teca_valid_value_mask() : - mask_arrays(), enable_valid_range(0), verbose(0) + mask_arrays(), enable_valid_range(0) { this->set_number_of_input_connections(1); this->set_number_of_output_ports(1); @@ -62,10 +62,10 @@ void teca_valid_value_mask::get_properties_description( TECA_POPTS_GET(int, prefix, enable_valid_range, "If set non-zero vald_range, valid_min, and valid_max attributes" " would be used if there is no _FillValue attribute.") - TECA_POPTS_GET(int, prefix, verbose, - "If set then status messages are sent to the terminal.") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -73,9 +73,10 @@ void teca_valid_value_mask::get_properties_description( void teca_valid_value_mask::set_properties( const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + 
TECA_POPTS_SET(opts, std::vector, prefix, mask_arrays) TECA_POPTS_SET(opts, int, prefix, enable_valid_range) - TECA_POPTS_SET(opts, int, prefix, verbose) } #endif diff --git a/alg/teca_valid_value_mask.h b/alg/teca_valid_value_mask.h index ebea5f21a..dfa90b9a3 100644 --- a/alg/teca_valid_value_mask.h +++ b/alg/teca_valid_value_mask.h @@ -27,7 +27,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_valid_value_mask) * a variable named "V" it will be named "V_valid". * * Masks are requested for specific arrays in one of two ways. One may use the - * @ref mask_arrays algorithm property to explicitly name the list of variables to + * mask_arrays algorithm property to explicitly name the list of variables to * compute masks for. Alternatively, a heuristic applied to incoming requests * determines if masks should be generated. Specifically the string "_valid" is * looked for at the end of each requested array. If it is found then the mask @@ -48,8 +48,7 @@ class teca_valid_value_mask : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - /** @anchor mask_arrays - * @name mask_arrays + /** @name mask_arrays * explicitly set a list of input arrays to process. By default * all arrays are processed. Use this property to compute masks * for a subset of the arrays, @@ -58,8 +57,7 @@ class teca_valid_value_mask : public teca_algorithm TECA_ALGORITHM_VECTOR_PROPERTY(std::string, mask_array) ///@} - /** @anchor enable_valid_range - * @name enable_valid_range + /** @name enable_valid_range * enable the use of valid_range, valid_min, valid_max attributes. * by default this is off. */ @@ -67,15 +65,6 @@ class teca_valid_value_mask : public teca_algorithm TECA_ALGORITHM_PROPERTY(int, enable_valid_range) ///@} - /** @anchor verbose - * @name verbose - * if set to a non-zero value, rank 0 will send status information to the - * terminal. The default setting of zero results in minimal output. - */ - ///@{ - TECA_ALGORITHM_PROPERTY(int, verbose) - ///@} - protected: teca_valid_value_mask(); @@ -94,7 +83,6 @@ class teca_valid_value_mask : public teca_algorithm private: std::vector mask_arrays; int enable_valid_range; - int verbose; }; #endif diff --git a/alg/teca_variant_array_operand.h b/alg/teca_variant_array_operand.h index b74b030d3..785a61f64 100644 --- a/alg/teca_variant_array_operand.h +++ b/alg/teca_variant_array_operand.h @@ -1,36 +1,43 @@ #ifndef teca_variant_array_operand_h #define teca_variant_array_operand_h +/// @file + #include "teca_variant_array.h" #include "teca_array_collection.h" +/// Codes dealing with the operands of run time specified operations on teca_variant_array namespace teca_variant_array_operand { -// class that handles conversion of literals to varaint_arrays -// and name resolution of variables. +/** @brief + * Handles conversion of literals to variant_arrays and the name resolution of + * variables. + */ class resolver { public: - // given a text representation of a numeric value in s - // convert and return a variant_array filled with the - // numeric value. the type is determined by the last - // 1 or 2 characters in the string, Valid type codes - // are: - // d -- double - // f -- float - // L -- long long - // l -- long - // i -- int - // s -- short - // c -- char - // u -- unsigned, augments any of the integer types - // the return is non-zero if an error occured, zero - // otherwise. + /** given a text representation of a numeric value in s convert and + * return a variant_array filled with the numeric value. 
the type is + * determined by the last 1 or 2 characters in the string, Valid type + * codes are: + * + * d -- double + * f -- float + * L -- long long + * l -- long + * i -- int + * s -- short + * c -- char + * u -- unsigned, augments any of the integer types + * + * the return is non-zero if an error occurred, zero otherwise. + */ int get_constant(const char *s, p_teca_variant_array &c); - // given the name of a variable in var_name, set var to point - // to the array of coresponding name. see set/get_variables. + /** given the name of a variable in var_name, set var to point to the + * array of corresponding name. see set/get_variables. + */ int get_variable(const char *var_name, const_p_teca_variant_array &var) { @@ -39,11 +46,11 @@ class resolver return 0; } - // set/get the set of arrays used for variable name - // resolution. + /// get the set of arrays used for variable name resolution. const_p_teca_array_collection get_variables() { return m_variables; } + /// set the set of arrays used for variable name resolution. void set_variables(const_p_teca_array_collection v) { m_variables = v; } diff --git a/alg/teca_variant_array_operator.h b/alg/teca_variant_array_operator.h index e1c0decaf..f886af2d3 100644 --- a/alg/teca_variant_array_operator.h +++ b/alg/teca_variant_array_operator.h @@ -1,11 +1,15 @@ #ifndef teca_variant_array_operator #define teca_variant_array_operator +/// @file + #include "teca_variant_array.h" #include "teca_type_select.h" +/// Codes dealing with run time specified operations on teca_variant_arrays namespace teca_variant_array_operator { +/// @cond namespace internal { // -------------------------------------------------------------------------- @@ -64,6 +68,7 @@ p_teca_variant_array apply(unsigned long n, return out; } }; +/// @endcond // -------------------------------------------------------------------------- template diff --git a/alg/teca_vertical_coordinate_transform.cxx b/alg/teca_vertical_coordinate_transform.cxx index 6e9b25d72..6fba697a9 100644 --- a/alg/teca_vertical_coordinate_transform.cxx +++ b/alg/teca_vertical_coordinate_transform.cxx @@ -92,9 +92,11 @@ void teca_vertical_coordinate_transform::get_properties_description( opts.add_options() TECA_POPTS_GET(int, prefix, mode, - "transform mode (mode_wrf_v3)") + "Sets the coordinate transform mode. The modes are: mode_wrf_v3") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -102,6 +104,8 @@ void teca_vertical_coordinate_transform::get_properties_description( void teca_vertical_coordinate_transform::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, int, prefix, mode) } #endif diff --git a/alg/teca_vertical_coordinate_transform.h b/alg/teca_vertical_coordinate_transform.h index 1e3b27ba1..da5073bfb 100644 --- a/alg/teca_vertical_coordinate_transform.h +++ b/alg/teca_vertical_coordinate_transform.h @@ -10,10 +10,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_vertical_coordinate_transform) -/// an algorithm that transforms vertical cooridinates -/** -An algorithm that transforms vertical coordinates of a mesh. 
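Returning to the typed-literal convention documented for the resolver a few hunks back (codes d, f, L, l, i, s, c, with a trailing u marking an unsigned integer type), the deduction of the type from a literal string can be sketched as follows. The real get_constant also converts the value and builds a variant array; this sketch only reports the deduced type.

#include <iostream>
#include <string>

// deduce the type of a literal from its trailing code. returns a human
// readable type name, or "" if the code is not recognized.
std::string literal_type(const std::string &s)
{
    if (s.empty())
        return "";

    bool is_unsigned = (s.back() == 'u');
    char code = is_unsigned && (s.size() > 1) ? s[s.size() - 2] : s.back();

    std::string base;
    switch (code)
    {
        case 'd': base = "double"; break;
        case 'f': base = "float"; break;
        case 'L': base = "long long"; break;
        case 'l': base = "long"; break;
        case 'i': base = "int"; break;
        case 's': base = "short"; break;
        case 'c': base = "char"; break;
        default: return "";
    }

    return is_unsigned ? "unsigned " + base : base;
}

int main()
{
    std::cout << literal_type("42i") << "\n";    // int
    std::cout << literal_type("42lu") << "\n";   // unsigned long
    std::cout << literal_type("1e-4f") << "\n";  // float
    return 0;
}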
-*/ +/// An algorithm that transforms the vertical cooridinates of a mesh class teca_vertical_coordinate_transform : public teca_algorithm { public: diff --git a/alg/teca_vertical_reduction.cxx b/alg/teca_vertical_reduction.cxx index be806acdd..f823cfba7 100644 --- a/alg/teca_vertical_reduction.cxx +++ b/alg/teca_vertical_reduction.cxx @@ -35,9 +35,9 @@ void teca_vertical_reduction::get_properties_description( + (prefix.empty()?"teca_vertical_reduction":prefix)); opts.add_options() - TECA_POPTS_GET(std::vector, prefix, dependent_variables, + TECA_POPTS_MULTI_GET(std::vector, prefix, dependent_variables, "list of arrays needed to compute the derived quantity") - TECA_POPTS_GET(std::vector, prefix, derived_variables, + TECA_POPTS_MULTI_GET(std::vector, prefix, derived_variables, "name of the derived quantity") ; diff --git a/alg/teca_vertical_reduction.h b/alg/teca_vertical_reduction.h index a47362408..bbeb72487 100644 --- a/alg/teca_vertical_reduction.h +++ b/alg/teca_vertical_reduction.h @@ -11,11 +11,11 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_vertical_reduction) -/// base class for vertical reducitons +/// The base class for vertical reducitons. /** -implements common operations associated with computing a vertical -reduction where a 3D dataset is transformed into a 2D dataset -by a reduction along the 3rd spatial dimension. + * implements common operations associated with computing a vertical + * reduction where a 3D dataset is transformed into a 2D dataset + * by a reduction along the 3rd spatial dimension. */ class teca_vertical_reduction : public teca_algorithm { @@ -30,16 +30,27 @@ class teca_vertical_reduction : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set/get the list of variables that are needed to produce - // the derived quantity + /** @name dependent_variable + * set/get the list of variables that are needed to produce the derived + * quantity + */ + ///@{ TECA_ALGORITHM_VECTOR_PROPERTY(std::string, dependent_variable) + ///@} - // set/get the name of the variable that is produced + /** @name derived_variable + * set/get the name of the variable that is produced + */ + ///@{ TECA_ALGORITHM_VECTOR_PROPERTY(std::string, derived_variable) + ///@} - // set/get the attributes of the variable that is produced - TECA_ALGORITHM_VECTOR_PROPERTY(teca_array_attributes, - derived_variable_attribute) + /** @name derived_variable_attribute + * Set the attributes of the variable that is produced. 
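The base class above factors out the request and metadata bookkeeping; the reduction itself is conceptually a collapse of the vertical index. A minimal sketch of such a reduction as a plain column sum over an (nz, ny, nx) field; concrete reductions such as the IVT calculation replace the bare sum with a weighted integral over pressure levels.

#include <cstddef>
#include <vector>

// reduce a 3D field (nz, ny, nx) to 2D (ny, nx) by summing along the
// vertical axis.
std::vector<double> column_sum(const std::vector<double> &in,
    size_t nx, size_t ny, size_t nz)
{
    std::vector<double> out(nx*ny, 0.0);
    for (size_t k = 0; k < nz; ++k)
        for (size_t j = 0; j < ny; ++j)
            for (size_t i = 0; i < nx; ++i)
                out[j*nx + i] += in[k*nx*ny + j*nx + i];
    return out;
}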
+ */ + ///@{ + TECA_ALGORITHM_VECTOR_PROPERTY(teca_array_attributes, derived_variable_attribute) + ///@} protected: teca_vertical_reduction(); diff --git a/alg/teca_vorticity.cxx b/alg/teca_vorticity.cxx index 66fcf21d7..b6635686e 100644 --- a/alg/teca_vorticity.cxx +++ b/alg/teca_vorticity.cxx @@ -161,6 +161,8 @@ void teca_vorticity::get_properties_description( "array to store the computed vorticity in") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -168,6 +170,8 @@ void teca_vorticity::get_properties_description( void teca_vorticity::set_properties( const string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, std::string, prefix, component_0_variable) TECA_POPTS_SET(opts, std::string, prefix, component_1_variable) TECA_POPTS_SET(opts, std::string, prefix, vorticity_variable) diff --git a/alg/teca_vorticity.h b/alg/teca_vorticity.h index 7ac3226f6..b42cd0d6c 100644 --- a/alg/teca_vorticity.h +++ b/alg/teca_vorticity.h @@ -10,10 +10,7 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_vorticity) -/// an algorithm that computes vorticity -/** -Compute vorticity from a vector field. -*/ +/// An algorithm that computes vorticity from a vector field. class teca_vorticity : public teca_algorithm { public: @@ -27,14 +24,29 @@ class teca_vorticity : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set the arrays that contain the vector components - // to compute vorticity from + /** @name component_0_variable + * set the arrays that contain the vector components to compute vorticity + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_0_variable) + ///@} + + /** @name component_1_variable + * set the arrays that contain the vector components to compute vorticity + * from. + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, component_1_variable) + ///@} - // set the name of the array to store the result in. - // the default is "vorticity" + /** @name vorticity_variable + * set the name of the array to store the result in. the default is + * "vorticity" + */ + ///@{ TECA_ALGORITHM_PROPERTY(std::string, vorticity_variable) + ///@} protected: teca_vorticity(); diff --git a/apps/CMakeLists.txt b/apps/CMakeLists.txt index 2d8a1be85..67b18de57 100644 --- a/apps/CMakeLists.txt +++ b/apps/CMakeLists.txt @@ -22,6 +22,9 @@ teca_add_app(teca_bayesian_ar_detect LIBS ${teca_app_link} teca_add_app(teca_integrated_vapor_transport LIBS ${teca_app_link} FEATURES ${TECA_HAS_BOOST} ${TECA_HAS_NETCDF} ${TECA_HAS_UDUNITS}) +teca_add_app(teca_integrated_water_vapor LIBS ${teca_app_link} + FEATURES ${TECA_HAS_BOOST} ${TECA_HAS_NETCDF} ${TECA_HAS_UDUNITS}) + teca_add_app(teca_tc_detect LIBS ${teca_app_link} FEATURES ${TECA_HAS_BOOST} ${TECA_HAS_NETCDF} ${TECA_HAS_UDUNITS}) diff --git a/apps/teca_app_util.h b/apps/teca_app_util.h index 9269c9896..5b4f4967e 100644 --- a/apps/teca_app_util.h +++ b/apps/teca_app_util.h @@ -1,25 +1,30 @@ #ifndef teca_app_util_h #define teca_app_util_h +/// @file + #include "teca_config.h" #include #include +/// Codes shared among the command line applications namespace teca_app_util { -// check for flag and if found print the help message -// and the option definitions. return non-zero if the flag -// was found. +/** Check for flag and if found print the help message + * and the option definitions. return non-zero if the flag + * was found. 
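These helpers are exercised in the application hunks later in this patch; the argc/argv overload, whose declaration follows, is called schematically like this inside an application's main (the option descriptions and the MPI manager are assumed to have been set up already):

// returns 1 when one of the help flags was handled, -1 on a parse error,
// 0 when the application should proceed.
int ierr = 0;
variables_map opt_vals;
if ((ierr = teca_app_util::process_command_line_help(
    mpi_man.get_comm_rank(), argc, argv, basic_opt_defs,
    advanced_opt_defs, all_opt_defs, opt_vals)))
{
    if (ierr == 1)
        return 0;   // help was printed, normal exit
    return -1;      // error parsing the command line
}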
+ */ int process_command_line_help(int rank, const std::string &flag, boost::program_options::options_description &opt_defs, boost::program_options::variables_map &opt_vals); -// parses the command line options and checks for --help, --advanced_help, and -// --full_help flags. if any are found prints the associated option -// defintions. if any of the help flags were found 1 is returned. If there is -// an error -1 is returned. Otherwise 0 is returned. +/** parses the command line options and checks for --help, --advanced_help, and + * --full_help flags. if any are found prints the associated option + * defintions. if any of the help flags were found 1 is returned. If there is + * an error -1 is returned. Otherwise 0 is returned. + */ int process_command_line_help(int rank, int argc, char **argv, boost::program_options::options_description &basic_opt_defs, boost::program_options::options_description &advanced_opt_defs, diff --git a/apps/teca_bayesian_ar_detect.cpp b/apps/teca_bayesian_ar_detect.cpp index dedfb99bc..9d11971ce 100644 --- a/apps/teca_bayesian_ar_detect.cpp +++ b/apps/teca_bayesian_ar_detect.cpp @@ -8,15 +8,21 @@ #include "teca_bayesian_ar_detect_parameters.h" #include "teca_binary_segmentation.h" #include "teca_l2_norm.h" +#include "teca_apply_binary_mask.h" #include "teca_multi_cf_reader.h" #include "teca_integrated_vapor_transport.h" #include "teca_valid_value_mask.h" +#include "teca_cartesian_mesh_source.h" +#include "teca_cartesian_mesh_regrid.h" +#include "teca_indexed_dataset_cache.h" +#include "teca_elevation_mask.h" +#include "teca_unpack_data.h" #include "teca_mpi_manager.h" #include "teca_coordinate_util.h" #include "teca_table.h" #include "teca_dataset_source.h" #include "teca_app_util.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" #include #include @@ -82,6 +88,22 @@ int main(int argc, char **argv) ("write_ivt", "\nwhen this flag is present IVT vector is written to disk with" " the result\n") + ("dem", value(), "\nA teca_cf_reader regex identifying the" + " file containing surface elevation field or DEM.\n") + ("dem_variable", value()->default_value("Z"), + "\nSets the name of the variable containing the surface elevation field\n") + ("mesh_height", value()->default_value("Zg"), + "\nSets the name of the variable containing the point wise vertical height" + " in meters above mean sea level\n") + + ("ar_probability", value()->default_value("ar_probability"), + "\nSets the name of the variable to store the computed AR probability mask in.\n") + + ("ar_weighted_variables", value>()->multitoken(), + "\nAn optional list of variables to weight with the computed AR probability." + " Each such variable will be multiplied by the computed AR probability, and" + " written to disk as \"NAME_ar_wgtd\".\n") + ("x_axis_variable", value()->default_value("lon"), "\nname of x coordinate variable\n") ("y_axis_variable", value()->default_value("lat"), @@ -92,16 +114,29 @@ int main(int argc, char **argv) ("periodic_in_x", value()->default_value(1), "\nFlags whether the x dimension (typically longitude) is periodic.\n") - ("binary_ar_threshold", value()->default_value(2.0/3.0,"0.667"), - "\nprobability threshold for segmenting ar_probability to produce ar_binary_tag\n") - - ("output_file", value()->default_value(std::string("CASCADE_BARD_%t%.nc")), + ("segment_ar_probability", "\nA flag that enables a binary segmentation of AR" + " probability to be produced. --segment_threshold controls the segmentation." 
+ " threshold and --segment_variable to set the name of the variable to store" + " the result in.\n") + ("segment_threshold", value()->default_value(2.0/3.0,"0.667"), + "\nSets the threshold value that is used when segmenting ar_probability." + " See also --segment_ar_probability\n") + ("segment_variable", value()->default_value("ar_binary_tag"), + "\nSet the name of the variable to store the result of a binary" + " segmentation of AR probabilty. See also --segment_ar_probability.") + + ("output_file", value()->default_value(std::string("TECA_BARD_%t%.nc")), "\nA path and file name pattern for the output NetCDF files. %t% is replaced with a" " human readable date and time corresponding to the time of the first time step in" " the file. Use --cf_writer::date_format to change the formatting\n") - + ("file_layout", value()->default_value("monthly"), + "\nSelects the size and layout of the set of output files. May be one of" + " number_of_steps, daily, monthly, seasonal, or yearly. Files are structured" + " such that each file contains one of the selected interval. For the number_of_steps" + " option use --steps_per_file.\n") ("steps_per_file", value()->default_value(128), - "\nnumber of time steps per output file\n") + "\nThe number of time steps per output file when --file_layout number_of_steps is" + " specified.\n") ("first_step", value()->default_value(0), "\nfirst time step to process\n") ("last_step", value()->default_value(-1), "\nlast time step to process\n") @@ -142,6 +177,38 @@ int main(int argc, char **argv) p_teca_multi_cf_reader mcf_reader = teca_multi_cf_reader::New(); mcf_reader->get_properties_description("mcf_reader", advanced_opt_defs); + p_teca_valid_value_mask vv_mask = teca_valid_value_mask::New(); + vv_mask->get_properties_description("vv_mask", advanced_opt_defs); + + p_teca_unpack_data unpack = teca_unpack_data::New(); + unpack->get_properties_description("unpack", advanced_opt_defs); + + p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); + norm_coords->get_properties_description("norm_coords", advanced_opt_defs); + + p_teca_cf_reader elev_reader = teca_cf_reader::New(); + elev_reader->get_properties_description("elev_reader", advanced_opt_defs); + elev_reader->set_t_axis_variable(""); + + p_teca_normalize_coordinates elev_coords = teca_normalize_coordinates::New(); + elev_coords->get_properties_description("elev_coords", advanced_opt_defs); + elev_coords->set_enable_periodic_shift_x(1); + + p_teca_indexed_dataset_cache elev_cache = teca_indexed_dataset_cache::New(); + elev_cache->get_properties_description("elev_cache", advanced_opt_defs); + elev_cache->set_max_cache_size(1); + + p_teca_cartesian_mesh_source elev_mesh = teca_cartesian_mesh_source::New(); + elev_mesh->get_properties_description("elev_mesh", advanced_opt_defs); + + p_teca_cartesian_mesh_regrid elev_regrid = teca_cartesian_mesh_regrid::New(); + elev_regrid->get_properties_description("elev_regrid", advanced_opt_defs); + + p_teca_elevation_mask elev_mask = teca_elevation_mask::New(); + elev_mask->get_properties_description("elev_mask", advanced_opt_defs); + elev_mask->set_surface_elevation_variable("Z"); + elev_mask->set_mesh_height_variable("ZG"); + p_teca_l2_norm l2_norm = teca_l2_norm::New(); l2_norm->get_properties_description("ivt_magnitude", advanced_opt_defs); l2_norm->set_component_0_variable("IVT_U"); @@ -156,12 +223,6 @@ int main(int argc, char **argv) ivt_int->set_ivt_u_variable("IVT_U"); ivt_int->set_ivt_v_variable("IVT_V"); - p_teca_valid_value_mask vv_mask = 
teca_valid_value_mask::New(); - vv_mask->get_properties_description("vv_mask", advanced_opt_defs); - - p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); - norm_coords->get_properties_description("norm_coords", advanced_opt_defs); - // parameter source p_teca_bayesian_ar_detect_parameters params = teca_bayesian_ar_detect_parameters::New(); @@ -172,7 +233,7 @@ int main(int argc, char **argv) p_teca_bayesian_ar_detect ar_detect = teca_bayesian_ar_detect::New(); ar_detect->get_properties_description("ar_detect", advanced_opt_defs); ar_detect->set_ivt_variable("IVT"); - + ar_detect->set_ar_probability_variable("ar_probability"); // segment the ar probability field p_teca_binary_segmentation ar_tag = teca_binary_segmentation::New(); @@ -180,6 +241,12 @@ int main(int argc, char **argv) ar_tag->set_threshold_variable("ar_probability"); ar_tag->set_segmentation_variable("ar_binary_tag"); + // mask any requested variables by the AR probability + p_teca_apply_binary_mask ar_mask = teca_apply_binary_mask::New(); + ar_mask->get_properties_description("ar_mask", advanced_opt_defs); + ar_mask->set_mask_variable("ar_probability"); + ar_mask->set_output_variable_prefix("ar_wgtd_"); + // Add an executive for the writer p_teca_index_executive exec = teca_index_executive::New(); @@ -189,16 +256,21 @@ int main(int argc, char **argv) cf_writer->set_verbose(0); cf_writer->set_thread_pool_size(1); cf_writer->set_steps_per_file(128); + cf_writer->set_layout(teca_cf_writer::monthly); // package basic and advanced options for display options_description all_opt_defs(help_width, help_width - 4); all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -207,34 +279,60 @@ int main(int argc, char **argv) // options will override them cf_reader->set_properties("cf_reader", opt_vals); mcf_reader->set_properties("mcf_reader", opt_vals); - l2_norm->set_properties("ivt_magnitude", opt_vals); - ivt_int->set_properties("ivt_integral", opt_vals); vv_mask->set_properties("vv_mask", opt_vals); norm_coords->set_properties("norm_coords", opt_vals); + unpack->set_properties("unpack", opt_vals); + elev_reader->set_properties("elev_reader", opt_vals); + elev_coords->set_properties("elev_coords", opt_vals); + elev_mesh->set_properties("elev_mesh", opt_vals); + elev_cache->set_properties("elev_cache", opt_vals); + elev_regrid->set_properties("elev_regrid", opt_vals); + elev_mask->set_properties("elev_mask", opt_vals); + l2_norm->set_properties("ivt_magnitude", opt_vals); + ivt_int->set_properties("ivt_integral", opt_vals); params->set_properties("parameter_table", opt_vals); ar_detect->set_properties("ar_detect", opt_vals); + ar_mask->set_properties("ar_mask", opt_vals); cf_writer->set_properties("cf_writer", opt_vals); // now pass in the basic options, these are processed // last so that they will take precedence // configure the pipeline from the command line options. 
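Note: the hunk above switches this application over to the return-code convention documented earlier in this diff for teca_app_util::process_command_line_help (1 = a help flag was seen and the help text printed, -1 = a parsing error, 0 = continue with the run). A minimal sketch of the calling pattern, condensed from the code above and using only names already declared in this file:

    // returns 1 when help was printed, -1 on a parse error, 0 otherwise
    int ierr = 0;
    variables_map opt_vals;
    if ((ierr = teca_app_util::process_command_line_help(
        mpi_man.get_comm_rank(), argc, argv, basic_opt_defs,
        advanced_opt_defs, all_opt_defs, opt_vals)))
    {
        // printing help is a normal exit, a parse error is a failure
        return (ierr == 1) ? 0 : -1;
    }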
- p_teca_algorithm head; // configure the reader bool have_file = opt_vals.count("input_file"); bool have_regex = opt_vals.count("input_regex"); + if ((have_file && have_regex) || !(have_file || have_regex)) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. " + "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " + "and --input_regex to activate the cf_reader (CAM like datasets)") + } + return -1; + } + + + p_teca_algorithm reader; if (have_file) { mcf_reader->set_input_file(opt_vals["input_file"].as()); - head = mcf_reader; + reader = mcf_reader; } else if (have_regex) { cf_reader->set_files_regex(opt_vals["input_regex"].as()); - head = cf_reader; + reader = cf_reader; } - p_teca_algorithm reader = head; + + // add transformation stages to the pipeline + norm_coords->set_input_connection(reader->get_output_port()); + vv_mask->set_input_connection(norm_coords->get_output_port()); + unpack->set_input_connection(vv_mask->get_output_port()); + + p_teca_algorithm head = unpack; if (!opt_vals["periodic_in_x"].defaulted()) { @@ -290,10 +388,21 @@ int main(int argc, char **argv) ar_detect->set_ivt_variable(opt_vals["ivt"].as()); } - // add the ivt caluation stages if needed + // add the ivt calculation stages if needed bool do_ivt = opt_vals.count("compute_ivt"); bool do_ivt_magnitude = opt_vals.count("compute_ivt_magnitude"); + if (do_ivt && do_ivt_magnitude) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("Only one of --compute_ivt and compute_ivt_magnitude can " + "be specified. --compute_ivt implies --compute_ivt_magnitude") + } + return -1; + } + + teca_metadata md; if (do_ivt) { std::string z_var = "plev"; @@ -303,8 +412,51 @@ int main(int argc, char **argv) cf_reader->set_z_axis_variable(z_var); mcf_reader->set_z_axis_variable(z_var); - vv_mask->set_input_connection(head->get_output_port()); - ivt_int->set_input_connection(vv_mask->get_output_port()); + // add the elevation mask stages + if (opt_vals.count("dem")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Generating elevation mask") + + elev_reader->set_files_regex(opt_vals["dem"].as()); + + elev_coords->set_input_connection(elev_reader->get_output_port()); + + md = head->update_metadata(); + + elev_mesh->set_spatial_bounds(md, false); + elev_mesh->set_spatial_extents(md, false); + elev_mesh->set_x_axis_variable(md); + elev_mesh->set_y_axis_variable(md); + elev_mesh->set_z_axis_variable(md); + elev_mesh->set_t_axis_variable(md); + elev_mesh->set_t_axis(md); + + elev_regrid->set_input_connection(0, elev_mesh->get_output_port()); + elev_regrid->set_input_connection(1, elev_coords->get_output_port()); + + elev_cache->set_input_connection(elev_regrid->get_output_port()); + + elev_mask->set_input_connection(0, head->get_output_port()); + elev_mask->set_input_connection(1, elev_cache->get_output_port()); + + if (!opt_vals["dem_variable"].defaulted()) + elev_mask->set_surface_elevation_variable( + opt_vals["dem_variable"].as()); + + if (!opt_vals["mesh_height"].defaulted()) + elev_mask->set_mesh_height_variable( + opt_vals["mesh_height"].as()); + + elev_mask->set_mask_variables({ + ivt_int->get_specific_humidity_variable() + "_valid", + ivt_int->get_wind_u_variable() + "_valid", + ivt_int->get_wind_v_variable() + "_valid"}); + + head = elev_mask; + } + + ivt_int->set_input_connection(head->get_output_port()); l2_norm->set_input_connection(ivt_int->get_output_port()); head = l2_norm; @@ -315,8 +467,71 @@ int main(int argc, char **argv) 
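For orientation, the elevation-mask branch assembled in the hunks above reduces to the wiring below. This is a condensed restatement using the stage names declared in this file, assuming a DEM file was supplied via --dem: the DEM is read once, normalized, regridded onto the simulation mesh, cached, and then passed to the elevation mask stage alongside the science data.

    // DEM branch: read, normalize, regrid onto the data mesh, cache
    elev_coords->set_input_connection(elev_reader->get_output_port());
    elev_regrid->set_input_connection(0, elev_mesh->get_output_port());
    elev_regrid->set_input_connection(1, elev_coords->get_output_port());
    elev_cache->set_input_connection(elev_regrid->get_output_port());

    // input 0 carries the science data, input 1 the cached, regridded DEM
    elev_mask->set_input_connection(0, head->get_output_port());
    elev_mask->set_input_connection(1, elev_cache->get_output_port());
    head = elev_mask;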
head = l2_norm; } + // connect the detector and post detector operations + ar_detect->set_input_connection(0, params->get_output_port()); + ar_detect->set_input_connection(1, head->get_output_port()); + + if (!opt_vals["ar_probability"].defaulted()) + ar_detect->set_ar_probability_variable( + opt_vals["ar_probability"].as()); + + head = ar_detect; + + // configure binary segmentation + bool do_segment = opt_vals.count("segment_ar_probability"); + if (do_segment) + { + ar_tag->set_input_connection(0, ar_detect->get_output_port()); + + // set input and output variable names + ar_tag->set_threshold_variable( + ar_detect->get_ar_probability_variable()); + + if (!opt_vals["segment_variable"].defaulted()) + ar_tag->set_segmentation_variable( + opt_vals["segment_variable"].as()); + + // set threshold value + double ar_tag_threshold = opt_vals["segment_threshold"].as(); + ar_tag->set_low_threshold_value(ar_tag_threshold); + + // add I/O metadata + teca_metadata seg_atts; + seg_atts.set("long_name", std::string("binary indicator of atmospheric river")); + seg_atts.set("description", std::string("binary indicator of atmospheric river")); + seg_atts.set("scheme", std::string("TECA_BARD")); + seg_atts.set("version", std::string("1.0")); + seg_atts.set("note", + std::string("derived by thresholding ar_probability >= ") + + std::to_string(ar_tag_threshold)); + + ar_tag->set_segmentation_variable_attributes(seg_atts); + + head = ar_tag; + } + + // configure weight by AR probability + std::vector weighted_vars; + int do_weighted = opt_vals.count("ar_weighted_variables"); + if (opt_vals.count("ar_weighted_variables")) + { + weighted_vars = + opt_vals["ar_weighted_variables"].as>(); + + ar_mask->set_input_connection(0, head->get_output_port()); + ar_mask->set_masked_variables(weighted_vars); + ar_mask->set_mask_variable(ar_detect->get_ar_probability_variable()); + + head = ar_mask; + } + + // connect and configure the writer + cf_writer->set_input_connection(head->get_output_port()); + // tell the writer to write ivt if needed - std::vector point_arrays({"ar_probability", "ar_binary_tag"}); + std::vector point_arrays( + {ar_detect->get_ar_probability_variable()}); + if ((do_ivt || do_ivt_magnitude) && opt_vals.count("write_ivt_magnitude")) { point_arrays.push_back(l2_norm->get_l2_norm_variable()); @@ -328,12 +543,23 @@ point_arrays.push_back(ivt_int->get_ivt_v_variable()); } - cf_writer->set_information_arrays({"ar_count", "parameter_table_row"}); - cf_writer->set_point_arrays(point_arrays); + if (do_segment) + { + point_arrays.push_back(ar_tag->get_segmentation_variable()); + } + + // tell the writer to write ar weighted variables if needed + if (do_weighted) + { + point_arrays.insert(point_arrays.end(), + weighted_vars.begin(), weighted_vars.end()); + ar_mask->get_output_variable_names(point_arrays); + } - if (!opt_vals["output_file"].defaulted()) - cf_writer->set_file_name(opt_vals["output_file"].as()); + cf_writer->set_file_name(opt_vals["output_file"].as()); + cf_writer->set_information_arrays({"ar_count", "parameter_table_row"}); + cf_writer->set_point_arrays(point_arrays); if (!opt_vals["steps_per_file"].defaulted()) cf_writer->set_steps_per_file(opt_vals["steps_per_file"].as()); @@ -344,6 +570,14 @@ if (!opt_vals["last_step"].defaulted()) cf_writer->set_last_step(opt_vals["last_step"].as()); + if (!opt_vals["file_layout"].defaulted() && + cf_writer->set_layout(opt_vals["file_layout"].as())) + { + TECA_ERROR("An invalid file layout was
provided \"" + << opt_vals["file_layout"].as() << "\"") + return -1; + } + if (opt_vals.count("verbose")) { ar_detect->set_verbose(1); @@ -356,29 +590,6 @@ int main(int argc, char **argv) else ar_detect->set_thread_pool_size(-1); - - // some minimal check for missing options - if ((have_file && have_regex) || !(have_file || have_regex)) - { - if (mpi_man.get_comm_rank() == 0) - { - TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. " - "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " - "and --input_regex to activate the cf_reader (CAM like datasets)") - } - return -1; - } - - if (do_ivt && do_ivt_magnitude) - { - if (mpi_man.get_comm_rank() == 0) - { - TECA_ERROR("Only one of --compute_ivt and compute_ivt_magnitude can " - "be specified. --compute_ivt implies --compute_ivt_magnitude") - } - return -1; - } - if (cf_writer->get_file_name().empty()) { if (mpi_man.get_comm_rank() == 0) @@ -389,20 +600,14 @@ int main(int argc, char **argv) return -1; } - // connect the fixed stages of the pipeline - norm_coords->set_input_connection(head->get_output_port()); - ar_detect->set_input_connection(0, params->get_output_port()); - ar_detect->set_input_connection(1, norm_coords->get_output_port()); - ar_tag->set_input_connection(0, ar_detect->get_output_port()); - cf_writer->set_input_connection(ar_tag->get_output_port()); - // look for requested time step range, start bool parse_start_date = opt_vals.count("start_date"); bool parse_end_date = opt_vals.count("end_date"); if (parse_start_date || parse_end_date) { // run the reporting phase of the pipeline - teca_metadata md = reader->update_metadata(); + if (md.empty()) + md = reader->update_metadata(); teca_metadata atrs; if (md.get("attributes", atrs)) @@ -423,10 +628,8 @@ int main(int argc, char **argv) } teca_metadata coords; - p_teca_double_array time; - if (md.get("coordinates", coords) || - !(time = std::dynamic_pointer_cast( - coords.get("t")))) + p_teca_variant_array time; + if (md.get("coordinates", coords) || !(time = coords.get("t"))) { TECA_ERROR("failed to determine time coordinate") return -1; @@ -463,20 +666,6 @@ int main(int argc, char **argv) } } - // set the threshold for calculating ar_binary_tag - double ar_tag_threshold = opt_vals["binary_ar_threshold"].as(); - ar_tag->set_low_threshold_value(ar_tag_threshold); - - // add metadata for ar_binary_tag - teca_metadata seg_atts; - seg_atts.set("long_name", std::string("binary indicator of atmospheric river")); - seg_atts.set("description", std::string("binary indicator of atmospheric river")); - seg_atts.set("scheme", std::string("cascade_bard")); - seg_atts.set("version", std::string("1.0")); - seg_atts.set("note", - std::string("derived by thresholding ar_probability >= ") + - std::to_string(ar_tag_threshold)); - ar_tag->set_segmentation_variable_attributes(seg_atts); // run the pipeline cf_writer->set_executive(exec); diff --git a/apps/teca_cartesian_mesh_diff.cpp b/apps/teca_cartesian_mesh_diff.cpp index 26be1d2e2..d950b814e 100644 --- a/apps/teca_cartesian_mesh_diff.cpp +++ b/apps/teca_cartesian_mesh_diff.cpp @@ -66,9 +66,10 @@ int main(int argc, char **argv) // initialize command line options description // set up some common options to simplify use for most // common scenarios + int help_width = 100; options_description basic_opt_defs( "teca_cartesian_mesh_diff an application that compares two datasets.\n\n" - "Command line options", 120, -1 + "Command line options", help_width, help_width - 4 ); basic_opt_defs.add_options() 
("reference_dataset", value()->required(), @@ -105,7 +106,7 @@ int main(int argc, char **argv) "control over all runtime modifiable parameters. The basic options\n" "(see" "--help) map to these, and will override them if both are\n" "specified.\n\n" - "Advanced command line options", -1, 1 + "Advanced command line options", help_width, help_width - 4 ); // create the pipeline stages here, they contain the @@ -125,7 +126,7 @@ int main(int argc, char **argv) } // package basic and advanced options for display - options_description all_opt_defs(-1, -1); + options_description all_opt_defs(help_width, help_width - 4); all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line @@ -149,7 +150,7 @@ int main(int argc, char **argv) << std::endl << basic_opt_defs << std::endl << std::endl; - return -1; + return 0; } if (opt_vals.count("advanced_help")) @@ -159,7 +160,7 @@ int main(int argc, char **argv) << std::endl << advanced_opt_defs << std::endl << std::endl; - return -1; + return 0; } if (opt_vals.count("full_help")) @@ -169,7 +170,7 @@ int main(int argc, char **argv) << std::endl << all_opt_defs << std::endl << std::endl; - return -1; + return 0; } } diff --git a/apps/teca_cf_restripe.cpp b/apps/teca_cf_restripe.cpp index bbf7584bd..ae2496a9e 100644 --- a/apps/teca_cf_restripe.cpp +++ b/apps/teca_cf_restripe.cpp @@ -4,6 +4,10 @@ #include "teca_variant_array.h" #include "teca_cf_reader.h" #include "teca_multi_cf_reader.h" +#include "teca_normalize_coordinates.h" +#include "teca_cartesian_mesh_regrid.h" +#include "teca_cartesian_mesh_source.h" +#include "teca_rename_variables.h" #include "teca_cf_writer.h" #include "teca_dataset_diff.h" #include "teca_index_executive.h" @@ -13,7 +17,7 @@ #include "teca_mpi_manager.h" #include "teca_mpi.h" #include "teca_app_util.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" #include #include @@ -56,19 +60,37 @@ int main(int argc, char **argv) ("point_arrays", value>()->multitoken(), "\nA list of point centered arrays to write\n") - ("information_arrays", value>()->multitoken(), "\nA list of non-geometric arrays to write\n") - - ("output_file", value()->default_value(std::string("IVT_%t%.nc")), + ("output_file", value(), "\nA path and file name pattern for the output NetCDF files. %t% is replaced with a" " human readable date and time corresponding to the time of the first time step in" " the file. Use --cf_writer::date_format to change the formatting\n") - - ("steps_per_file", value(), "\nnumber of time steps per output file\n") - + ("file_layout", value()->default_value("monthly"), + "\nSelects the size and layout of the set of output files. May be one of" + " number_of_steps, daily, monthly, seasonal, or yearly. Files are structured" + " such that each file contains one of the selected interval. For the number_of_steps" + " option use --steps_per_file.\n") + ("steps_per_file", value(), "\nThe number of time steps per output file when " + " --file_layout number_of_steps is specified.\n") + + ("normalize_coordinates", "\nEnable coordinate normalization pipeline stage\n") + + ("regrid", "\nEnable mesh regridding pipeline stage. When enabled requires --dims" + " to be provided\n") + ("dims", value>()->multitoken(), + "\nA 3-tuple of values specifying the mesh size of the output dataset in the x, y," + " and z dimensions. 
The accepted format for dimensions is: nx ny nz\n") ("bounds", value>()->multitoken(), - "\nlat lon lev bounding box to subset with\n") + "\nA hex-tuple of low and high values specifying lon lat lev bounding box to subset" + " the input dataset with. The accepted format for bounds is: x0 x1 y0 y1 z0 z1\n") + + ("rename", "\nEnable variable renaming stage\n") + ("original_name", value>()->multitoken(), + "\nA list of variables to rename. Use --new_name to set the new names\n") + ("new_name", value>()->multitoken(), + "\nThe new names to use when renaming variables. Use --original_name to set the" + " list of variables to rename\n") ("first_step", value(), "\nfirst time step to process\n") ("last_step", value(), "\nlast time step to process\n") @@ -97,15 +119,29 @@ int main(int argc, char **argv) // documentation and parse command line. // objects report all of their properties directly // set default options here so that command line options override - // them. while we are at it connect the pipeline + // them. p_teca_cf_reader cf_reader = teca_cf_reader::New(); cf_reader->get_properties_description("cf_reader", advanced_opt_defs); p_teca_multi_cf_reader mcf_reader = teca_multi_cf_reader::New(); mcf_reader->get_properties_description("mcf_reader", advanced_opt_defs); + p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); + norm_coords->get_properties_description("norm_coords", advanced_opt_defs); + + p_teca_cartesian_mesh_regrid regrid = teca_cartesian_mesh_regrid::New(); + regrid->set_interpolation_mode_linear(); + regrid->get_properties_description("regrid", advanced_opt_defs); + + p_teca_cartesian_mesh_source regrid_src = teca_cartesian_mesh_source::New(); + regrid_src->get_properties_description("regrid_source", advanced_opt_defs); + + p_teca_rename_variables rename = teca_rename_variables::New(); + rename->get_properties_description("rename", advanced_opt_defs); + p_teca_cf_writer cf_writer = teca_cf_writer::New(); cf_writer->get_properties_description("cf_writer", advanced_opt_defs); + cf_writer->set_layout(teca_cf_writer::monthly); // Add an executive for the writer p_teca_index_executive exec = teca_index_executive::New(); @@ -115,10 +151,14 @@ int main(int argc, char **argv) all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -127,6 +167,10 @@ int main(int argc, char **argv) // options will override them cf_reader->set_properties("cf_reader", opt_vals); mcf_reader->set_properties("mcf_reader", opt_vals); + norm_coords->set_properties("norm_coords", opt_vals); + regrid->set_properties("regrid", opt_vals); + regrid_src->set_properties("regrid_source", opt_vals); + rename->set_properties("rename", opt_vals); cf_writer->set_properties("cf_writer", opt_vals); // now pass in the basic options, these are processed @@ -175,6 +219,14 @@ int main(int argc, char **argv) cf_writer->set_information_arrays( opt_vals["information_arrays"].as>()); + if (!opt_vals["file_layout"].defaulted() && + cf_writer->set_layout(opt_vals["file_layout"].as())) + { + TECA_ERROR("An invalid file layout was provided \"" + << opt_vals["file_layout"].as() << "\"") + return -1; 
+ } + if (opt_vals.count("steps_per_file")) cf_writer->set_steps_per_file( opt_vals["steps_per_file"].as()); @@ -185,9 +237,48 @@ int main(int argc, char **argv) if (opt_vals.count("last_step")) cf_writer->set_last_step(opt_vals["last_step"].as()); - if (opt_vals.count("bounds")) - exec->set_bounds( - opt_vals["bounds"].as>()); + std::vector bounds; + bool have_bounds = opt_vals.count("bounds"); + if (have_bounds) + { + bounds = opt_vals["bounds"].as>(); + if (bounds.size() != 6) + { + TECA_ERROR("An invlaid bounds specification was provided in" + " --bounds, size != 6. Use: --bounds x0 x1 y0 y1 z0 z1") + return -1; + } + } + + bool do_regrid = opt_vals.count("regrid"); + + // when not regriding let the executive subset. when regriding + // the regrid algorithm handles subsetting and the executive should + // request the entire domain. + if (have_bounds && !do_regrid) + exec->set_bounds(bounds); + + // when regriding target mesh dimensions must be provided + std::vector dims; + if (do_regrid) + { + if (opt_vals.count("dims")) + { + dims = opt_vals["dims"].as>(); + if (dims.size() != 3) + { + TECA_ERROR("An invlaid dimension specification was provided in" + " --dims, size != 3. Use: --dims nx ny nz") + return -1; + } + } + else + { + TECA_ERROR("The --regrid option requires that --dims" + " also be specified") + return -1; + } + } if (opt_vals.count("verbose")) { @@ -222,10 +313,24 @@ int main(int argc, char **argv) return -1; } + // add the normalize coordinates stage before accessing metadata + p_teca_algorithm head = reader; + if (opt_vals.count("normalize_coordinates")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Added cooridnate normalization stage"); + + norm_coords->set_input_connection(reader->get_output_port()); + head = norm_coords; + } + // if no point arrays were specified on the command line by default // write all point arrays teca_metadata md; teca_metadata atts; + teca_metadata time_atts; + std::string calendar; + std::string units; // TODO -- this will need some more work in the reader as currently // all arrays are marked as being point centered, but here we need // to identify only the arrays on the mesh. 
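As a quick reference for the new teca_cf_restripe options handled in the hunks above: --bounds expects the hex-tuple x0 x1 y0 y1 z0 z1, --dims expects the triple nx ny nz and is required whenever --regrid is given, and when regridding is enabled the subsetting is performed by the regrid stage rather than by the executive. A minimal sketch of that validation, condensed from the code above (the std::vector element types are written out here as an assumption, since the template arguments are elided in this diff):

    std::vector<double> bounds;
    bool have_bounds = opt_vals.count("bounds");
    if (have_bounds)
    {
        bounds = opt_vals["bounds"].as<std::vector<double>>();
        if (bounds.size() != 6)
            return -1;  // expected: --bounds x0 x1 y0 y1 z0 z1
    }

    bool do_regrid = opt_vals.count("regrid");

    // only the executive subsets when no regridding is requested
    if (have_bounds && !do_regrid)
        exec->set_bounds(bounds);

    std::vector<unsigned long> dims;
    if (do_regrid)
    {
        if (!opt_vals.count("dims"))
            return -1;  // --regrid requires --dims

        dims = opt_vals["dims"].as<std::vector<unsigned long>>();
        if (dims.size() != 3)
            return -1;  // expected: --dims nx ny nz
    }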
@@ -233,7 +338,7 @@ int main(int argc, char **argv) { // run the reporting phase of the pipeline if (md.empty()) - md = cf_reader->update_metadata(); + md = head->update_metadata(); // if array attributes are present, use them to locate the set of // point centered arrrays @@ -271,32 +376,30 @@ int main(int argc, char **argv) { // run the reporting phase of the pipeline if (md.empty()) - md = cf_reader->update_metadata(); + md = head->update_metadata(); if (atts.empty() && md.get("attributes", atts)) { - TECA_ERROR("metadata missing attributes") + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("metadata missing attributes") return -1; } - teca_metadata time_atts; - std::string calendar; - std::string units; if (atts.get("time", time_atts) || time_atts.get("calendar", calendar) || time_atts.get("units", units)) { - TECA_ERROR("failed to determine the calendaring parameters") + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("failed to determine the calendaring parameters") return -1; } teca_metadata coords; - p_teca_double_array time; - if (md.get("coordinates", coords) || - !(time = std::dynamic_pointer_cast( - coords.get("t")))) + p_teca_variant_array time; + if (md.get("coordinates", coords) || !(time = coords.get("t"))) { - TECA_ERROR("failed to determine time coordinate") + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("failed to determine time coordinate") return -1; } @@ -308,8 +411,9 @@ int main(int argc, char **argv) if (teca_coordinate_util::time_step_of(time, true, true, calendar, units, start_date, first_step)) { - TECA_ERROR("Failed to locate time step for start date \"" - << start_date << "\"") + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("Failed to locate time step for start date \"" + << start_date << "\"") return -1; } cf_writer->set_first_step(first_step); @@ -323,16 +427,114 @@ int main(int argc, char **argv) if (teca_coordinate_util::time_step_of(time, false, true, calendar, units, end_date, last_step)) { - TECA_ERROR("Failed to locate time step for end date \"" - << end_date << "\"") + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("Failed to locate time step for end date \"" + << end_date << "\"") return -1; } cf_writer->set_last_step(last_step); } } - // connect the pipeline - cf_writer->set_input_connection(reader->get_output_port()); + // set up regriding + if (do_regrid) + { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Added regrid stage"); + + // run the reporting phase of the pipeline, the resulting metadata + // can be used to automatically determine the calendaring parameters + // and spatial bounds + if (md.empty()) + md = head->update_metadata(); + + // use the calendar and time axis of the input dataset + if (regrid_src->set_t_axis_variable(md) || regrid_src->set_t_axis(md)) + { + if (mpi_man.get_comm_rank() == 0) + TECA_WARNING("Failed to determine the time axis, assuming a" + " single time step") + + p_teca_double_array t = teca_double_array::New(1); + regrid_src->set_t_axis_variable(""); + regrid_src->set_t_axis(t); + } + + // to construct the target mesh we need bounds. if no bounds are + // specified on the command line use those of the input dataset and + // error out if that fails + if (have_bounds) + { + // extend to include time + bounds.resize(8, 0.0); + regrid_src->set_bounds(bounds); + } + else + { + // try to determine the bounds from the input mesh metadata + if (regrid_src->set_spatial_bounds(md)) + { + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("Failed to determine target mesh bounds from the" + " input metadata. 
Use --bounds to specify them manually.") + return -1; + } + } + + // set the target mesh dimensions + regrid_src->set_whole_extents({0lu, dims[0] - 1lu, + 0lu, dims[1] - 1lu, 0lu, dims[2] - 1lu, 0lu, 0lu}); + + // connect to the pipeline + regrid->set_input_connection(0, regrid_src->get_output_port()); + regrid->set_input_connection(1, head->get_output_port()); + head = regrid; + } + + // add rename stage + if (opt_vals.count("rename")) + { + if (!opt_vals.count("original_name")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("--original_name is required when renaming variables") + return -1; + } + + std::vector original_name = + opt_vals["original_name"].as>(); + + if (!opt_vals.count("new_name")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("--new_name is required when renaming variables") + return -1; + } + + std::vector new_name = + opt_vals["new_name"].as>(); + + if (original_name.size() != new_name.size()) + { + if (mpi_man.get_comm_rank() == 0) + TECA_ERROR("--original_name and --new_name must have the same" + " number of values") + return -1; + + } + + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Added rename stage"); + + rename->set_input_connection(head->get_output_port()); + rename->set_original_variable_names(original_name); + rename->set_new_variable_names(new_name); + + head = rename; + } + + // add the writer last + cf_writer->set_input_connection(head->get_output_port()); // run the pipeline cf_writer->set_executive(exec); diff --git a/apps/teca_deeplab_ar_detect.in b/apps/teca_deeplab_ar_detect.in index 6d07f5c3d..e124de1e6 100755 --- a/apps/teca_deeplab_ar_detect.in +++ b/apps/teca_deeplab_ar_detect.in @@ -87,6 +87,14 @@ parser.add_argument('--output_file', type=str, required=True, ' time of the first time step in the file. Use --date_format to change' ' the formatting') +parser.add_argument('--file_layout', type=str, default='monthly', + help='Selects the size and layout of the set of output' + ' files. May be one of number_of_steps, daily,' + ' monthly, seasonal, or yearly. Files are structured' + ' such that each file contains one of the selected' + ' interval. 
For the number_of_steps option use' + ' --steps_per_file.') + parser.add_argument('--steps_per_file', type=int, required=False, default=128, help='number of time steps per output file') @@ -112,7 +120,7 @@ parser.add_argument('--pytorch_model', type=str, required=False, parser.add_argument('--t_axis_variable', type=str, required=False, help='time dimension name') -parser.add_argument('--t_calendar', type=str, required=False, +parser.add_argument('--calendar', type=str, required=False, help='time calendar') parser.add_argument('--t_units', type=str, required=False, @@ -165,8 +173,8 @@ reader.set_y_axis_variable(args.y_axis_variable) if args.t_axis_variable is not None: reader.set_t_axis_variable(args.t_axis_variable) -if args.t_calendar: - reader.set_t_calendar(args.t_calendar) +if args.calendar: + reader.set_calendar(args.calendar) if args.t_units: reader.set_t_units(args.t_units) @@ -241,6 +249,7 @@ writer.set_input_connection(ar_tag.get_output_port()) writer.set_executive(exe) writer.set_thread_pool_size(1) writer.set_file_name(args.output_file) +writer.set_layout(args.file_layout) writer.set_steps_per_file(args.steps_per_file) writer.set_first_step(args.first_step) writer.set_last_step(args.last_step) diff --git a/apps/teca_integrated_vapor_transport.cpp b/apps/teca_integrated_vapor_transport.cpp index d078f6b31..b8b0d89eb 100644 --- a/apps/teca_integrated_vapor_transport.cpp +++ b/apps/teca_integrated_vapor_transport.cpp @@ -10,18 +10,25 @@ #include "teca_multi_cf_reader.h" #include "teca_integrated_vapor_transport.h" #include "teca_valid_value_mask.h" +#include "teca_unpack_data.h" +#include "teca_cartesian_mesh_source.h" +#include "teca_cartesian_mesh_regrid.h" +#include "teca_elevation_mask.h" +#include "teca_indexed_dataset_cache.h" #include "teca_mpi_manager.h" #include "teca_coordinate_util.h" #include "teca_table.h" #include "teca_dataset_source.h" #include "teca_app_util.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" #include #include #include #include +#include "teca_cartesian_mesh_writer.h" + using namespace std; using boost::program_options::value; @@ -57,13 +64,11 @@ int main(int argc, char **argv) ("wind_u", value()->default_value("U"), "\nname of variable with the 3D longitudinal component of the wind vector.\n") - ("wind_v", value()->default_value("V"), "\nname of variable with the 3D latitudinal component of the wind vector.\n") ("ivt_u", value()->default_value("IVT_U"), "\nname to use for the longitudinal component of the integrated vapor transport vector.\n") - ("ivt_v", value()->default_value("IVT_V"), "\nname to use for the latitudinal component of the integrated vapor transport vector.\n") @@ -84,9 +89,14 @@ int main(int argc, char **argv) "\nA path and file name pattern for the output NetCDF files. %t% is replaced with a" " human readable date and time corresponding to the time of the first time step in" " the file. Use --cf_writer::date_format to change the formatting\n") - + ("file_layout", value()->default_value("monthly"), + "\nSelects the size and layout of the set of output files. May be one of" + " number_of_steps, daily, monthly, seasonal, or yearly. Files are structured" + " such that each file contains one of the selected interval. 
For the number_of_steps" + " option use --steps_per_file.\n") ("steps_per_file", value()->default_value(128), - "\nnumber of time steps per output file\n") + "\nThe number of time steps per output file when --file_layout number_of_steps is" + " specified.\n") ("x_axis_variable", value()->default_value("lon"), "\nname of x coordinate variable\n") @@ -95,6 +105,16 @@ int main(int argc, char **argv) ("z_axis_variable", value()->default_value("plev"), "\nname of z coordinate variable\n") + ("dem", value(), "\nA teca_cf_reader regex identifying the" + " file containing surface elevation field or DEM.\n") + + ("dem_variable", value()->default_value("Z"), + "\nSets the name of the variable containing the surface elevation field\n") + + ("mesh_height", value()->default_value("Zg"), + "\nSets the name of the variable containing the point wise vertical height" + " in meters above mean sea level\n") + ("first_step", value()->default_value(0), "\nfirst time step to process\n") ("last_step", value()->default_value(-1), "\nlast time step to process\n") @@ -102,9 +122,9 @@ int main(int argc, char **argv) " format. Note: There must be a space between the date and time specification\n") ("end_date", value(), "\nThe last time to process in 'Y-M-D h:m:s' format\n") - ("n_threads", value(), "\nSets the thread pool size on each MPI rank. When the default" - " value of -1 is used TECA will coordinate the thread pools across ranks such each" - " thread is bound to a unique physical core.\n") + ("n_threads", value()->default_value(-1), "\nSets the thread pool size on each MPI" + " rank. When the default value of -1 is used TECA will coordinate the thread pools" + " across ranks such each thread is bound to a unique physical core.\n") ("verbose", "\nenable extra terminal output\n") @@ -140,6 +160,38 @@ int main(int argc, char **argv) p_teca_multi_cf_reader mcf_reader = teca_multi_cf_reader::New(); mcf_reader->get_properties_description("mcf_reader", advanced_opt_defs); + p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); + norm_coords->get_properties_description("norm_coords", advanced_opt_defs); + + p_teca_valid_value_mask vv_mask = teca_valid_value_mask::New(); + vv_mask->get_properties_description("vv_mask", advanced_opt_defs); + + p_teca_unpack_data unpack = teca_unpack_data::New(); + unpack->get_properties_description("unpack", advanced_opt_defs); + + p_teca_cf_reader elev_reader = teca_cf_reader::New(); + elev_reader->get_properties_description("elev_reader", advanced_opt_defs); + elev_reader->set_t_axis_variable(""); + + p_teca_normalize_coordinates elev_coords = teca_normalize_coordinates::New(); + elev_coords->get_properties_description("elev_coords", advanced_opt_defs); + elev_coords->set_enable_periodic_shift_x(1); + + p_teca_indexed_dataset_cache elev_cache = teca_indexed_dataset_cache::New(); + elev_cache->get_properties_description("elev_cache", advanced_opt_defs); + elev_cache->set_max_cache_size(1); + + p_teca_cartesian_mesh_source elev_mesh = teca_cartesian_mesh_source::New(); + elev_mesh->get_properties_description("elev_mesh", advanced_opt_defs); + + p_teca_cartesian_mesh_regrid elev_regrid = teca_cartesian_mesh_regrid::New(); + elev_regrid->get_properties_description("elev_regrid", advanced_opt_defs); + + p_teca_elevation_mask elev_mask = teca_elevation_mask::New(); + elev_mask->get_properties_description("elev_mask", advanced_opt_defs); + elev_mask->set_surface_elevation_variable("Z"); + elev_mask->set_mesh_height_variable("ZG"); + p_teca_integrated_vapor_transport 
ivt_int = teca_integrated_vapor_transport::New(); ivt_int->get_properties_description("ivt_integral", advanced_opt_defs); ivt_int->set_specific_humidity_variable("Q"); @@ -154,9 +206,6 @@ int main(int argc, char **argv) l2_norm->set_component_1_variable("IVT_V"); l2_norm->set_l2_norm_variable("IVT"); - p_teca_valid_value_mask vv_mask = teca_valid_value_mask::New(); - vv_mask->get_properties_description("vv_mask", advanced_opt_defs); - // Add an executive for the writer p_teca_index_executive exec = teca_index_executive::New(); @@ -165,16 +214,21 @@ int main(int argc, char **argv) cf_writer->get_properties_description("cf_writer", advanced_opt_defs); cf_writer->set_verbose(0); cf_writer->set_steps_per_file(128); + cf_writer->set_layout(teca_cf_writer::monthly); // package basic and advanced options for display - options_description all_opt_defs(-1, -1); + options_description all_opt_defs(help_width, help_width - 4); all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -183,7 +237,15 @@ int main(int argc, char **argv) // options will override them cf_reader->set_properties("cf_reader", opt_vals); mcf_reader->set_properties("mcf_reader", opt_vals); + norm_coords->set_properties("norm_coords", opt_vals); vv_mask->set_properties("vv_mask", opt_vals); + unpack->set_properties("unpack", opt_vals); + elev_reader->set_properties("elev_reader", opt_vals); + elev_coords->set_properties("elev_coords", opt_vals); + elev_mesh->set_properties("elev_mesh", opt_vals); + elev_cache->set_properties("elev_cache", opt_vals); + elev_regrid->set_properties("elev_regrid", opt_vals); + elev_mask->set_properties("elev_mask", opt_vals); ivt_int->set_properties("ivt_integral", opt_vals); l2_norm->set_properties("ivt_magnitude", opt_vals); cf_writer->set_properties("cf_writer", opt_vals); @@ -191,23 +253,33 @@ int main(int argc, char **argv) // now pass in the basic options, these are processed // last so that they will take precedence // configure the pipeline from the command line options. - p_teca_algorithm head; + p_teca_algorithm reader; // configure the reader bool have_file = opt_vals.count("input_file"); bool have_regex = opt_vals.count("input_regex"); + if ((have_file && have_regex) || !(have_file || have_regex)) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. 
" + "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " + "and --input_regex to activate the cf_reader (CAM like datasets)") + } + return -1; + } if (opt_vals.count("input_file")) { mcf_reader->set_input_file(opt_vals["input_file"].as()); - head = mcf_reader; + reader = mcf_reader; } else if (opt_vals.count("input_regex")) { cf_reader->set_files_regex(opt_vals["input_regex"].as()); - head = cf_reader; + reader = cf_reader; } - p_teca_algorithm reader = head; + p_teca_algorithm head = reader; if (!opt_vals["x_axis_variable"].defaulted()) { @@ -221,6 +293,13 @@ int main(int argc, char **argv) mcf_reader->set_y_axis_variable(opt_vals["y_axis_variable"].as()); } + std::string z_var = "plev"; + if (!opt_vals["z_axis_variable"].defaulted()) + z_var = opt_vals["z_axis_variable"].as(); + + cf_reader->set_z_axis_variable(z_var); + mcf_reader->set_z_axis_variable(z_var); + // set the inputs to the integrator if (!opt_vals["wind_u"].defaulted()) { @@ -257,24 +336,88 @@ int main(int argc, char **argv) } // add the valid value mask stage - vv_mask->set_input_connection(head->get_output_port()); - head = vv_mask; + norm_coords->set_input_connection(head->get_output_port()); + vv_mask->set_input_connection(norm_coords->get_output_port()); + unpack->set_input_connection(vv_mask->get_output_port()); + head = unpack; // add the ivt caluation stages if needed bool do_ivt = opt_vals["write_ivt"].as(); bool do_ivt_magnitude = opt_vals["write_ivt_magnitude"].as(); + if (!(do_ivt || do_ivt_magnitude)) - std::string z_var = "plev"; - if (!opt_vals["z_axis_variable"].defaulted()) - z_var = opt_vals["z_axis_variable"].as(); + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("At least one of --write_ivt or --write_ivt_magnitude " + " must be set.") + } + return -1; + } - cf_reader->set_z_axis_variable(z_var); - mcf_reader->set_z_axis_variable(z_var); + // add the elevation mask stages + teca_metadata md; + if (opt_vals.count("dem")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Generating elevation mask") + + elev_reader->set_files_regex(opt_vals["dem"].as()); + + elev_coords->set_input_connection(elev_reader->get_output_port()); + + md = head->update_metadata(); + + elev_mesh->set_spatial_bounds(md, false); + elev_mesh->set_spatial_extents(md, false); + elev_mesh->set_x_axis_variable(md); + elev_mesh->set_y_axis_variable(md); + elev_mesh->set_z_axis_variable(md); + elev_mesh->set_t_axis_variable(md); + elev_mesh->set_t_axis(md); + + elev_regrid->set_input_connection(0, elev_mesh->get_output_port()); + elev_regrid->set_input_connection(1, elev_coords->get_output_port()); + + elev_cache->set_input_connection(elev_regrid->get_output_port()); + + /*p_teca_cartesian_mesh_writer rdw = teca_cartesian_mesh_writer::New(); + rdw->set_input_connection(elev_cache->get_output_port()); + rdw->set_file_name("regrid_dem_%t%.vtk");*/ + + elev_mask->set_input_connection(0, head->get_output_port()); + elev_mask->set_input_connection(1, elev_cache->get_output_port()); + //elev_mask->set_input_connection(1, rdw->get_output_port()); + + if (!opt_vals["dem_variable"].defaulted()) + elev_mask->set_surface_elevation_variable( + opt_vals["dem_variable"].as()); + + if (!opt_vals["mesh_height"].defaulted()) + elev_mask->set_mesh_height_variable( + opt_vals["mesh_height"].as()); + + elev_mask->set_mask_variables({ + ivt_int->get_specific_humidity_variable() + "_valid", + ivt_int->get_wind_u_variable() + "_valid", + ivt_int->get_wind_v_variable() + "_valid"}); + + /*p_teca_cartesian_mesh_writer emw = 
teca_cartesian_mesh_writer::New(); + emw->set_input_connection(elev_mask->get_output_port()); + emw->set_file_name("elev_mask_%t%.vtk"); + emw->set_binary(1); + head = emw;*/ + + head = elev_mask; + } ivt_int->set_input_connection(head->get_output_port()); if (do_ivt_magnitude) { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Computing IVT magnitude") + l2_norm->set_input_connection(ivt_int->get_output_port()); head = l2_norm; } @@ -303,39 +446,23 @@ int main(int argc, char **argv) if (!opt_vals["last_step"].defaulted()) cf_writer->set_last_step(opt_vals["last_step"].as()); + if (!opt_vals["file_layout"].defaulted() && + cf_writer->set_layout(opt_vals["file_layout"].as())) + { + TECA_ERROR("An invalid file layout was provided \"" + << opt_vals["file_layout"].as() << "\"") + return -1; + } + if (opt_vals.count("verbose")) { cf_writer->set_verbose(1); exec->set_verbose(1); } - if (!opt_vals["n_threads"].defaulted()) - cf_writer->set_thread_pool_size(opt_vals["n_threads"].as()); - else - cf_writer->set_thread_pool_size(-1); + cf_writer->set_thread_pool_size(opt_vals["n_threads"].as()); // some minimal check for missing options - if ((have_file && have_regex) || !(have_file || have_regex)) - { - if (mpi_man.get_comm_rank() == 0) - { - TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. " - "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " - "and --input_regex to activate the cf_reader (CAM like datasets)") - } - return -1; - } - - if (!(do_ivt || do_ivt_magnitude)) - { - if (mpi_man.get_comm_rank() == 0) - { - TECA_ERROR("AT least one of --write_ivt or --write_ivt_magnitude " - " must be set.") - } - return -1; - } - if (cf_writer->get_file_name().empty()) { if (mpi_man.get_comm_rank() == 0) @@ -355,7 +482,8 @@ int main(int argc, char **argv) if (parse_start_date || parse_end_date) { // run the reporting phase of the pipeline - teca_metadata md = reader->update_metadata(); + if (md.empty()) + md = reader->update_metadata(); teca_metadata atrs; if (md.get("attributes", atrs)) @@ -376,10 +504,8 @@ int main(int argc, char **argv) } teca_metadata coords; - p_teca_double_array time; - if (md.get("coordinates", coords) || - !(time = std::dynamic_pointer_cast( - coords.get("t")))) + p_teca_variant_array time; + if (md.get("coordinates", coords) || !(time = coords.get("t"))) { TECA_ERROR("failed to determine time coordinate") return -1; diff --git a/apps/teca_integrated_water_vapor.cpp b/apps/teca_integrated_water_vapor.cpp new file mode 100644 index 000000000..405a83aa2 --- /dev/null +++ b/apps/teca_integrated_water_vapor.cpp @@ -0,0 +1,454 @@ +#include "teca_config.h" +#include "teca_cf_reader.h" +#include "teca_cf_writer.h" +#include "teca_index_executive.h" +#include "teca_normalize_coordinates.h" +#include "teca_metadata.h" +#include "teca_integrated_water_vapor.h" +#include "teca_binary_segmentation.h" +#include "teca_l2_norm.h" +#include "teca_multi_cf_reader.h" +#include "teca_integrated_water_vapor.h" +#include "teca_valid_value_mask.h" +#include "teca_unpack_data.h" +#include "teca_cartesian_mesh_source.h" +#include "teca_cartesian_mesh_regrid.h" +#include "teca_elevation_mask.h" +#include "teca_indexed_dataset_cache.h" +#include "teca_mpi_manager.h" +#include "teca_coordinate_util.h" +#include "teca_table.h" +#include "teca_dataset_source.h" +#include "teca_app_util.h" +#include "teca_calcalcs.h" + +#include +#include +#include +#include + +#include "teca_cartesian_mesh_writer.h" + +using namespace std; + +using 
boost::program_options::value; + +// -------------------------------------------------------------------------- +int main(int argc, char **argv) +{ + // initialize mpi + teca_mpi_manager mpi_man(argc, argv); + + // initialize command line options description + // set up some common options to simplify use for most + // common scenarios + int help_width = 100; + options_description basic_opt_defs( + "Basic usage:\n\n" + "The following options are the most commonly used. Information\n" + "on advanced options can be displayed using --advanced_help\n\n" + "Basic command line options", help_width, help_width - 4 + ); + basic_opt_defs.add_options() + ("input_file", value(), "\na teca_multi_cf_reader configuration file" + " identifying the set of NetCDF CF2 files to process. When present data is" + " read using the teca_multi_cf_reader. Use one of either --input_file or" + " --input_regex.\n") + + ("input_regex", value(), "\na teca_cf_reader regex identifying the" + " set of NetCDF CF2 files to process. When present data is read using the" + " teca_cf_reader. Use one of either --input_file or --input_regex.\n") + + ("specific_humidity", value()->default_value("Q"), + "\nname of variable with the 3D specific humidity field.\n") + + ("iwv", value()->default_value("IWV"), + "\nname to use for the longitudinal component of the integrated vapor transport vector.\n") + + ("output_file", value()->default_value("IWV_%t%.nc"), + "\nA path and file name pattern for the output NetCDF files. %t% is replaced with a" + " human readable date and time corresponding to the time of the first time step in" + " the file. Use --cf_writer::date_format to change the formatting\n") + ("file_layout", value()->default_value("monthly"), + "\nSelects the size and layout of the set of output files. May be one of" + " number_of_steps, daily, monthly, seasonal, or yearly. Files are structured" + " such that each file contains one of the selected interval. For the number_of_steps" + " option use --steps_per_file.\n") + ("steps_per_file", value()->default_value(128), + "\nThe number of time steps per output file when --file_layout number_of_steps is" + " specified.\n") + + ("x_axis_variable", value()->default_value("lon"), + "\nname of x coordinate variable\n") + ("y_axis_variable", value()->default_value("lat"), + "\nname of y coordinate variable\n") + ("z_axis_variable", value()->default_value("plev"), + "\nname of z coordinate variable\n") + + ("dem", value(), "\nA teca_cf_reader regex identifying the" + " file containing surface elevation field or DEM.\n") + + ("dem_variable", value()->default_value("Z"), + "\nSets the name of the variable containing the surface elevation field\n") + + ("mesh_height", value()->default_value("Zg"), + "\nSets the name of the variable containing the point wise vertical height" + " in meters above mean sea level\n") + + ("first_step", value()->default_value(0), "\nfirst time step to process\n") + ("last_step", value()->default_value(-1), "\nlast time step to process\n") + + ("start_date", value(), "\nThe first time to process in 'Y-M-D h:m:s'" + " format. Note: There must be a space between the date and time specification\n") + ("end_date", value(), "\nThe last time to process in 'Y-M-D h:m:s' format\n") + + ("n_threads", value()->default_value(-1), "\nSets the thread pool size on each MPI" + " rank. 
When the default value of -1 is used TECA will coordinate the thread pools" + " across ranks such each thread is bound to a unique physical core.\n") + + ("verbose", "\nenable extra terminal output\n") + + ("help", "\ndisplays documentation for application specific command line options\n") + ("advanced_help", "\ndisplays documentation for algorithm specific command line options\n") + ("full_help", "\ndisplays both basic and advanced documentation together\n") + ; + + // add all options from each pipeline stage for more advanced use + options_description advanced_opt_defs( + "Advanced usage:\n\n" + "The following list contains the full set options giving one full\n" + "control over all runtime modifiable parameters. The basic options\n" + "(see" "--help) map to these, and will override them if both are\n" + "specified.\n\n" + "integrated vapor transport pipeline:\n\n" + " (cf / mcf_reader)\n" + " \\\n" + " (iwv_integral)--(iwv_magnitude)\n" + " \\\n" + " (cf_writer)\n\n" + "Advanced command line options", help_width, help_width - 4 + ); + + // create the pipeline stages here, they contain the + // documentation and parse command line. + // objects report all of their properties directly + // set default options here so that command line options override + // them. while we are at it connect the pipeline + p_teca_cf_reader cf_reader = teca_cf_reader::New(); + cf_reader->get_properties_description("cf_reader", advanced_opt_defs); + + p_teca_multi_cf_reader mcf_reader = teca_multi_cf_reader::New(); + mcf_reader->get_properties_description("mcf_reader", advanced_opt_defs); + + p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); + norm_coords->get_properties_description("norm_coords", advanced_opt_defs); + + p_teca_valid_value_mask vv_mask = teca_valid_value_mask::New(); + vv_mask->get_properties_description("vv_mask", advanced_opt_defs); + + p_teca_unpack_data unpack = teca_unpack_data::New(); + unpack->get_properties_description("unpack", advanced_opt_defs); + + p_teca_cf_reader elev_reader = teca_cf_reader::New(); + elev_reader->get_properties_description("elev_reader", advanced_opt_defs); + elev_reader->set_t_axis_variable(""); + + p_teca_normalize_coordinates elev_coords = teca_normalize_coordinates::New(); + elev_coords->get_properties_description("elev_coords", advanced_opt_defs); + elev_coords->set_enable_periodic_shift_x(1); + + p_teca_indexed_dataset_cache elev_cache = teca_indexed_dataset_cache::New(); + elev_cache->get_properties_description("elev_cache", advanced_opt_defs); + elev_cache->set_max_cache_size(1); + + p_teca_cartesian_mesh_source elev_mesh = teca_cartesian_mesh_source::New(); + elev_mesh->get_properties_description("elev_mesh", advanced_opt_defs); + + p_teca_cartesian_mesh_regrid elev_regrid = teca_cartesian_mesh_regrid::New(); + elev_regrid->get_properties_description("elev_regrid", advanced_opt_defs); + + p_teca_elevation_mask elev_mask = teca_elevation_mask::New(); + elev_mask->get_properties_description("elev_mask", advanced_opt_defs); + elev_mask->set_surface_elevation_variable("Z"); + elev_mask->set_mesh_height_variable("ZG"); + + p_teca_integrated_water_vapor iwv_int = teca_integrated_water_vapor::New(); + iwv_int->get_properties_description("iwv_integral", advanced_opt_defs); + iwv_int->set_specific_humidity_variable("Q"); + iwv_int->set_iwv_variable("IWV"); + + // Add an executive for the writer + p_teca_index_executive exec = teca_index_executive::New(); + + // Add the writer + p_teca_cf_writer cf_writer = teca_cf_writer::New(); + 
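The pipeline diagram in the advanced help text above summarizes what this new application builds: (cf / mcf_reader) -> (iwv_integral) -> (cf_writer). Ignoring the optional DEM/elevation-mask branch, the stages declared here are connected further down in this file roughly as follows; this is a condensed restatement of that wiring, not additional behavior.

    // reader -> coordinate normalization -> valid value mask -> unpack
    norm_coords->set_input_connection(reader->get_output_port());
    vv_mask->set_input_connection(norm_coords->get_output_port());
    unpack->set_input_connection(vv_mask->get_output_port());

    // integrated water vapor calculation, then the NetCDF CF writer
    iwv_int->set_input_connection(unpack->get_output_port());
    cf_writer->set_input_connection(iwv_int->get_output_port());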
cf_writer->get_properties_description("cf_writer", advanced_opt_defs); + cf_writer->set_verbose(0); + cf_writer->set_steps_per_file(128); + cf_writer->set_layout(teca_cf_writer::monthly); + + // package basic and advanced options for display + options_description all_opt_defs(help_width, help_width - 4); + all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); + + // parse the command line + int ierr = 0; + variables_map opt_vals; + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) + { + if (ierr == 1) + return 0; + return -1; + } + + // pass command line arguments into the pipeline objects + // advanced options are processed first, so that the basic + // options will override them + cf_reader->set_properties("cf_reader", opt_vals); + mcf_reader->set_properties("mcf_reader", opt_vals); + norm_coords->set_properties("norm_coords", opt_vals); + vv_mask->set_properties("vv_mask", opt_vals); + unpack->set_properties("unpack", opt_vals); + elev_reader->set_properties("elev_reader", opt_vals); + elev_coords->set_properties("elev_coords", opt_vals); + elev_mesh->set_properties("elev_mesh", opt_vals); + elev_cache->set_properties("elev_cache", opt_vals); + elev_regrid->set_properties("elev_regrid", opt_vals); + elev_mask->set_properties("elev_mask", opt_vals); + iwv_int->set_properties("iwv_integral", opt_vals); + cf_writer->set_properties("cf_writer", opt_vals); + + // now pass in the basic options, these are processed + // last so that they will take precedence + // configure the pipeline from the command line options. + p_teca_algorithm reader; + + // configure the reader + bool have_file = opt_vals.count("input_file"); + bool have_regex = opt_vals.count("input_regex"); + if ((have_file && have_regex) || !(have_file || have_regex)) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. 
" + "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " + "and --input_regex to activate the cf_reader (CAM like datasets)") + } + return -1; + } + + if (opt_vals.count("input_file")) + { + mcf_reader->set_input_file(opt_vals["input_file"].as()); + reader = mcf_reader; + } + else if (opt_vals.count("input_regex")) + { + cf_reader->set_files_regex(opt_vals["input_regex"].as()); + reader = cf_reader; + } + p_teca_algorithm head = reader; + + if (!opt_vals["x_axis_variable"].defaulted()) + { + cf_reader->set_x_axis_variable(opt_vals["x_axis_variable"].as()); + mcf_reader->set_x_axis_variable(opt_vals["x_axis_variable"].as()); + } + + if (!opt_vals["y_axis_variable"].defaulted()) + { + cf_reader->set_y_axis_variable(opt_vals["y_axis_variable"].as()); + mcf_reader->set_y_axis_variable(opt_vals["y_axis_variable"].as()); + } + + std::string z_var = "plev"; + if (!opt_vals["z_axis_variable"].defaulted()) + z_var = opt_vals["z_axis_variable"].as(); + + cf_reader->set_z_axis_variable(z_var); + mcf_reader->set_z_axis_variable(z_var); + + // set the inputs to the integrator + if (!opt_vals["specific_humidity"].defaulted()) + { + iwv_int->set_specific_humidity_variable( + opt_vals["specific_humidity"].as()); + } + + // set all that use or produce iwv + if (!opt_vals["iwv"].defaulted()) + iwv_int->set_iwv_variable(opt_vals["iwv"].as()); + + // add the valid value mask stage + norm_coords->set_input_connection(head->get_output_port()); + vv_mask->set_input_connection(norm_coords->get_output_port()); + unpack->set_input_connection(vv_mask->get_output_port()); + head = unpack; + + // add the elevation mask stages + teca_metadata md; + if (opt_vals.count("dem")) + { + if (mpi_man.get_comm_rank() == 0) + TECA_STATUS("Generating elevation mask") + + elev_reader->set_files_regex(opt_vals["dem"].as()); + + elev_coords->set_input_connection(elev_reader->get_output_port()); + + md = head->update_metadata(); + + elev_mesh->set_spatial_bounds(md, false); + elev_mesh->set_spatial_extents(md, false); + elev_mesh->set_x_axis_variable(md); + elev_mesh->set_y_axis_variable(md); + elev_mesh->set_z_axis_variable(md); + elev_mesh->set_t_axis_variable(md); + elev_mesh->set_t_axis(md); + + elev_regrid->set_input_connection(0, elev_mesh->get_output_port()); + elev_regrid->set_input_connection(1, elev_coords->get_output_port()); + + elev_cache->set_input_connection(elev_regrid->get_output_port()); + + elev_mask->set_input_connection(0, head->get_output_port()); + elev_mask->set_input_connection(1, elev_cache->get_output_port()); + + if (!opt_vals["dem_variable"].defaulted()) + elev_mask->set_surface_elevation_variable( + opt_vals["dem_variable"].as()); + + if (!opt_vals["mesh_height"].defaulted()) + elev_mask->set_mesh_height_variable( + opt_vals["mesh_height"].as()); + + elev_mask->set_mask_variables({ + iwv_int->get_specific_humidity_variable() + "_valid"}); + + head = elev_mask; + } + + iwv_int->set_input_connection(head->get_output_port()); + head = iwv_int; + + // tell the writer to write iwv if needed + std::vector point_arrays; + point_arrays.push_back(iwv_int->get_iwv_variable()); + + cf_writer->set_point_arrays(point_arrays); + + cf_writer->set_file_name(opt_vals["output_file"].as()); + + if (!opt_vals["steps_per_file"].defaulted()) + cf_writer->set_steps_per_file(opt_vals["steps_per_file"].as()); + + if (!opt_vals["first_step"].defaulted()) + cf_writer->set_first_step(opt_vals["first_step"].as()); + + if (!opt_vals["last_step"].defaulted()) + cf_writer->set_last_step(opt_vals["last_step"].as()); 
+ + if (!opt_vals["file_layout"].defaulted() && + cf_writer->set_layout(opt_vals["file_layout"].as())) + { + TECA_ERROR("An invalid file layout was provided \"" + << opt_vals["file_layout"].as() << "\"") + return -1; + } + + if (opt_vals.count("verbose")) + { + cf_writer->set_verbose(1); + exec->set_verbose(1); + } + + cf_writer->set_thread_pool_size(opt_vals["n_threads"].as()); + + // some minimal check for missing options + if (cf_writer->get_file_name().empty()) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("missing file name pattern for netcdf writer. " + "See --help for a list of command line options.") + } + return -1; + } + + // connect the fixed stages of the pipeline + cf_writer->set_input_connection(head->get_output_port()); + + // look for requested time step range, start + bool parse_start_date = opt_vals.count("start_date"); + bool parse_end_date = opt_vals.count("end_date"); + if (parse_start_date || parse_end_date) + { + // run the reporting phase of the pipeline + if (md.empty()) + md = reader->update_metadata(); + + teca_metadata atrs; + if (md.get("attributes", atrs)) + { + TECA_ERROR("metadata missing attributes") + return -1; + } + + teca_metadata time_atts; + std::string calendar; + std::string units; + if (atrs.get("time", time_atts) + || time_atts.get("calendar", calendar) + || time_atts.get("units", units)) + { + TECA_ERROR("failed to determine the calendaring parameters") + return -1; + } + + teca_metadata coords; + p_teca_variant_array time; + if (md.get("coordinates", coords) || !(time = coords.get("t"))) + { + TECA_ERROR("failed to determine time coordinate") + return -1; + } + + // convert date string to step, start date + if (parse_start_date) + { + unsigned long first_step = 0; + std::string start_date = opt_vals["start_date"].as(); + if (teca_coordinate_util::time_step_of(time, true, true, calendar, + units, start_date, first_step)) + { + TECA_ERROR("Failed to locate time step for start date \"" + << start_date << "\"") + return -1; + } + cf_writer->set_first_step(first_step); + } + + // and end date + if (parse_end_date) + { + unsigned long last_step = 0; + std::string end_date = opt_vals["end_date"].as(); + if (teca_coordinate_util::time_step_of(time, false, true, calendar, + units, end_date, last_step)) + { + TECA_ERROR("Failed to locate time step for end date \"" + << end_date << "\"") + return -1; + } + cf_writer->set_last_step(last_step); + } + } + + // run the pipeline + cf_writer->set_executive(exec); + cf_writer->update(); + + return 0; +} diff --git a/apps/teca_metadata_probe.cpp b/apps/teca_metadata_probe.cpp index 6d9f3d192..992d8d4da 100644 --- a/apps/teca_metadata_probe.cpp +++ b/apps/teca_metadata_probe.cpp @@ -3,6 +3,7 @@ #include "teca_netcdf_util.h" #include "teca_cf_reader.h" #include "teca_multi_cf_reader.h" +#include "teca_normalize_coordinates.h" #include "teca_array_collection.h" #include "teca_variant_array.h" #include "teca_coordinate_util.h" @@ -11,7 +12,7 @@ #include "teca_app_util.h" #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #include @@ -93,15 +94,22 @@ int main(int argc, char **argv) p_teca_multi_cf_reader mcf_reader = teca_multi_cf_reader::New(); mcf_reader->get_properties_description("mcf_reader", advanced_opt_defs); + p_teca_normalize_coordinates norm_coords = teca_normalize_coordinates::New(); + norm_coords->get_properties_description("norm_coords", advanced_opt_defs); + // package basic and advanced options for display options_description all_opt_defs(help_width, 
help_width - 4); all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -110,6 +118,7 @@ int main(int argc, char **argv) // options will override them cf_reader->set_properties("cf_reader", opt_vals); mcf_reader->set_properties("mcf_reader", opt_vals); + norm_coords->set_properties("norm_coords", opt_vals); // now pas in the basic options, these are procesed // last so that they will take precedence @@ -138,6 +147,18 @@ int main(int argc, char **argv) bool have_file = opt_vals.count("input_file"); bool have_regex = opt_vals.count("input_regex"); + // validate the input method + if ((have_file && have_regex) || !(have_file || have_regex)) + { + if (rank == 0) + { + TECA_ERROR("Exactly one of --input_file or --input_regex can be specified. " + "Use --input_file to activate the multi_cf_reader (CMIP6 datasets) " + "and --input_regex to activate the cf_reader (CAM like datasets)") + } + return -1; + } + p_teca_algorithm reader; if (opt_vals.count("input_file")) { @@ -155,6 +176,8 @@ int main(int argc, char **argv) z_var = cf_reader->get_z_axis_variable(); reader = cf_reader; } + norm_coords->set_input_connection(reader->get_output_port()); + norm_coords->set_verbose(2); std::string time_i; if (opt_vals.count("start_date")) @@ -164,20 +187,8 @@ int main(int argc, char **argv) if (opt_vals.count("end_date")) time_j = opt_vals["end_date"].as(); - // some minimal check for mising options - if ((have_file && have_regex) || !(have_file || have_regex)) - { - if (rank == 0) - { - TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. 
" - "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " - "and --input_regex to activate the cf_reader (CAM like datasets)") - } - return -1; - } - // run the reporting phase of the pipeline - teca_metadata md = reader->update_metadata(); + teca_metadata md = norm_coords->update_metadata(); // from here on out just rank 0 if (rank == 0) @@ -248,7 +259,7 @@ int main(int argc, char **argv) int Y = 0, M = 0, D = 0, h = 0, m = 0; double s = 0; #if defined(TECA_HAS_UDUNITS) - if (calcalcs::date(time->get(i0), &Y, &M, &D, &h, &m, &s, + if (teca_calcalcs::date(time->get(i0), &Y, &M, &D, &h, &m, &s, units.c_str(), calendar.c_str())) { TECA_ERROR("failed to detmine the first available time in the file") @@ -264,7 +275,7 @@ int main(int argc, char **argv) // human readbale last time available Y = 0, M = 0, D = 0, h = 0, m = 0, s = 0; #if defined(TECA_HAS_UDUNITS) - if (calcalcs::date(time->get(i1), &Y, &M, &D, &h, &m, &s, + if (teca_calcalcs::date(time->get(i1), &Y, &M, &D, &h, &m, &s, units.c_str(), calendar.c_str())) { TECA_ERROR("failed to detmine the last available time in the file") @@ -344,26 +355,56 @@ int main(int argc, char **argv) } std::cerr << std::endl; + // report extents + long extent[6] = {0l}; + if (!md.get("whole_extent", extent, 6)) + { + std::cerr << "Mesh extents: " << extent[0] << ", " << extent[1] + << ", " << extent[2] << ", " << extent[3]; + if (!z_var.empty()) + { + std::cerr << ", " << extent[4] << ", " << extent[5]; + } + std::cerr << std::endl; + } + + // report bounds + double bounds[6] = {0.0}; + if (!md.get("bounds", bounds, 6)) + { + std::cerr << "Mesh bounds: " << bounds[0] << ", " << bounds[1] + << ", " << bounds[2] << ", " << bounds[3]; + if (!z_var.empty()) + { + std::cerr << ", " << bounds[4] << ", " << bounds[5]; + } + std::cerr << std::endl; + } + + // report the arrays size_t n_arrays = atrs.size(); // column widths - int aiw = 0; - int anw = 0; - int atw = 0; - int adw = 0; - int asw = 0; + int aiw = 4; + int anw = 8; + int atw = 8; + int acw = 14; + int adw = 15; + int asw = 9; // column data std::vector ai; std::vector an; std::vector at; + std::vector ac; std::vector ad; std::vector as; ai.reserve(n_arrays); an.reserve(n_arrays); at.reserve(n_arrays); + ac.reserve(n_arrays); ad.reserve(n_arrays); as.reserve(n_arrays); @@ -378,10 +419,14 @@ int main(int argc, char **argv) int id = 0; p_teca_size_t_array dims; p_teca_string_array dim_names; + int centering = 0; + int n_active_dims = 0; if (atrs.get(array, atts) || atts.get("cf_type_code", 0, type) || atts.get("cf_id", 0, id) + || atts.get("centering", centering) + || atts.get("n_active_dims", n_active_dims) || !(dims = std::dynamic_pointer_cast(atts.get("cf_dims"))) || !(dim_names = std::dynamic_pointer_cast(atts.get("cf_dim_names")))) { @@ -404,6 +449,11 @@ int main(int argc, char **argv) ) atw = std::max(atw, at.back().size() + 4); + // centering + ac.push_back(teca_array_attributes::centering_to_string(centering) + + std::string(" ") + std::to_string(n_active_dims) + "D"); + acw = std::max(acw, ac.back().size() + 4); + // dims int n_dims = dim_names->size(); @@ -444,10 +494,11 @@ int main(int argc, char **argv) << std::setw(aiw) << std::left << "Id" << std::setw(anw) << std::left << "Name" << std::setw(atw) << std::left << "Type" + << std::setw(acw) << std::left << "Centering" << std::setw(adw) << std::left << "Dimensions" << std::setw(asw) << std::left << "Shape" << std::endl; - int tw = anw + atw + adw + asw; + int tw = aiw + anw + atw + adw + acw + asw; for (int i = 0; i < tw; 
++i) std::cerr << '-'; std::cerr << std::endl; @@ -459,6 +510,7 @@ int main(int argc, char **argv) << std::setw(aiw) << std::left << ai[i] << std::setw(anw) << std::left << an[i] << std::setw(atw) << std::left << at[i] + << std::setw(acw) << std::left << ac[i] << std::setw(adw) << std::left << ad[i] << std::setw(asw) << std::left << as[i] << std::endl; diff --git a/apps/teca_tc_detect.cpp b/apps/teca_tc_detect.cpp index f8483f171..8171d27eb 100644 --- a/apps/teca_tc_detect.cpp +++ b/apps/teca_tc_detect.cpp @@ -19,7 +19,7 @@ #include "teca_mpi_manager.h" #include "teca_coordinate_util.h" #include "teca_app_util.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" #include #include @@ -204,14 +204,18 @@ int main(int argc, char **argv) track_writer->get_properties_description("track_writer", advanced_opt_defs); // package basic and advanced options for display - options_description all_opt_defs(-1, -1); + options_description all_opt_defs(help_width, help_width - 4); all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -267,22 +271,21 @@ int main(int argc, char **argv) surf_wind->set_component_1_variable( opt_vals["surface_wind_v"].as()); - std::vector dep_var; - core_temp->get_dependent_variables(dep_var); if (!opt_vals["500mb_temp"].defaulted()) - dep_var[0] = opt_vals["500mb_temp"].as(); + core_temp->set_dependent_variable(0, + opt_vals["500mb_temp"].as()); + if (!opt_vals["200mb_temp"].defaulted()) - dep_var[1] = opt_vals["200mb_temp"].as(); - core_temp->set_dependent_variables(dep_var); - dep_var.clear(); + core_temp->set_dependent_variable(1, + opt_vals["200mb_temp"].as()); - thickness->get_dependent_variables(dep_var); if (!opt_vals["1000mb_height"].defaulted()) - dep_var[0] = opt_vals["1000mb_height"].as(); + thickness->set_dependent_variable(0, + opt_vals["1000mb_height"].as()); + if (!opt_vals["200mb_height"].defaulted()) - dep_var[1] = opt_vals["200mb_height"].as(); - thickness->set_dependent_variables(dep_var); - dep_var.clear(); + thickness->set_dependent_variable(1, + opt_vals["200mb_height"].as()); if (!opt_vals["sea_level_pressure"].defaulted()) candidates->set_sea_level_pressure_variable( @@ -375,29 +378,31 @@ int main(int argc, char **argv) // now that command line opts have been parsed we can create // the programmable algorithms' functors - core_temp->get_dependent_variables(dep_var); - if (dep_var.size() != 2) + size_t n_var = core_temp->get_number_of_dependent_variables(); + if (n_var != 2) { TECA_ERROR("core temperature calculation requires 2 " - "variables. given " << dep_var.size()) + "variables. given " << n_var) return -1; } core_temp->set_execute_callback( - point_wise_average(dep_var[0], dep_var[1], - core_temp->get_derived_variable())); - dep_var.clear(); + point_wise_average( + core_temp->get_dependent_variable(0), + core_temp->get_dependent_variable(1), + core_temp->get_derived_variable())); - thickness->get_dependent_variables(dep_var); - if (dep_var.size() != 2) + n_var = thickness->get_number_of_dependent_variables(); + if (n_var != 2) { TECA_ERROR("thickness calculation requires 2 " - "variables. given " << dep_var.size()) + "variables. 
given " << n_var) return -1; } thickness->set_execute_callback( - point_wise_difference(dep_var[0], dep_var[1], - thickness->get_derived_variable())); - dep_var.clear(); + point_wise_difference( + thickness->get_dependent_variable(0), + thickness->get_dependent_variable(1), + thickness->get_derived_variable())); // and tell the candidate stage what variables the functors produce candidates->set_surface_wind_speed_variable(surf_wind->get_l2_norm_variable()); @@ -432,10 +437,8 @@ int main(int argc, char **argv) } teca_metadata coords; - p_teca_double_array time; - if (md.get("coordinates", coords) || - !(time = std::dynamic_pointer_cast( - coords.get("t")))) + p_teca_variant_array time; + if (md.get("coordinates", coords) || !(time = coords.get("t"))) { TECA_ERROR("failed to determine time coordinate") return -1; diff --git a/apps/teca_tc_trajectory.cpp b/apps/teca_tc_trajectory.cpp index 6e9c190dd..a7a945b98 100644 --- a/apps/teca_tc_trajectory.cpp +++ b/apps/teca_tc_trajectory.cpp @@ -16,7 +16,7 @@ #include "teca_table_writer.h" #include "teca_mpi_manager.h" #include "teca_coordinate_util.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" #include "teca_app_util.h" #include @@ -105,10 +105,14 @@ int main(int argc, char **argv) all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } diff --git a/apps/teca_tc_wind_radii.cpp b/apps/teca_tc_wind_radii.cpp index 4ded8748e..8654d748a 100644 --- a/apps/teca_tc_wind_radii.cpp +++ b/apps/teca_tc_wind_radii.cpp @@ -42,7 +42,7 @@ int main(int argc, char **argv) "Basic command line options", help_width, help_width - 4 ); basic_opt_defs.add_options() - ("track_file", value(), "\na file containing cyclone tracks (tracks.bin)\n") + ("track_file", value(), "\na file containing cyclone tracks\n") ("input_file", value(), "\na teca_multi_cf_reader configuration file" " identifying the set of NetCDF CF2 files to process. 
When present data is" @@ -135,10 +135,14 @@ int main(int argc, char **argv) all_opt_defs.add(basic_opt_defs).add(advanced_opt_defs); // parse the command line + int ierr = 0; variables_map opt_vals; - if (teca_app_util::process_command_line_help(mpi_man.get_comm_rank(), - argc, argv, basic_opt_defs, advanced_opt_defs, all_opt_defs, opt_vals)) + if ((ierr = teca_app_util::process_command_line_help( + mpi_man.get_comm_rank(), argc, argv, basic_opt_defs, + advanced_opt_defs, all_opt_defs, opt_vals))) { + if (ierr == 1) + return 0; return -1; } @@ -156,12 +160,33 @@ int main(int argc, char **argv) // now pass in the basic options, these are processed // last so that they will take precedence - if (!opt_vals["track_file"].defaulted()) - track_reader->set_file_name(opt_vals["track_file"].as()); + if (!opt_vals.count("track_file")) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("A file with previously calculated storm tracks must be " + "specified with --track_file") + } + return -1; + } + + track_reader->set_file_name(opt_vals["track_file"].as()); bool have_file = opt_vals.count("input_file"); bool have_wind_files = opt_vals.count("wind_files"); bool have_regex = opt_vals.count("input_regex"); + + if ((have_file && have_regex) || !(have_file || have_regex)) + { + if (mpi_man.get_comm_rank() == 0) + { + TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. " + "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " + "and --input_regex to activate the cf_reader (CAM like datasets)") + } + return -1; + } + p_teca_algorithm wind_reader; if (have_file) { @@ -236,18 +261,6 @@ int main(int argc, char **argv) else map_reduce->set_thread_pool_size(-1); - // some minimal check for missing options - if ((have_file && have_regex) || !(have_file || have_regex)) - { - if (mpi_man.get_comm_rank() == 0) - { - TECA_ERROR("Extacly one of --input_file or --input_regex can be specified. " - "Use --input_file to activate the multi_cf_reader (HighResMIP datasets) " - "and --input_regex to activate the cf_reader (CAM like datasets)") - } - return -1; - } - // connect the pipeline wind_coords->set_input_connection(wind_reader->get_output_port()); wind_radii->set_input_connection(0, track_input->get_output_port()); diff --git a/apps/teca_temporal_reduction.in b/apps/teca_temporal_reduction.in index f14d653df..22178f0f3 100755 --- a/apps/teca_temporal_reduction.in +++ b/apps/teca_temporal_reduction.in @@ -66,6 +66,14 @@ parser.add_argument('--output_file', type=str, required=True, ' step in the file. Use --date_format to change' ' the formatting') +parser.add_argument('--file_layout', type=str, default='yearly', + help='Selects the size and layout of the set of output' + ' files. May be one of number_of_steps, daily,' + ' monthly, seasonal, or yearly. Files are structured' + ' such that each file contains one of the selected' + ' interval. 
For the number_of_steps option use' + ' --steps_per_file.') + parser.add_argument('--steps_per_file', type=int, default=128, help='number of time steps to write to each output ' 'file') @@ -85,7 +93,7 @@ parser.add_argument('--t_axis_variable', type=str, default='time', help='name of the variable to use for t-coordinates') parser.add_argument('--n_threads', type=int, default=2, - help='Number of threads to use when stremaing the ' + help='Number of threads to use when streaming the ' 'reduction') parser.add_argument('--verbose', type=int, default=0, @@ -99,6 +107,7 @@ except Exception: in_files = args.input_regex out_files = args.output_file +layout = args.file_layout steps_per_file = args.steps_per_file n_threads = args.n_threads interval = args.interval @@ -115,6 +124,7 @@ verbose = args.verbose if verbose and rank == 0: sys.stderr.write('running on %d ranks' % (n_ranks)) sys.stderr.write('n_threads=%d\n' % (n_threads)) + sys.stderr.write('file_layout=%s\n'%(layout)) sys.stderr.write('steps_per_file=%d\n' % (steps_per_file)) sys.stderr.write('interval=%s\n' % (interval)) sys.stderr.write('operator=%s\n' % (operator)) @@ -152,6 +162,7 @@ cfw = teca_cf_writer.New() cfw.set_input_connection(mav.get_output_port()) cfw.set_verbose(verbose) cfw.set_thread_pool_size(1) +cfw.set_layout(layout) cfw.set_steps_per_file(steps_per_file) cfw.set_file_name(out_files) cfw.set_point_arrays(point_arrays) diff --git a/core/CMakeLists.txt b/core/CMakeLists.txt index 525e3bcef..c1251e2db 100644 --- a/core/CMakeLists.txt +++ b/core/CMakeLists.txt @@ -7,7 +7,6 @@ set(teca_core_srcs teca_algorithm_executive.cxx teca_bad_cast.cxx teca_binary_stream.cxx - teca_calendar.cxx teca_common.cxx teca_dataset.cxx teca_dataset_source.cxx @@ -45,7 +44,7 @@ endif() if (TECA_HAS_UDUNITS) include_directories(SYSTEM ${UDUNITS_INCLUDE_DIR}) list(APPEND teca_core_link ${UDUNITS_LIBRARY}) - list(APPEND teca_core_srcs calcalcs.cxx) + list(APPEND teca_core_srcs teca_calcalcs.cxx) endif() list(APPEND teca_core_link pthread) diff --git a/core/teca_algorithm.cxx b/core/teca_algorithm.cxx index 8fe7136e9..d1801f035 100644 --- a/core/teca_algorithm.cxx +++ b/core/teca_algorithm.cxx @@ -12,6 +12,10 @@ #include #include +#if defined(TECA_HAS_BOOST) +#include +#endif + using std::vector; using std::map; using std::string; @@ -382,7 +386,8 @@ void teca_algorithm_internals::from_stream(istream &is) // -------------------------------------------------------------------------- -teca_algorithm::teca_algorithm() : internals(new teca_algorithm_internals) +teca_algorithm::teca_algorithm() : verbose(0), + internals(new teca_algorithm_internals) {} // -------------------------------------------------------------------------- @@ -403,6 +408,25 @@ MPI_Comm teca_algorithm::get_communicator() return this->internals->comm; } +#if defined(TECA_HAS_BOOST) +// -------------------------------------------------------------------------- +void teca_algorithm::get_properties_description( + const string &prefix, options_description &opts) +{ + opts.add_options() + TECA_POPTS_GET(int, prefix, verbose, + "Set to non-zero to send diagnostic messages to the terminal") + ; +} + +// -------------------------------------------------------------------------- +void teca_algorithm::set_properties( + const string &prefix, variables_map &opts) +{ + TECA_POPTS_SET(opts, int, prefix, verbose) +} +#endif + // -------------------------------------------------------------------------- teca_algorithm_output_port teca_algorithm::get_output_port( unsigned int port) diff --git 
a/core/teca_algorithm.h b/core/teca_algorithm.h index 9a8dbb9ac..4fd2dc709 100644 --- a/core/teca_algorithm.h +++ b/core/teca_algorithm.h @@ -2,25 +2,238 @@ #define teca_algorithm_h #include "teca_config.h" - -// forward delcaration of ref counted types -#include "teca_dataset_fwd.h" -#include "teca_algorithm_fwd.h" -#include "teca_algorithm_executive_fwd.h" -class teca_algorithm_internals; - -// for types used in the api +#include "teca_shared_object.h" +#include "teca_dataset.h" +#include "teca_algorithm_executive.h" #include "teca_metadata.h" -#include "teca_algorithm_output_port.h" #include "teca_program_options.h" #include "teca_mpi.h" #include #include #include +#include +#include -// interface to teca pipeline architecture. all sources/readers -// filters, sinks/writers will implement this interface +class teca_algorithm_internals; + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_algorithm) + +/// An output port packages an algorithm and a port number +using teca_algorithm_output_port + = std::pair; + +/// get the algorithm from the output port +inline +p_teca_algorithm &get_algorithm(teca_algorithm_output_port &op) +{ return op.first; } + +/// get port number from the output port +inline +unsigned int &get_port(teca_algorithm_output_port &op) +{ return op.second; } + +/* this is a convenience macro to be used to declare a static New method that + * will be used to construct new objects in shared_ptr's. This manages the + * details of interoperability with std C++11 shared pointer + */ +#define TECA_ALGORITHM_STATIC_NEW(T) \ + \ +/** Returns an instance of T */ \ +static p_##T New() \ +{ \ + return p_##T(new T); \ +} \ + \ +/** Enables the static constructor */ \ +std::shared_ptr shared_from_this() \ +{ \ + return std::static_pointer_cast( \ + teca_algorithm::shared_from_this()); \ +} \ + \ +/** Enables the static constructor */ \ +std::shared_ptr shared_from_this() const \ +{ \ + return std::static_pointer_cast( \ + teca_algorithm::shared_from_this()); \ +} + +#define TECA_ALGORITHM_CLASS_NAME(T) \ +/** returns the name of the class */ \ +const char *get_class_name() const override \ +{ \ + return #T; \ +} + +/** this convenience macro removes copy and assignment operators + * which generally should not be defined for reference counted types + */ +#define TECA_ALGORITHM_DELETE_COPY_ASSIGN(T) \ + \ + T(const T &src) = delete; \ + T(T &&src) = delete; \ + \ + T &operator=(const T &src) = delete; \ + T &operator=(T &&src) = delete; + +/** convenience macro to declare standard set_NAME/get_NAME methods + * where NAME is the name of a class member. will manage the + * algorithm's modified state for the user. + */ +#define TECA_ALGORITHM_PROPERTY(T, NAME) \ + \ +/** Set the value of the NAME algorithm property */ \ +void set_##NAME(const T &v) \ +{ \ + if (this->NAME != v) \ + { \ + this->NAME = v; \ + this->set_modified(); \ + } \ +} \ + \ +/** Get the value of the NAME algorithm property */ \ +const T &get_##NAME() const \ +{ \ + return this->NAME; \ +} + +/** similar to TECA_ALGORITHM_PROPERTY but prior to setting NAME + * will call the member function int valididate_NAME(T v). If + * the value v is valid the fucntion should return 0. If the value + * is not zero the function should invoke TECA_ERROR with a + * descriptive message and return non-zero. 
+ */ +#define TECA_ALGORITHM_PROPERTY_V(T, NAME) \ + \ +/** Set the value of the NAME algorithm property */ \ +void set_##NAME(const T &v) \ +{ \ + if (this->validate_ ## NAME (v)) \ + return; \ + \ + if (this->NAME != v) \ + { \ + this->NAME = v; \ + this->set_modified(); \ + } \ +} \ + \ +/** Get the value of the NAME algorithm property */ \ +const T &get_##NAME() const \ +{ \ + return this->NAME; \ +} + +/** convenience macro to declare standard set_NAME/get_NAME methods + * where NAME is the name of a class member. will manage the + * algorithm's modified state for the user. + */ +#define TECA_ALGORITHM_VECTOR_PROPERTY(T, NAME) \ + \ +/** get the size of the NAME algorithm vector property */ \ +size_t get_number_of_##NAME##s () \ +{ \ + return this->NAME##s.size(); \ +} \ + \ +/** append to the NAME algorithm vector property */ \ +void append_##NAME(const T &v) \ +{ \ + this->NAME##s.push_back(v); \ + this->set_modified(); \ +} \ + \ +/** set the i-th element of the NAME algorithm vector property */ \ +void set_##NAME(size_t i, const T &v) \ +{ \ + if (this->NAME##s[i] != v) \ + { \ + this->NAME##s[i] = v; \ + this->set_modified(); \ + } \ +} \ + \ +/** set the NAME algorithm vector property */ \ +void set_##NAME##s(const std::vector &v) \ +{ \ + if (this->NAME##s != v) \ + { \ + this->NAME##s = v; \ + this->set_modified(); \ + } \ +} \ + \ +/** set the NAME algorithm vector property */ \ +void set_##NAME##s(const std::initializer_list &&l) \ +{ \ + std::vector v(l); \ + if (this->NAME##s != v) \ + { \ + this->NAME##s = v; \ + this->set_modified(); \ + } \ +} \ + \ +/** get the i-th element of the NAME algorithm vector property */ \ +const T &get_##NAME(size_t i) const \ +{ \ + return this->NAME##s[i]; \ +} \ + \ +/** get the NAME algorithm vector property */ \ +const std::vector &get_##NAME##s() const \ +{ \ + return this->NAME##s; \ +} \ + \ +/** clear the NAME algorithm vector property */ \ +void clear_##NAME##s() \ +{ \ + this->NAME##s.clear(); \ +} + +/// helper that allows us to use std::function as a TECA_ALGORITHM_PROPERTY +template +bool operator!=(const std::function &lhs, const std::function &rhs) +{ + return &rhs != &lhs; +} + +/** This is a work around for older versions of Apple clang + * Apple LLVM version 4.2 (clang-425.0.28) (based on LLVM 3.2svn) + * Target: x86_64-apple-darwin12.6.0 + */ +#define TECA_ALGORITHM_CALLBACK_PROPERTY(T, NAME) \ + \ +/** Set the NAME algorithm property */ \ +void set_##NAME(const T &v) \ +{ \ + /*if (this->NAME != v)*/ \ + /*{*/ \ + this->NAME = v; \ + this->set_modified(); \ + /*}*/ \ +} \ + \ +/** Get the NAME algorithm property */ \ +const T &get_##NAME() const \ +{ \ + return this->NAME; \ +} \ + \ +/** Get the NAME algorithm property */ \ +T &get_##NAME() \ +{ \ + return this->NAME; \ +} + + +/// The interface to TECA pipeline architecture. +/** + * All sources/readers filters, sinks/writers will implement this interface. + */ class teca_algorithm : public std::enable_shared_from_this { public: @@ -29,98 +242,131 @@ class teca_algorithm : public std::enable_shared_from_this TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_algorithm) - // return the name of the class. + /// return the name of the class. virtual const char *get_class_name() const = 0; - // set/get the communicator to use at this stage of the pipeline this has - // no influence on other stages. We duplicate the passed in communicator - // providing an isolated communication space for subsequent operations. 
By - // default the communicator is initialized to MPI_COMM_WORLD, here it is not - // duplicated. Thus to put an algorithm into a unique communication space - // one should explicitly set a communicator. When an algorithm should not - // use MPI, for instance when it is in a nested pipeline, one may set the - // communicator to MPI_COMM_SELF. + /** set the communicator to use at this stage of the pipeline this has + * no influence on other stages. We duplicate the passed in communicator + * providing an isolated communication space for subsequent operations. By + * default the communicator is initialized to MPI_COMM_WORLD, here it is not + * duplicated. Thus to put an algorithm into a unique communication space + * one should explicitly set a communicator. When an algorithm should not + * use MPI, for instance when it is in a nested pipeline, one may set the + * communicator to MPI_COMM_SELF. + */ void set_communicator(MPI_Comm comm); + + /// get the active communicator MPI_Comm get_communicator(); #if defined(TECA_HAS_BOOST) - // initialize the given options description - // with algorithm's properties - virtual void get_properties_description(const std::string &, options_description &) - {} - - // initialize the algorithm from the given options - // variable map. - virtual void set_properties(const std::string &, variables_map &) - {} + /** initialize the given options description with algorithm's properties + * implementors should call the base implementation when overriding. + * this should be called after the override adds its options. + */ + virtual void get_properties_description(const std::string &prefix, + options_description &opts); + + /** initialize the algorithm from the given options variable map. + * implementors should call the base implementation when overriding. + * this should be called before the override sets its properties. + */ + virtual void set_properties(const std::string &prefix, + variables_map &opts); #endif - // get an output port from the algorithm. to be used - // during pipeline building + /** @name verbose + * if set to a non-zero value, rank 0 will send status information to the + * terminal. The default setting of zero results in no output. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(int, verbose) + ///@} + + /** get an output port from the algorithm. to be used during pipeline + * building + */ virtual teca_algorithm_output_port get_output_port(unsigned int port = 0); - // set an input to this algorithm + /// set an input to this algorithm void set_input_connection(const teca_algorithm_output_port &port) { this->set_input_connection(0, port); } + /// set an input to this algorithm virtual void set_input_connection(unsigned int id, const teca_algorithm_output_port &port); - // remove input connections + /// remove input connections virtual void remove_input_connection(unsigned int id); - // remove all input connections + /// remove all input connections void clear_input_connections(); - // access the cached data produced by this algorithm. when no - // request is specified the dataset on the top(most recent) of - // the cache is returned. When a request is specified it may - // optionally be filtered by the implementations cache key filter. - // see also get_cache_key (threadsafe) + /** access the cached data produced by this algorithm. when no request is + * specified the dataset on the top(most recent) of the cache is returned. + * When a request is specified it may optionally be filtered by the + * implementations cache key filter. 
see also get_cache_key (threadsafe) + */ const_p_teca_dataset get_output_data(unsigned int port = 0); - // remove a dataset from the top/bottom of the cache. the - // top of the cache has the most recently created dataset. - // top or bottom is selected via the boolean argument. - // (threadsafe) + /** remove a dataset from the top/bottom of the cache. the top of the cache + * has the most recently created dataset. top or bottom is selected via + * the boolean argument. (threadsafe) + */ void pop_cache(unsigned int port = 0, int top = 0); - // set the cache size. the default is 1. (threadsafe) + /// set the cache size. the default is 1. (threadsafe) void set_cache_size(unsigned int n); - // execute the pipeline from this instance up. + /// execute the pipeline from this instance up. virtual int update(); + + /// execute the pipeline from this instance up. virtual int update(unsigned int port); - // get meta data considering this instance up. + /// get meta data considering this instance up. virtual teca_metadata update_metadata(unsigned int port = 0); - // set the executive + /// set the executive void set_executive(p_teca_algorithm_executive exe); + + /// get the executive p_teca_algorithm_executive get_executive(); - // serialize the configuration to a stream. this should - // store the public user modifiable properties so that - // runtime configuration may be saved and restored.. + /** serialize the configuration to a stream. this should store the public + * user modifiable properties so that runtime configuration may be saved + * and restored. + */ virtual void to_stream(std::ostream &s) const; + + /// deserialize from the stream. virtual void from_stream(std::istream &s); protected: teca_algorithm(); - // implementations should call this from their constructors - // to setup the internal caches and data structures required - // for execution. + /** Set the number of input connections. implementations should call this + * from their constructors to setup the internal caches and data structures + * required for execution. + */ void set_number_of_input_connections(unsigned int n); + + /** Set the number of output ports. implementations should call this from + * their constructors to setup the internal caches and data structures + * required for execution. + */ void set_number_of_output_ports(unsigned int n); - // set the modified flag on the given output port's cache. - // should be called when user modifies properties on the - // object that require the output to be regenerated. + /** set the modified flag on the given output port's cache. should be + * called when user modifies properties on the object that require the + * output to be regenerated. + */ virtual void set_modified(); + + /// an overload to set_modified by port void set_modified(unsigned int port); protected: @@ -129,46 +375,43 @@ class teca_algorithm : public std::enable_shared_from_this // teca_algorithm's such as reader, filters, and // writers. - // implementations must override this method to provide - // information to downstream consumers about what data - // will be produced on each output port. The port to - // provide information about is named in the first argument - // the second argument contains a list of the metadata - // describing data on all of the inputs. + /** implementations must override this method to provide information to + * downstream consumers about what data will be produced on each output + * port. 
The port to provide information about is named in the first + * argument the second argument contains a list of the metadata describing + * data on all of the inputs. + */ virtual teca_metadata get_output_metadata(unsigned int port, const std::vector &input_md); - // implementations must override this method and - // generate a set of requests describing the data - // required on the inputs to produce data for the - // named output port, given the upstream meta data - // and request. If no data is needed on an input - // then the list should contain a null request. + /** implementations must override this method and generate a set of + * requests describing the data required on the inputs to produce data for + * the named output port, given the upstream meta data and request. If no + * data is needed on an input then the list should contain a null request. + */ virtual std::vector get_upstream_request( unsigned int port, const std::vector &input_md, const teca_metadata &request); - // implementations must override this method and - // produce the output dataset for the port named - // in the first argument. The second argument is - // a list of all of the input datasets. See also - // get_request. The third argument contains a request - // from the consumer which can spcify information - // such as arrays, subset region, timestep etc. - // The implementation is free to handle the request - // as it sees fit. + /** implementations must override this method and produce the output dataset + * for the port named in the first argument. The second argument is a list + * of all of the input datasets. See also get_request. The third argument + * contains a request from the consumer which can specify information such + * as arrays, subset region, timestep etc. The implementation is free to + * handle the request as it sees fit. + */ virtual const_p_teca_dataset execute(unsigned int port, const std::vector &input_data, const teca_metadata &request); - // implementations may choose to override this method - // to gain control of keys used in the cache. By default - // the passed in request is used as the key. This overide - // gives implementor the chance to filter the passed in - // request. + /** implementations may choose to override this method to gain control of + * keys used in the cache. By default the passed in request is used as the + * key. This override gives implementor the chance to filter the passed in + * request. + */ virtual teca_metadata get_cache_key(unsigned int port, const teca_metadata &request) const; @@ -176,62 +419,71 @@ class teca_algorithm : public std::enable_shared_from_this protected: // this section contains methods that control the // pipeline's behavior. these would typically only -// need to be overriden when designing a new class +// need to be overridden when designing a new class // of algorithms. - // driver function that manage meta data reporting phase - // of pipeline execution. + /** driver function that manage meta data reporting phase of pipeline + * execution. + */ virtual teca_metadata get_output_metadata( teca_algorithm_output_port ¤t); - // driver function that manages execution of the given - // requst on the named port + /* driver function that manages execution of the given request on the named + * port + */ virtual const_p_teca_dataset request_data( teca_algorithm_output_port &port, const teca_metadata &request); - // driver function that clears the output data cache - // where modified flag has been set from the current - // port upstream. 
+ /** driver function that clears the output data cache where modified flag + * has been set from the current port upstream. + */ virtual int validate_cache(teca_algorithm_output_port ¤t); - // driver function that clears the modified flag on the - // named port and all of it's upstream connections. + /** driver function that clears the modified flag on the named port and all + * of it's upstream connections. + */ virtual void clear_modified(teca_algorithm_output_port current); protected: // api exposing internals for use in driver methods - // search the given port's cache for the dataset associated - // with the given request. see also get_cache_key. (threadsafe) + /** search the given port's cache for the dataset associated + * with the given request. see also get_cache_key. (threadsafe) + */ const_p_teca_dataset get_output_data(unsigned int port, const teca_metadata &request); - // add or update the given request , dataset pair in the cache. - // see also get_cache_key. (threadsafe) + /** add or update the given request , dataset pair in the cache. see also + * get_cache_key. (threadsafe) + */ int cache_output_data(unsigned int port, const teca_metadata &request, const_p_teca_dataset &data); - // clear the cache on the given output port + /// clear the cache on the given output port void clear_cache(unsigned int port); - // get the number of input connections + /// get the number of input connections unsigned int get_number_of_input_connections(); - // get the output port associated with this algorithm's - // i'th input connection. + /** get the output port associated with this algorithm's i'th input + * connection. + */ teca_algorithm_output_port &get_input_connection(unsigned int i); - // clear the modified flag on the i'th output + /// clear the modified flag on the i'th output void clear_modified(unsigned int port); - // return the output port's modified flag value + /// return the output port's modified flag value int get_modified(unsigned int port) const; +protected: + int verbose; + private: teca_algorithm_internals *internals; diff --git a/core/teca_algorithm_executive.cxx b/core/teca_algorithm_executive.cxx index 95e5fc865..e5361354f 100644 --- a/core/teca_algorithm_executive.cxx +++ b/core/teca_algorithm_executive.cxx @@ -13,6 +13,7 @@ int teca_algorithm_executive::initialize(MPI_Comm comm, const teca_metadata &md) return -1; } + m_request.set("index_request_key", request_key); m_request.set(request_key, 0); return 0; diff --git a/core/teca_algorithm_executive.h b/core/teca_algorithm_executive.h index 949ae4d3d..239480438 100644 --- a/core/teca_algorithm_executive.h +++ b/core/teca_algorithm_executive.h @@ -1,25 +1,57 @@ #ifndef teca_algorithm_executive_h #define teca_algorithm_executive_h -#include "teca_algorithm_executive_fwd.h" #include "teca_metadata.h" #include "teca_mpi.h" +#include "teca_shared_object.h" -// base class and default implementation for executives. algorithm -// executives can control pipeline execution by providing a series -// of requests. this allows for the executive to act as a load -// balancer. the executive can for example partition requests across -// spatial data, time steps, or file names. in an MPI parallel -// setting the executive could coordinate this partitioning amongst -// the ranks. However, the only requirement of an algorithm executive -// is that it provide at least one non-empty request. -// -// the default implementation creates a single trivially non-empty -// request containing the key "__request_empty = 0". 
This will cause -// the pipeline to be executed once but will result in no data being -// requested. Therefore when the default implementation is used -// upstream algorithms must fill in the requests further to pull -// data as needed. +TECA_SHARED_OBJECT_FORWARD_DECL(teca_algorithm_executive) + +/* this is a convenience macro to be used to declare a static + * New method that will be used to construct new objects in + * shared_ptr's. This manages the details of interoperability + * with std C++11 shared pointer + */ +#define TECA_ALGORITHM_EXECUTIVE_STATIC_NEW(T) \ + \ + \ +/** Allocate a new T */ \ +static p_##T New() \ +{ \ + return p_##T(new T); \ +} \ + \ +std::shared_ptr shared_from_this() \ +{ \ + return std::static_pointer_cast( \ + teca_algorithm_executive::shared_from_this()); \ +} \ + \ +std::shared_ptr shared_from_this() const \ +{ \ + return std::static_pointer_cast( \ + teca_algorithm_executive::shared_from_this()); \ +} + + + +/// Base class and default implementation for executives. +/** + * Algorithm executives can control pipeline execution by providing + * a series of requests. this allows for the executive to act as a load + * balancer. the executive can for example partition requests across + * spatial data, time steps, or file names. in an MPI parallel + * setting the executive could coordinate this partitioning amongst + * the ranks. However, the only requirement of an algorithm executive + * is that it provide at least one non-empty request. + * + * The default implementation creates a single trivially non-empty + * request containing the key "__request_empty = 0". This will cause + * the pipeline to be executed once but will result in no data being + * requested. Therefore when the default implementation is used + * upstream algorithms must fill in the requests further to pull + * data as needed. + */ class teca_algorithm_executive : public std::enable_shared_from_this { diff --git a/core/teca_algorithm_executive_fwd.h b/core/teca_algorithm_executive_fwd.h deleted file mode 100644 index 599cab2b5..000000000 --- a/core/teca_algorithm_executive_fwd.h +++ /dev/null @@ -1,31 +0,0 @@ -#ifndef teca_algorithm_executive_fwd_h -#define teca_algorithm_executive_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_algorithm_executive) - -// this is a convenience macro to be used to declare a static -// New method that will be used to construct new objects in -// shared_ptr's. This manages the details of interoperability -// with std C++11 shared pointer -#define TECA_ALGORITHM_EXECUTIVE_STATIC_NEW(T) \ - \ -static p_##T New() \ -{ \ - return p_##T(new T); \ -} \ - \ -std::shared_ptr shared_from_this() \ -{ \ - return std::static_pointer_cast( \ - teca_algorithm_executive::shared_from_this()); \ -} \ - \ -std::shared_ptr shared_from_this() const \ -{ \ - return std::static_pointer_cast( \ - teca_algorithm_executive::shared_from_this()); \ -} - -#endif diff --git a/core/teca_algorithm_fwd.h b/core/teca_algorithm_fwd.h deleted file mode 100644 index ee0a58b21..000000000 --- a/core/teca_algorithm_fwd.h +++ /dev/null @@ -1,173 +0,0 @@ -#ifndef teca_algorithm_fwd_h -#define teca_algorithm_fwd_h - -#include "teca_shared_object.h" - -#include -#include - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_algorithm) - -// this is a convenience macro to be used to declare a static -// New method that will be used to construct new objects in -// shared_ptr's. 
This manages the details of interoperability -// with std C++11 shared pointer -#define TECA_ALGORITHM_STATIC_NEW(T) \ - \ -static p_##T New() \ -{ \ - return p_##T(new T); \ -} \ - \ -std::shared_ptr shared_from_this() \ -{ \ - return std::static_pointer_cast( \ - teca_algorithm::shared_from_this()); \ -} \ - \ -std::shared_ptr shared_from_this() const \ -{ \ - return std::static_pointer_cast( \ - teca_algorithm::shared_from_this()); \ -} - -#define TECA_ALGORITHM_CLASS_NAME(T) \ -const char *get_class_name() const override \ -{ \ - return #T; \ -} - -// this convenience macro removes copy and aassignment operators -// which generally should not be defined for reference counted types -#define TECA_ALGORITHM_DELETE_COPY_ASSIGN(T) \ - \ - T(const T &src) = delete; \ - T(T &&src) = delete; \ - \ - T &operator=(const T &src) = delete; \ - T &operator=(T &&src) = delete; - -// convenience macro to declare standard set_X/get_X methods -// where X is the name of a class member. will manage the -// algorithm's modified state for the user. -#define TECA_ALGORITHM_PROPERTY(T, NAME) \ - \ -void set_##NAME(const T &v) \ -{ \ - if (this->NAME != v) \ - { \ - this->NAME = v; \ - this->set_modified(); \ - } \ -} \ - \ -const T &get_##NAME() const \ -{ \ - return this->NAME; \ -} - -// convenience macro to declare standard set_X/get_X methods -// where X is the name of a class member. will manage the -// algorithm's modified state for the user. -#define TECA_ALGORITHM_VECTOR_PROPERTY(T, NAME) \ - \ -size_t get_number_of_##NAME##s () \ -{ \ - return this->NAME##s.size(); \ -} \ - \ -void append_##NAME(const T &v) \ -{ \ - this->NAME##s.push_back(v); \ - this->set_modified(); \ -} \ - \ -void set_##NAME(size_t i, const T &v) \ -{ \ - if (this->NAME##s[i] != v) \ - { \ - this->NAME##s[i] = v; \ - this->set_modified(); \ - } \ -} \ - \ -void set_##NAME##s(const std::vector &v) \ -{ \ - if (this->NAME##s != v) \ - { \ - this->NAME##s = v; \ - this->set_modified(); \ - } \ -} \ - \ -void set_##NAME##s(const std::initializer_list &&l) \ -{ \ - std::vector v(l); \ - if (this->NAME##s != v) \ - { \ - this->NAME##s = v; \ - this->set_modified(); \ - } \ -} \ - \ -void set_##NAME##s(const const_p_teca_variant_array &v) \ -{ \ - v->get(this->NAME##s); \ - this->set_modified(); \ -} \ - \ -const T &get_##NAME(size_t i) const \ -{ \ - return this->NAME##s[i]; \ -} \ - \ -void get_##NAME##s(std::vector &v) const \ -{ \ - v = this->NAME##s; \ -} \ - \ -void get_##NAME##s(const p_teca_variant_array &v) const \ -{ \ - v->set(this->NAME##s); \ -} \ - \ -void clear_##NAME##s() \ -{ \ - this->NAME##s.clear(); \ -} - - -// helper that allows us to use std::function -// as a TECA_ALGORITHM_PROPERTY -template -bool operator!=(const std::function &lhs, const std::function &rhs) -{ - return &rhs != &lhs; -} - -// TODO -- this is a work around for older versions -// of Apple clang -// Apple LLVM version 4.2 (clang-425.0.28) (based on LLVM 3.2svn) -// Target: x86_64-apple-darwin12.6.0 -#define TECA_ALGORITHM_CALLBACK_PROPERTY(T, NAME) \ - \ -void set_##NAME(const T &v) \ -{ \ - /*if (this->NAME != v)*/ \ - /*{*/ \ - this->NAME = v; \ - this->set_modified(); \ - /*}*/ \ -} \ - \ -const T &get_##NAME() const \ -{ \ - return this->NAME; \ -} \ - \ -T &get_##NAME() \ -{ \ - return this->NAME; \ -} - -#endif diff --git a/core/teca_algorithm_output_port.h b/core/teca_algorithm_output_port.h index 3e7921148..70cce15f1 100644 --- a/core/teca_algorithm_output_port.h +++ b/core/teca_algorithm_output_port.h @@ -1,15 +1,18 @@ #ifndef 
teca_algorithm_output_port_h #define teca_algorithm_output_port_h +/// @file + +/// An output port packages an algorithm and a port number using teca_algorithm_output_port = std::pair; -// convenience functions for accessing port and algorithm -// from an output port +/// get the algorithm from the output port inline p_teca_algorithm &get_algorithm(teca_algorithm_output_port &op) { return op.first; } +/// get port number from the output port inline unsigned int &get_port(teca_algorithm_output_port &op) { return op.second; } diff --git a/core/teca_bad_cast.h b/core/teca_bad_cast.h index bf4138c6e..9c8fcf889 100644 --- a/core/teca_bad_cast.h +++ b/core/teca_bad_cast.h @@ -4,6 +4,10 @@ #include #include +/** @brief + * An exception that maybe thrown when a conversion between two data types + * fails. + */ class teca_bad_cast : public std::exception { public: @@ -18,6 +22,9 @@ class teca_bad_cast : public std::exception std::string m_what; }; +/** returns the class name of the teca_algorithm or the string "nullptr" + * if the algorithm is a nullptr. + */ template const std::string safe_class_name(const class_t &o) { diff --git a/core/teca_binary_stream.h b/core/teca_binary_stream.h index dac237602..22225707b 100644 --- a/core/teca_binary_stream.h +++ b/core/teca_binary_stream.h @@ -11,7 +11,7 @@ #include -// Serialize objects into a binary stream. +/// Serialize objects into a binary stream. class teca_binary_stream { public: @@ -35,7 +35,7 @@ class teca_binary_stream // state. void clear() noexcept; - // Alolocate n_bytes for the stream. + // Allocate n_bytes for the stream. void resize(unsigned long n_bytes); // ensures space for n_bytes more to the stream. @@ -53,7 +53,7 @@ class teca_binary_stream unsigned long size() const noexcept { return m_write_p - m_data; } - // Get the sise of the internal buffer allocated + // Get the size of the internal buffer allocated // for the stream. unsigned long capacity() const noexcept { return m_size; } diff --git a/core/calcalcs.cxx b/core/teca_calcalcs.cxx similarity index 99% rename from core/calcalcs.cxx rename to core/teca_calcalcs.cxx index d76612055..1e93e8cad 100644 --- a/core/calcalcs.cxx +++ b/core/teca_calcalcs.cxx @@ -1,4 +1,7 @@ /* +A threadsafe port of the calcalcs library +Burlen Loring Thu Apr 22 06:22:16 PM PDT 2021 + The CalCalcs routines, a set of C-language routines to perform calendar calculations. @@ -35,9 +38,9 @@ along with this program. If not, see . #endif #include "udunits2.h" -#include "calcalcs.h" +#include "teca_calcalcs.h" -namespace calcalcs +namespace teca_calcalcs { static int c_isleap_gregorian ( int year, int *leap ); diff --git a/core/calcalcs.h b/core/teca_calcalcs.h similarity index 92% rename from core/calcalcs.h rename to core/teca_calcalcs.h index 48fa55cad..4c837fb7c 100644 --- a/core/calcalcs.h +++ b/core/teca_calcalcs.h @@ -1,4 +1,7 @@ /* +A threadsafe port of the calcalcs library +Burlen Loring Thu Apr 22 06:22:16 PM PDT 2021 + The CalCalcs routines, a set of C-language routines to perform calendar calculations. @@ -22,11 +25,17 @@ along with this program. If not, see . #ifndef calcalcs_h #define calcalcs_h +/// @file + #define CALCALCS_VERSION_NUMBER 1.0 -namespace calcalcs + +/// A threadsafe port of the calcalcs library. 
+namespace teca_calcalcs { +/// @cond + struct cccalendar { int sig; char *name; @@ -212,24 +221,22 @@ char *ccs_err_str(int ccs_errno); #define UT_ENOINIT -10 #define UT_EINVALID -11 -/*-------------------------------------------------------------------------- - * high level thread safe initialize the library and select a calendar +/// @endcond + +/** high level thread safe initialize the library and select a calendar * to use in subsequent calls. * return 0 upon success */ int set_current_calendar( const char *calendar, const char *units ); -/*-------------------------------------------------------------------------- - * is_leap_year: determine if the specified year is a leap year in - * the specified calendar. this wraps ccs_isleap such that initialization - * is automatically handled and optimizes for repeat calls. return 0 - * if successful. +/** Determine if the specified year is a leap year in the specified calendar. + * this wraps ccs_isleap such that initialization is automatically handled and + * optimizes for repeat calls. @returns 0 if successful. */ int is_leap_year( const char *calendar, const char *units, int year, int &leap ); -/*-------------------------------------------------------------------------- - * days_in_month: returns the days per month for the given year/month. +/** Returns the days per month for the given year/month. * Note that during the month that transitions from a Julian to a * Gregorian calendar, this might be a strange number of days. this * wraps ccs_dpm such that initialization is automatically handled and @@ -238,8 +245,7 @@ int is_leap_year( const char *calendar, const char *units, int days_in_month( const char *calendar, const char *units, int year, int month, int &dpm ); -/*-------------------------------------------------------------------------- - * date : given a floating point offset in the given calendar return +/** Given a floating point offset in the given calendar return * year, month, day, hour, minute, seconds. returns 0 upon success. */ int date( double val, int *year, int *month, int *day, int *hour, @@ -247,8 +253,7 @@ int date( double val, int *year, int *month, int *day, int *hour, const char *calendar_name ); -/*-------------------------------------------------------------------------- - * given a year, month, day, hour, minute, second and calendar find +/** given a year, month, day, hour, minute, second and calendar find * the floating point offset. returns 0 upon success. 
*/ int coordinate( int year, int month, int day, int hour, int minute, diff --git a/core/teca_calendar.cxx b/core/teca_calendar.cxx deleted file mode 100644 index 5d2cdd5de..000000000 --- a/core/teca_calendar.cxx +++ /dev/null @@ -1,43 +0,0 @@ -#include "teca_calendar.h" - -// -------------------------------------------------------------------------- -long gregorian_number(long y, long m, long d) -{ - m = (m + 9) % 12; - y = y - m/10; - return 365*y + y/4 - y/100 + y/400 + (m*306 + 5)/10 + (d - 1); -} - -// -------------------------------------------------------------------------- -void date_from_gregorian_number(long g, long &y, long &m, long &d) -{ - y = (10000*g + 14780)/3652425; - long ddd = g - (365*y + y/4 - y/100 + y/400); - if (ddd < 0) - { - y = y - 1; - ddd = g - (365*y + y/4 - y/100 + y/400); - } - - long mi = (100*ddd + 52)/3060; - - m = (mi + 2)%12 + 1; - y = y + (mi + 2)/12; - d = ddd - (mi*306 + 5)/10 + 1; -} - -// -------------------------------------------------------------------------- -bool valid_gregorian_date(long y, long m, long d) -{ - long g = gregorian_number(y,m,d); - if (g < 578027) // 578027 = gergorian_number(1582,10,1); - return false; - - long yy, mm, dd; - date_from_gregorian_number(g, yy, mm, dd); - - if ((y != yy) || (m != mm) || (d != dd)) - return false; - - return true; -} diff --git a/core/teca_calendar.h b/core/teca_calendar.h deleted file mode 100644 index 350eb42a7..000000000 --- a/core/teca_calendar.h +++ /dev/null @@ -1,30 +0,0 @@ -#ifndef teca_calendar_h -#define teca_calendar_h - -// functions for date computations in gregorian calendar. -// to use convert the origin to a gergorian_number do the -// calculation and convert the number back into a date useing -// date_from_gregorian_number. for details about the math and -// an explanation of the errors see -// http://alcor.concordia.ca/~gpkatch/gdate-algorithm.html -// y -- 4 digit year -// m -- 2 digit month -// d -- 2 digit day -// returns a date number for the given date that can be used -// in computations -long gregorian_number(long y, long m, long d); - -// input -// g -- date number computed from gregorian_number -// returns -// y -- 4 digit year -// m -- 2 digit month -// d -- 2 digit day -// in the values provided -void date_from_gregorian_number(long g, long &y, long &m, long &d); - -// return true if the date is valid in the gregorian -// calendar and our conversion algorithm. -bool valid_gregorian_date(long y, long m, long d); - -#endif diff --git a/core/teca_common.cxx b/core/teca_common.cxx index 52baaccef..b3c9f0dc2 100644 --- a/core/teca_common.cxx +++ b/core/teca_common.cxx @@ -1,5 +1,7 @@ #include "teca_common.h" +namespace std +{ // ************************************************************************** std::ostream &operator<<(std::ostream &os, const std::vector &vec) { @@ -12,6 +14,7 @@ std::ostream &operator<<(std::ostream &os, const std::vector &vec) } return os; } +} // ************************************************************************** int have_tty() diff --git a/core/teca_common.h b/core/teca_common.h index 61d06afcf..04e0c77cf 100644 --- a/core/teca_common.h +++ b/core/teca_common.h @@ -3,13 +3,18 @@ #include "teca_config.h" #include "teca_parallel_id.h" + #include #include #include #include #include -// send a vector to a stream +// the operator<< overloads have to be namespace std in order for +// boost to find them. 
they are needed for mutitoken program options +namespace std +{ +/// send a vector to a stream template std::ostream &operator<<(std::ostream &os, const std::vector &vec) { @@ -23,11 +28,26 @@ std::ostream &operator<<(std::ostream &os, const std::vector &vec) return os; } -// send a vector of strings to a stream +/// send a vector of strings to a stream std::ostream &operator<<(std::ostream &os, const std::vector &vec); +} + +#ifndef SWIG +/// send a fixed length c-array to the stream +template ::value,bool>::type> +std::ostream &operator<<(std::ostream &os, const num_t (& data)[len]) +{ + os << data[0]; + for (int i = 1; i < len; ++i) + os << ", " << data[i]; + return os; +} +#endif -// detect if we are writing to a tty, if not then -// we should not use ansi color codes +/** Return true if we are writing to a TTY. If we are not then we should not + * use ansi color codes. + */ int have_tty(); #define ANSI_RED "\033[1;31;40m" diff --git a/core/teca_dataset.h b/core/teca_dataset.h index 3f5b167a0..b8db4f646 100644 --- a/core/teca_dataset.h +++ b/core/teca_dataset.h @@ -1,21 +1,224 @@ #ifndef teca_dataset_h #define teca_dataset_h +#include "teca_common.h" +#include "teca_shared_object.h" #include "teca_variant_array.h" -#include "teca_dataset_fwd.h" + +#include #include + class teca_binary_stream; class teca_metadata; -/** -interface for teca datasets. -*/ +TECA_SHARED_OBJECT_FORWARD_DECL(teca_dataset) + +// this is a convenience macro to be used to +// declare New and enable seamless operation +// with std C++11 shared pointer +#define TECA_DATASET_STATIC_NEW(T) \ + \ +static p_##T New() \ +{ \ + return p_##T(new T); \ +} \ + \ +std::shared_ptr shared_from_this() \ +{ \ + return std::static_pointer_cast( \ + teca_dataset::shared_from_this()); \ +} \ + \ +std::shared_ptr shared_from_this() const \ +{ \ + return std::static_pointer_cast( \ + teca_dataset::shared_from_this()); \ +} + +// convenience macro implementing new_instance method +#define TECA_DATASET_NEW_INSTANCE() \ +virtual p_teca_dataset new_instance() const override\ +{ \ + return this->New(); \ +} + +// convenience macro implementing new_copy method +#define TECA_DATASET_NEW_COPY() \ +virtual p_teca_dataset new_copy() const override \ +{ \ + p_teca_dataset o = this->new_instance(); \ + o->copy(this->shared_from_this()); \ + return o; \ +} \ + \ +virtual p_teca_dataset new_shallow_copy() override \ +{ \ + p_teca_dataset o = this->new_instance(); \ + o->shallow_copy(this->shared_from_this()); \ + return o; \ +} + +// convenience macro for adding properties to dataset +// objects +#define TECA_DATASET_PROPERTY(T, name) \ + \ +void set_##name(const T &val) \ +{ \ + this->name = val; \ +} \ + \ +const T &get_##name() const \ +{ \ + return this->name; \ +} \ + \ +T &get_##name() \ +{ \ + return this->name; \ +} + +// convenience set get methods for dataset metadata +#define TECA_DATASET_METADATA(key, T, len) \ +TECA_DATASET_METADATA_V(T, key, len) \ +TECA_DATASET_METADATA_A(T, key, len) \ +TECA_DATASET_METADATA_ ## len (T, key) + + +#define TECA_DATASET_METADATA_1(T, key) \ +void set_##key(const T & val_1) \ +{ \ + this->get_metadata().set(#key, val_1); \ +} \ + \ +int get_##key(T &val_1) const \ +{ \ + return this->get_metadata().get( \ + #key, val_1); \ +} + +#define TECA_DATASET_METADATA_2(T, key) \ +void set_##key(const T & val_1, const T & val_2) \ +{ \ + this->get_metadata().set( \ + #key, {val_1, val_2}); \ +} \ + \ +int get_##key(T &val_1, T &val_2) const \ +{ \ + std::vector vals; \ + if (this->get_metadata().get(#key, vals)) 
\ + return -1; \ + val_1 = vals[0]; \ + val_2 = vals[1]; \ + return 0; \ +} + +#define TECA_DATASET_METADATA_3(T, key) \ +void set_##key(const T & val_1, const T & val_2, \ + const T & val_3) \ +{ \ + this->get_metadata().set(#key, \ + {val_1, val_2, val_3}); \ +} \ + \ +int get_##key(T &val_1, T &val_2, T &val_3) const \ +{ \ + std::vector vals; \ + if (this->get_metadata().get(#key, vals)) \ + return -1; \ + val_1 = vals[0]; \ + val_2 = vals[1]; \ + val_3 = vals[2]; \ + return 0; \ +} + +#define TECA_DATASET_METADATA_4(T, key) \ +void set_##key(const T & val_1, const T & val_2, \ + const T & val_3, const T & val_4) \ +{ \ + this->get_metadata().set(#key, \ + {val_1, val_2, val_3, val_4}); \ +} + +#define TECA_DATASET_METADATA_6(T, key) \ +void set_##key(const T & val_1, const T & val_2, \ + const T & val_3, const T & val_4, \ + const T & val_5, const T & val_6) \ +{ \ + this->get_metadata().set(#key, \ + {val_1, val_2, val_3, \ + val_4, val_5, val_6}); \ +} + +#define TECA_DATASET_METADATA_8(T, key) \ +void set_##key(const T & val_1, const T & val_2, \ + const T & val_3, const T & val_4, \ + const T & val_5, const T & val_6, \ + const T & val_7, const T & val_8) \ +{ \ + this->get_metadata().set(#key, \ + {val_1, val_2, val_3, val_4, val_5, \ + val_6, val_7, val_8}); \ +} + +#define TECA_DATASET_METADATA_V(T, key, len) \ +void set_##key(const std::vector &vals) \ +{ \ + if (vals.size() != len) \ + { \ + TECA_ERROR(#key " requires " #len " values") \ + } \ + this->get_metadata().set(#key, vals); \ +} \ + \ +int get_##key(std::vector &vals) const \ +{ \ + return this->get_metadata().get(#key, vals); \ +} \ + \ +void set_##key(const p_teca_variant_array &vals) \ +{ \ + if (vals->size() != len) \ + { \ + TECA_ERROR(#key " requires " #len " values") \ + } \ + this->get_metadata().set(#key, vals); \ +} \ + \ +int get_##key(p_teca_variant_array vals) const \ +{ \ + return this->get_metadata().get(#key, vals); \ +} \ + \ +void set_##key(const std::initializer_list &l) \ +{ \ + std::vector vals(l); \ + if (vals.size() != len) \ + { \ + TECA_ERROR(#key " requires " #len " values") \ + } \ + this->get_metadata().set(#key, vals); \ +} \ + +#define TECA_DATASET_METADATA_A(T, key, len) \ +void set_##key(const T *vals) \ +{ \ + this->get_metadata().set(#key, vals, len); \ +} \ + \ +int get_##key(T *vals) const \ +{ \ + return this->get_metadata().get( \ + #key, vals, len); \ +} + +/// Interface for TECA datasets. class teca_dataset : public std::enable_shared_from_this { public: virtual ~teca_dataset(); - // the name of the key that holds the index identifing this dataset + // the name of the key that holds the index identifying this dataset // this should be set by the algorithm that creates the dataset. TECA_DATASET_METADATA(index_request_key, std::string, 1) @@ -26,7 +229,7 @@ class teca_dataset : public std::enable_shared_from_this virtual int set_request_index(const std::string &key, long val); virtual int set_request_index(long val); - // covert to bool. true if the dataset is not empty. + // covert to boolean. true if the dataset is not empty. // otherwise false. 
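// [Editorial note] A sketch of what the TECA_DATASET_METADATA convenience
// macro defined above generates. For example the declaration
// TECA_DATASET_METADATA(index_request_key, std::string, 1) expands, via
// TECA_DATASET_METADATA_1, to member functions equivalent to:
//
//     void set_index_request_key(const std::string &val_1)
//     { this->get_metadata().set("index_request_key", val_1); }
//
//     int get_index_request_key(std::string &val_1) const
//     { return this->get_metadata().get("index_request_key", val_1); }
//
// plus the vector, pointer, and initializer_list overloads produced by
// TECA_DATASET_METADATA_V and TECA_DATASET_METADATA_A.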
explicit operator bool() const noexcept { return !this->empty(); } diff --git a/core/teca_dataset_capture.h b/core/teca_dataset_capture.h index 04015cd26..52e8007c0 100644 --- a/core/teca_dataset_capture.h +++ b/core/teca_dataset_capture.h @@ -3,17 +3,19 @@ #include "teca_algorithm.h" #include "teca_metadata.h" -#include "teca_dataset_fwd.h" +#include "teca_dataset.h" #include "teca_shared_object.h" TECA_SHARED_OBJECT_FORWARD_DECL(teca_dataset_capture) -/** -An algorithm that takes a reference to dataset produced -by the upstream algorithm it is connected to. The dataset -is passed through so that this can be inserted anywhere -giving one access to the intermediate data. -*/ +/** @brief + * An algorithm that takes a reference to dataset produced + * by the upstream algorithm it is connected to. + * + * @details + * The dataset is passed through so that this can be inserted + * anywhere giving one access to the intermediate data. + */ class teca_dataset_capture : public teca_algorithm { public: diff --git a/core/teca_dataset_fwd.h b/core/teca_dataset_fwd.h deleted file mode 100644 index 46fd125d9..000000000 --- a/core/teca_dataset_fwd.h +++ /dev/null @@ -1,210 +0,0 @@ -#ifndef teca_dataset_fwd_h -#define teca_dataset_fwd_h - -#include "teca_common.h" -#include "teca_shared_object.h" - -#include - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_dataset) - -// this is a convenience macro to be used to -// declare New and enable seamless operation -// with std C++11 shared pointer -#define TECA_DATASET_STATIC_NEW(T) \ - \ -static p_##T New() \ -{ \ - return p_##T(new T); \ -} \ - \ -std::shared_ptr shared_from_this() \ -{ \ - return std::static_pointer_cast( \ - teca_dataset::shared_from_this()); \ -} \ - \ -std::shared_ptr shared_from_this() const \ -{ \ - return std::static_pointer_cast( \ - teca_dataset::shared_from_this()); \ -} - -// convenience macro implementing new_instance method -#define TECA_DATASET_NEW_INSTANCE() \ -virtual p_teca_dataset new_instance() const override\ -{ \ - return this->New(); \ -} - -// convenience macro implementing new_copy method -#define TECA_DATASET_NEW_COPY() \ -virtual p_teca_dataset new_copy() const override \ -{ \ - p_teca_dataset o = this->new_instance(); \ - o->copy(this->shared_from_this()); \ - return o; \ -} \ - \ -virtual p_teca_dataset new_shallow_copy() override \ -{ \ - p_teca_dataset o = this->new_instance(); \ - o->shallow_copy(this->shared_from_this()); \ - return o; \ -} - -// convenience macro for adding properties to dataset -// objects -#define TECA_DATASET_PROPERTY(T, name) \ - \ -void set_##name(const T &val) \ -{ \ - this->name = val; \ -} \ - \ -const T &get_##name() const \ -{ \ - return this->name; \ -} \ - \ -T &get_##name() \ -{ \ - return this->name; \ -} - -// convenience set get methods for dataset metadata -#define TECA_DATASET_METADATA(key, T, len) \ -TECA_DATASET_METADATA_V(T, key, len) \ -TECA_DATASET_METADATA_A(T, key, len) \ -TECA_DATASET_METADATA_ ## len (T, key) - - -#define TECA_DATASET_METADATA_1(T, key) \ -void set_##key(const T & val_1) \ -{ \ - this->get_metadata().set(#key, val_1); \ -} \ - \ -int get_##key(T &val_1) const \ -{ \ - return this->get_metadata().get( \ - #key, val_1); \ -} - -#define TECA_DATASET_METADATA_2(T, key) \ -void set_##key(const T & val_1, const T & val_2) \ -{ \ - this->get_metadata().set( \ - #key, {val_1, val_2}); \ -} \ - \ -int get_##key(T &val_1, T &val_2) const \ -{ \ - std::vector vals; \ - if (this->get_metadata().get(#key, vals)) \ - return -1; \ - val_1 = vals[0]; \ - val_2 = vals[1]; \ - 
return 0; \ -} - -#define TECA_DATASET_METADATA_3(T, key) \ -void set_##key(const T & val_1, const T & val_2, \ - const T & val_3) \ -{ \ - this->get_metadata().set(#key, \ - {val_1, val_2, val_3}); \ -} \ - \ -int get_##key(T &val_1, T &val_2, T &val_3) const \ -{ \ - std::vector vals; \ - if (this->get_metadata().get(#key, vals)) \ - return -1; \ - val_1 = vals[0]; \ - val_2 = vals[1]; \ - val_3 = vals[2]; \ - return 0; \ -} - -#define TECA_DATASET_METADATA_4(T, key) \ -void set_##key(const T & val_1, const T & val_2, \ - const T & val_3, const T & val_4) \ -{ \ - this->get_metadata().set(#key, \ - {val_1, val_2, val_3, val_4}); \ -} - -#define TECA_DATASET_METADATA_6(T, key) \ -void set_##key(const T & val_1, const T & val_2, \ - const T & val_3, const T & val_4, \ - const T & val_5, const T & val_6) \ -{ \ - this->get_metadata().set(#key, \ - {val_1, val_2, val_3, \ - val_4, val_5, val_6}); \ -} - -#define TECA_DATASET_METADATA_8(T, key) \ -void set_##key(const T & val_1, const T & val_2, \ - const T & val_3, const T & val_4, \ - const T & val_5, const T & val_6, \ - const T & val_7, const T & val_8) \ -{ \ - this->get_metadata().set(#key, \ - {val_1, val_2, val_3, val_4, val_5, \ - val_6, val_7, val_8}); \ -} - -#define TECA_DATASET_METADATA_V(T, key, len) \ -void set_##key(const std::vector &vals) \ -{ \ - if (vals.size() != len) \ - { \ - TECA_ERROR(#key " requires " #len " values") \ - } \ - this->get_metadata().set(#key, vals); \ -} \ - \ -int get_##key(std::vector &vals) const \ -{ \ - return this->get_metadata().get(#key, vals); \ -} \ - \ -void set_##key(const p_teca_variant_array &vals) \ -{ \ - if (vals->size() != len) \ - { \ - TECA_ERROR(#key " requires " #len " values") \ - } \ - this->get_metadata().set(#key, vals); \ -} \ - \ -int get_##key(p_teca_variant_array vals) const \ -{ \ - return this->get_metadata().get(#key, vals); \ -} \ - \ -void set_##key(const std::initializer_list &l) \ -{ \ - std::vector vals(l); \ - if (vals.size() != len) \ - { \ - TECA_ERROR(#key " requires " #len " values") \ - } \ - this->get_metadata().set(#key, vals); \ -} \ - -#define TECA_DATASET_METADATA_A(T, key, len) \ -void set_##key(const T *vals) \ -{ \ - this->get_metadata().set(#key, vals, len); \ -} \ - \ -int get_##key(T *vals) const \ -{ \ - return this->get_metadata().get( \ - #key, vals, len); \ -} - -#endif diff --git a/core/teca_dataset_source.h b/core/teca_dataset_source.h index 7269633f9..b7f96cf6d 100644 --- a/core/teca_dataset_source.h +++ b/core/teca_dataset_source.h @@ -3,18 +3,18 @@ #include "teca_algorithm.h" #include "teca_metadata.h" -#include "teca_dataset_fwd.h" +#include "teca_dataset.h" #include "teca_shared_object.h" #include TECA_SHARED_OBJECT_FORWARD_DECL(teca_dataset_source) +/// An algorithm that serves up user provided data and metadata. /** -An algorithm that serves up user provided data and metadata. -This algorithm can be used to inject a dataset constructed -on outside of TECA into a TECA pipleine. -*/ + * This algorithm can be used to inject a dataset constructed + * on outside of TECA into a TECA pipeline. 
+ */ class teca_dataset_source : public teca_algorithm { public: diff --git a/core/teca_index_executive.cxx b/core/teca_index_executive.cxx index d864cec5a..ec83dd3f1 100644 --- a/core/teca_index_executive.cxx +++ b/core/teca_index_executive.cxx @@ -166,6 +166,7 @@ int teca_index_executive::initialize(MPI_Comm comm, const teca_metadata &md) if ((index % this->stride) == 0) { this->requests.push_back(base_req); + this->requests.back().set("index_request_key", this->index_request_key); this->requests.back().set(this->index_request_key, index); } } diff --git a/core/teca_index_executive.h b/core/teca_index_executive.h index 7a8c8b290..8c70d9ece 100644 --- a/core/teca_index_executive.h +++ b/core/teca_index_executive.h @@ -10,27 +10,23 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_index_executive) -/// -/** -An executive that generates requests using a upstream -or user defined index. an extent and list of arrays -can be optionally set. - -meta data keys: - - requires: - - index_initializer_key -- holds the name of the key that tells how - many indices are available. the named key - must also be present and should conatin the - number of indices available - - index_request_key -- holds the name of the key used to request - a specific index. request are generated with this - name set to a specific index to be processed some - upstream algorithm is expected to produce the data - associated with the given index - +/// An executive that generates requests using a upstream or user defined index. +/** An extent or bounds to subset by, and list of arrays can be optionally set. + * + * metadata keys: + * + * requires: + * + * index_initializer_key -- holds the name of the key that tells how + * many indices are available. the named key + * must also be present and should contain the + * number of indices available + * + * index_request_key -- holds the name of the key used to request + * a specific index. request are generated with this + * name set to a specific index to be processed some + * upstream algorithm is expected to produce the + * data associated with the given index */ class teca_index_executive : public teca_algorithm_executive { @@ -40,33 +36,33 @@ class teca_index_executive : public teca_algorithm_executive int initialize(MPI_Comm comm, const teca_metadata &md) override; teca_metadata get_next_request() override; - // set the index to process + /// set the index to process void set_index(long s); - // set the first time step in the series to process. - // default is 0. + // Set the first time step in the series to process. The default is 0. void set_start_index(long s); - // set the last time step in the series to process. - // default is -1. negative number results in the last - // available time step being used. + /** Set the last time step in the series to process. default is -1. + * negative number results in the last available time step being used. + */ void set_end_index(long s); - // set the stride to process time steps at. default - // is 1 + /// Set the stride to process time steps at. The default is 1 void set_stride(long s); - // set the extent to process. the default is the - // whole_extent. + /// Set the extent to process. The default is taken from whole_extent key. void set_extent(unsigned long *ext); + + /// @copydoc set_extent void set_extent(const std::vector &ext); - // set the bounds to process. If nothging is set then - // extent as provided by set_extent is used. + /** Set the bounds to process. If nothing is set then extent as provided by + * set_extent is used. 
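 *
 * [Editorial sketch] Typical configuration of this executive using the setters
 * declared in this class. The ::New() factory is assumed from TECA's usual
 * shared object pattern and the array name is illustrative:
 *
 *     p_teca_index_executive exec = teca_index_executive::New();
 *     exec->set_start_index(0);
 *     exec->set_end_index(-1);   // negative : process through the last index
 *     exec->set_stride(1);
 *     exec->set_arrays({"prw"});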
+ */ void set_bounds(double *bounds); void set_bounds(const std::vector &bounds); - // set the list of arrays to process + /// Set the list of arrays to process void set_arrays(const std::vector &arrays); protected: diff --git a/core/teca_index_reduce.cxx b/core/teca_index_reduce.cxx index 741ec2c11..de17ad266 100644 --- a/core/teca_index_reduce.cxx +++ b/core/teca_index_reduce.cxx @@ -138,9 +138,9 @@ void teca_index_reduce::get_properties_description(const std::string &prefix, + (prefix.empty()?"teca_index_reduce":prefix)); opts.add_options() - TECA_POPTS_GET(long, prefix, start_index, "first index to process (0)") + TECA_POPTS_GET(long, prefix, start_index, "first index to process") TECA_POPTS_GET(long, prefix, end_index, "last index to process. " - "If set to -1 all indices are processed. (-1)") + "If set to -1 all indices are processed.") ; global_opts.add(opts); diff --git a/core/teca_index_reduce.h b/core/teca_index_reduce.h index 818cb282c..85dae1786 100644 --- a/core/teca_index_reduce.h +++ b/core/teca_index_reduce.h @@ -1,38 +1,40 @@ #ifndef teca_index_reduce_h #define teca_index_reduce_h -#include "teca_dataset_fwd.h" -#include "teca_index_reduce_fwd.h" - -#include "teca_threaded_algorithm.h" +#include "teca_dataset.h" #include "teca_metadata.h" +#include "teca_shared_object.h" +#include "teca_threaded_algorithm.h" #include -// base class for MPI + threads map reduce reduction over an index. the available -// indices are partitioned across MPI ranks and threads. one can restrict -// operation to a range of time steps by setting first and last indeces to -// process. -// -// meta data keys: -// -// requires: -// -// index_initializer_key -- holds the name of the key that tells how -// many indices are available. the named key -// must also be present and should conatin the -// number of indices available -// -// index_request_key -- holds the name of the key used to request -// a specific index. request are generated with this -// name set to a specific index to be processed some -// upstream algorithm is expected to produce the data -// associated with the given index -// -// consumes: -// -// the key named by index_request_key -// +TECA_SHARED_OBJECT_FORWARD_DECL(teca_index_reduce) + +/// Base class for MPI + threads map reduce reduction over an index. +/** + * The available indices are partitioned across MPI ranks and threads. One can + * restrict operation to a range of time steps by setting first and last + * indices to process. + * + * metadata keys: + * + * requires: + * + * index_initializer_key -- holds the name of the key that tells how + * many indices are available. the named key + * must also be present and should contain the + * number of indices available + * + * index_request_key -- holds the name of the key used to request + * a specific index. 
request are generated with this + * name set to a specific index to be processed some + * upstream algorithm is expected to produce the + * data associated with the given index + * + * consumes: + * + * The key named by index_request_key + */ class teca_index_reduce : public teca_threaded_algorithm { public: diff --git a/core/teca_index_reduce_fwd.h b/core/teca_index_reduce_fwd.h deleted file mode 100644 index 6f977040a..000000000 --- a/core/teca_index_reduce_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_index_reduce_fwd_h -#define teca_index_reduce_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_index_reduce) - -#endif diff --git a/core/teca_memory_profiler.h b/core/teca_memory_profiler.h index 911f0eea3..4fe4c3ebc 100644 --- a/core/teca_memory_profiler.h +++ b/core/teca_memory_profiler.h @@ -6,14 +6,14 @@ extern "C" void *profile(void *argp); -// MemoryProfiler - A sampling memory use profiler +/// MemoryProfiler - A sampling memory use profiler. /** -The class samples process memory usage at the specified interval -given in seconds. For each sample the time is aquired. Calling -Initialize starts profiling, and Finalize ends it. During -Finaliziation the buffers are written using MPI-I/O to the -file name provided -*/ + * The class samples process memory usage at the specified interval + * given in seconds. For each sample the time is acquired. Calling + * Initialize starts profiling, and Finalize ends it. During + * Finalization the buffers are written using MPI-I/O to the + * file name provided. + */ class teca_memory_profiler { public: @@ -27,12 +27,12 @@ class teca_memory_profiler int initialize(); int finalize(); - // Set the interval in seconds between querrying + // Set the interval in seconds between querying // the processes memory use. void set_interval(double interval); double get_interval() const; - // Set the comunicator for parallel I/O + // Set the communicator for parallel I/O void set_communicator(MPI_Comm comm); // Set the file name to write the data to diff --git a/core/teca_metadata.h b/core/teca_metadata.h index 2168aae12..4272af62a 100644 --- a/core/teca_metadata.h +++ b/core/teca_metadata.h @@ -9,10 +9,12 @@ #include #include "teca_variant_array.h" -// a generic container for meta data in the form -// of name=value pairs. value arrays are supported. -// see meta data producer-consumer documentation for -// information about what names are valid. +/// A generic container for meta data in the form of name=value pairs. +/** + * Value arrays are supported. See metadata + * producer-consumer documentation for + * information about what names are valid. + */ class teca_metadata { public: @@ -129,6 +131,10 @@ class teca_metadata int get(const std::string &name, T *val, unsigned int n) const; + template + int get(const std::string &name, T (&val)[N]) const + { return this->get(name, val, N); } + // copy prop values from the named prop into the passed in vector. 
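// [Editorial note] The fixed length array overload added above lets the length
// be deduced from the argument. For example, given a teca_metadata instance md
// (the key name is illustrative):
//
//     unsigned long extent[6];
//     if (md.get("whole_extent", extent))
//     {
//         // handle the error
//     }
//
// which forwards to md.get("whole_extent", extent, 6).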
// return 0 if successful template @@ -177,7 +183,7 @@ class teca_metadata int to_stream(teca_binary_stream &s) const; int from_stream(teca_binary_stream &s); - // serialize to/from ascii + // serialize to/from ASCII int to_stream(std::ostream &os) const; int from_stream(std::ostream &) { return -1; } diff --git a/core/teca_metadata_util.cxx b/core/teca_metadata_util.cxx index 8ac1498ef..9c27bda5a 100644 --- a/core/teca_metadata_util.cxx +++ b/core/teca_metadata_util.cxx @@ -1,33 +1,37 @@ #include "teca_metadata_util.h" +#include "teca_metadata.h" +#include "teca_common.h" + namespace teca_metadata_util { -// remove post-fix from the arrays in get_upstream_request if -// the post-fix is set. For example if post-fix is set to "_filtered" -// then we remove all the variables in the "arrays" set that end with -// this post-fix, and replace it with the actual requested array. -void remove_post_fix(std::set &arrays, std::string post_fix) + +// ************************************************************************** +int get_array_extent(const teca_metadata &array_attributes, + const unsigned long mesh_extent[6], unsigned long array_extent[6]) { - size_t postfix_len = post_fix.length(); + for (int i = 0; i < 6; ++i) + array_extent[i] = mesh_extent[i]; - std::set::iterator arrays_it; - for (arrays_it=arrays.begin(); arrays_it!=arrays.end(); ++arrays_it) + unsigned long dim_active[4] = {0ul}; + if (array_attributes.get("mesh_dim_active", dim_active, 4)) { - std::string array_var = *arrays_it; - size_t array_var_len = array_var.length(); - - if (array_var_len > postfix_len) - { - size_t postfix_pos = array_var.find(post_fix, - array_var_len - postfix_len); - if (postfix_pos != std::string::npos) - { - array_var.erase(array_var_len - postfix_len, postfix_len); - - arrays.erase(arrays_it); - arrays.insert(array_var); - } - } + //TECA_ERROR("metadata issue. The array attributes collection is" + // " missing the mesh_dim_active key") + return -1; } + + // make the extent 1 in any direction that this array is undefined in + if (!dim_active[0]) + array_extent[1] = array_extent[0] = 0; + + if (!dim_active[1]) + array_extent[3] = array_extent[2] = 0; + + if (!dim_active[2]) + array_extent[5] = array_extent[4] = 0; + + return 0; } -}; \ No newline at end of file + +}; diff --git a/core/teca_metadata_util.h b/core/teca_metadata_util.h index 14213c971..ab3a61159 100644 --- a/core/teca_metadata_util.h +++ b/core/teca_metadata_util.h @@ -1,15 +1,21 @@ #ifndef teca_metadata_util_h #define teca_metadata_util_h -#include -#include +/// @file +class teca_metadata; + +/// Codes for dealing with teca_metadata namespace teca_metadata_util { -// given a set of names, where names end with a common string, here called -// a post-fix, modifies the set of names by removing the post fix from each -// name. -void remove_post_fix(std::set &names, std::string post_fix); - +/** Given a collection of array attributes (following the conventions used by + * the teca_cf_reader) and a mesh extent, compute and return the valid extent + * of the array. This takes into account 1d and 2d arrays on a 3d mesh. Return + * zero if successful. The mesh_dims_active key is required, if not found 1 + * is returned and the array_extent is set to the mesh_extent. 
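 *
 * [Editorial sketch] For example, for the attributes of a 2D x-y variable on a
 * 3D mesh (atts holds the array's attributes, values are illustrative):
 *
 *     unsigned long mesh_extent[6] = {0, 359, 0, 179, 0, 31};
 *     unsigned long array_extent[6];
 *     if (teca_metadata_util::get_array_extent(atts, mesh_extent, array_extent))
 *     {
 *         // mesh_dim_active was not present, array_extent equals mesh_extent
 *     }
 *     // for a 2D x-y array the vertical extent comes back as 0, 0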
+ */ +int get_array_extent(const teca_metadata &array_attributes, + const unsigned long mesh_extent[6], unsigned long array_extent[6]); }; + #endif diff --git a/core/teca_mpi_util.cxx b/core/teca_mpi_util.cxx index 8e9673dfd..df67b6ab1 100644 --- a/core/teca_mpi_util.cxx +++ b/core/teca_mpi_util.cxx @@ -22,7 +22,7 @@ int equipartition_communicator(MPI_Comm comm, if (n_ranks < new_comm_size) { - // can't increase beyond the original sizew + // can't increase beyond the original size return 0; } @@ -51,4 +51,56 @@ int equipartition_communicator(MPI_Comm comm, #endif return 0; } + +// ************************************************************************** +int split_communicator(MPI_Comm world_comm, + int group_size, MPI_Comm *group_comm) +{ +#if defined(TECA_HAS_MPI) + int is_init = 0; + MPI_Initialized(&is_init); + if (is_init) + { + int world_rank = 0; + int world_size = 1; + + MPI_Comm_rank(world_comm, &world_rank); + MPI_Comm_size(world_comm, &world_size); + + MPI_Group world_group = MPI_GROUP_EMPTY; + MPI_Comm_group(world_comm, &world_group); + + int group_id = world_rank / group_size; + int group_start = group_id * group_size; + int group_end = std::min(world_size, group_start + group_size); + int group_range[3] = {group_start, group_end, 1}; + + MPI_Group sub_group = MPI_GROUP_EMPTY; + MPI_Group_range_incl(world_group, 1, &group_range, &sub_group); + + MPI_Comm_create(world_comm, sub_group, group_comm); + + MPI_Group_free(&world_group); + MPI_Group_free(&sub_group); + } +#endif + return 0; +} + +// ************************************************************************** +int mpi_rank_0(MPI_Comm comm) +{ + int rank = 0; +#if defined(TECA_HAS_MPI) + int is_init = 0; + MPI_Initialized(&is_init); + if (is_init) + { + MPI_Comm_rank(comm, &rank); + } +#endif + if (rank == 0) + return 1; + return 0; +} } diff --git a/core/teca_mpi_util.h b/core/teca_mpi_util.h index 2b22c5b89..ccaa717c5 100644 --- a/core/teca_mpi_util.h +++ b/core/teca_mpi_util.h @@ -1,16 +1,28 @@ #ifndef teca_mpi_util_h #define teca_mpi_util_h +/// @file + #include "teca_mpi.h" +/// Codes dealing with MPI namespace teca_mpi_util { -// subset the the communicator comm into a new communicator with -// new_comm_size ranks. ranks are selected from comm with a uniform -// stride spreading them approximatelyt equally across nodes. +/** Subset the the communicator comm into a new communicator with new_comm_size + * ranks. ranks are selected from comm with a uniform stride spreading them + * approximatelyt equally across nodes. + */ int equipartition_communicator(MPI_Comm comm, int new_comm_size, MPI_Comm *new_comm); +/** Split the communicator into a number of new communicators such that each + * new communicator has group_size ranks. 
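 *
 * [Editorial sketch] e.g. grouping the ranks of MPI_COMM_WORLD into
 * communicators of 4 ranks each:
 *
 *     MPI_Comm group_comm = MPI_COMM_NULL;
 *     teca_mpi_util::split_communicator(MPI_COMM_WORLD, 4, &group_comm);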
+ */ +int split_communicator(MPI_Comm comm, + int group_size, MPI_Comm *new_comm); + +/// return non-zero if this process is MPI rank 0 +int mpi_rank_0(MPI_Comm comm); }; #endif diff --git a/core/teca_output_port.h b/core/teca_output_port.h deleted file mode 100644 index 6afca8ffb..000000000 --- a/core/teca_output_port.h +++ /dev/null @@ -1,12 +0,0 @@ -#ifndef teca_output_port_h -#define teca_output_port_h - -class teca_output_port -{ -public: - teca_output_port(int port_id, - -private: -} - -#endif diff --git a/core/teca_parallel_id.h b/core/teca_parallel_id.h index 05e70549a..cbaab317d 100644 --- a/core/teca_parallel_id.h +++ b/core/teca_parallel_id.h @@ -1,13 +1,15 @@ #ifndef teca_parallel_id_h #define teca_parallel_id_h +/// @file + #include -// a helper class for debug and error messages +/// A helper class for debug and error messages. class teca_parallel_id {}; -// print the callers rank and thread id to the given stream. this is a +// Prints the callers rank and thread id to the given stream. This is a // debug/diagnostic message and hence rank will always be reported relative to // the WORLD communicator. std::ostream &operator<<( diff --git a/core/teca_profiler.h b/core/teca_profiler.h index 670b960a8..b491e87b4 100644 --- a/core/teca_profiler.h +++ b/core/teca_profiler.h @@ -9,9 +9,11 @@ #include -// A class containing methods managing memory and time profiling -// Each timed event logs rank, event name, start and end time, and -// duration. +/// A class containing methods managing memory and time profiling. +/** + * Each timed event logs rank, event name, start and end time, and + * duration. + */ class teca_profiler { public: @@ -37,7 +39,7 @@ class teca_profiler static int finalize(); // this can occur after MPI_Finalize. It should only be called by rank 0. - // Any remaining events will be appeneded to the log file. This is necessary + // Any remaining events will be appended to the log file. This is necessary // to time MPI_Initialize/Finalize and log associated I/O. static int flush(); @@ -47,26 +49,26 @@ class teca_profiler static void set_communicator(MPI_Comm comm); // Sets the path to write the timer log to - // overriden by PROFILER_LOG_FILE environment variable + // overridden by PROFILER_LOG_FILE environment variable // default value; Timer.csv static void set_timer_log_file(const std::string &file_name); // Sets the path to write the timer log to - // overriden by MEMPROF_LOG_FILE environment variable + // overridden by MEMPROF_LOG_FILE environment variable // default value: MemProfLog.csv static void set_mem_prof_log_file(const std::string &file_name); // Sets the number of seconds in between memory use recordings - // overriden by MEMPROF_INTERVAL environment variable. + // overridden by MEMPROF_INTERVAL environment variable. static void set_mem_prof_interval(int interval); - // Enable/Disable logging. Overriden by PROFILER_ENABLE environment + // Enable/Disable logging. Overridden by PROFILER_ENABLE environment // variable. In the default format a CSV file is generated capturing each // ranks timer events. default value: disabled static void enable(int arg = 0x03); static void disable(); - // return true if loggin is enabled. + // return true if logging is enabled. static bool enabled(); // @brief Log start of an event. @@ -99,10 +101,12 @@ class teca_profiler static int to_stream(std::ostream &os); }; -// teca_time_event -- A helper class that times it's life. -// A timer event is created that starts at the object's construction and ends -// at its destruction. 
The pointer to the event name must be valid throughout -// the objects life. +/// A helper class that times it's life. +/** + * A timer event is created that starts at the object's construction and ends + * at its destruction. The pointer to the event name must be valid throughout + * the objects life. + */ template class teca_time_event { diff --git a/core/teca_program_options.h b/core/teca_program_options.h index be4340fe2..83a9f1771 100644 --- a/core/teca_program_options.h +++ b/core/teca_program_options.h @@ -1,7 +1,11 @@ #ifndef teca_program_options_h #define teca_program_options_h +/// @file + #include "teca_config.h" +#include "teca_common.h" +#include "teca_mpi_util.h" #if defined(TECA_HAS_BOOST) && !defined(SWIG) namespace boost @@ -13,25 +17,21 @@ namespace boost } }; -using options_description - = boost::program_options::options_description; - -using variables_map - = boost::program_options::variables_map; +using options_description = boost::program_options::options_description; +using variables_map = boost::program_options::variables_map; -// initialize the given options description -// with algorithm's properties -#define TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() \ - void get_properties_description( \ - const std::string &prefix, \ - options_description &opts) override; \ +/// initialize the given options description with algorithm's properties +#define TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() \ + \ + /** Adds the class algorithm properties to the description object */ \ + void get_properties_description(const std::string &prefix, \ + boost::program_options::options_description &opts) override; \ -// initialize the algorithm from the given options -// variable map. -#define TECA_SET_ALGORITHM_PROPERTIES() \ - void set_properties( \ - const std::string &prefix, \ - variables_map &opts) override; \ +/// initialize the algorithm from the given options variable map. +#define TECA_SET_ALGORITHM_PROPERTIES() \ + /** Sets the class algorithm properties from the map object */ \ + void set_properties(const std::string &prefix, \ + boost::program_options::variables_map &opts) override; \ // helpers for implementation dealing with Boost // program options. NOTE: because the above declarations @@ -40,21 +40,30 @@ using variables_map // . These need to be // included in your cxx files. 
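// [Editorial note] A sketch of typical use of these helpers, based on the
// TECA_POPTS_GET calls visible in teca_index_reduce.cxx elsewhere in this
// patch. In get_properties_description:
//
//     opts.add_options()
//         TECA_POPTS_GET(long, prefix, start_index, "first index to process")
//         TECA_POPTS_GET(long, prefix, end_index, "last index to process. "
//             "If set to -1 all indices are processed.")
//         ;
//     global_opts.add(opts);
//
// and in the matching set_properties:
//
//     TECA_POPTS_SET(opts, long, prefix, start_index)
//     TECA_POPTS_SET(opts, long, prefix, end_index)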
// -#define TECA_POPTS_GET(_type, _prefix, _name, _desc) \ - (((_prefix.empty()?"":_prefix+"::") + #_name).c_str(), \ - boost::program_options::value<_type>(), "\n" _desc "\n") - -#define TECA_POPTS_MULTI_GET(_type, _prefix, _name, _desc) \ +#define TECA_POPTS_GET(_type, _prefix, _name, _desc) \ (((_prefix.empty()?"":_prefix+"::") + #_name).c_str(), \ - boost::program_options::value<_type>()->multitoken(), \ + boost::program_options::value<_type>()->default_value \ + (this->get_ ## _name()), "\n" _desc "\n") + +#define TECA_POPTS_MULTI_GET(_type, _prefix, _name, _desc) \ + (((_prefix.empty()?"":_prefix+"::") + #_name).c_str(), \ + boost::program_options::value<_type>()->multitoken \ + ()->default_value(this->get_ ## _name()), \ "\n" _desc "\n") -#define TECA_POPTS_SET(_opts, _type, _prefix, _name) \ - {std::string opt_name = \ - (_prefix.empty()?"":_prefix+"::") + #_name; \ - if (_opts.count(opt_name)) \ - { \ - this->set_##_name(_opts[opt_name].as<_type>()); \ +#define TECA_POPTS_SET(_opts, _type, _prefix, _name) \ + {std::string opt_name = \ + (_prefix.empty()?"":_prefix+"::") + #_name; \ + bool defd = _opts[opt_name].defaulted(); \ + if (!defd) \ + { \ + _type val = _opts[opt_name].as<_type>(); \ + if (this->verbose && \ + teca_mpi_util::mpi_rank_0(this->get_communicator())) \ + { \ + TECA_STATUS("Setting " << opt_name << " = " << val) \ + } \ + this->set_##_name(val); \ }} #else diff --git a/core/teca_programmable_algorithm.h b/core/teca_programmable_algorithm.h index 43cb58dc9..bb4f0a449 100644 --- a/core/teca_programmable_algorithm.h +++ b/core/teca_programmable_algorithm.h @@ -2,57 +2,86 @@ #define teca_programmable_algorithm_h #include "teca_algorithm.h" +#include "teca_shared_object.h" #include "teca_metadata.h" -#include "teca_dataset_fwd.h" -#include "teca_programmable_algorithm_fwd.h" - -/// an algorithm implemented with user provided callbacks -/** -The user can provide a callback for each of the three phases -of pipeline execution. The number of input and output ports -can also be set for filters (1 or more inputs, 1 or more outputs) -sources, (no inputs, 1 or more outputs), or sinks (1 or more -inputs, no outputs). - -1) report phase. the report callback returns metadata - describing data that can be produced. The report callback - is optional. It's only needed if the algorithm will produce - new data or transform metadata. - - the report callback must be callable with signature: - teca_metadata(unsigned int) - -2) request phase. the request callback generates a vector - of requests(metadata objects) that inform the upstream of - what data to generate. The request callback is optional. - It's only needed if the algorithm needs data from the - upstream or transform metadata. - - the request callback must be callable with the signature: - std::vector( - unsigned int, - const std::vector &, - const teca_metadata &) - -3) execute phase. the execute callback is used to do useful - work on incoming or outgoing data. Examples include - generating new datasets, processing datasets, reading - and writing data to/from disk, and so on. The execute - callback is optional. 
- - the execute callback must be callable with the signature: - const_p_teca_dataset( +#include "teca_dataset.h" + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_programmable_algorithm) +TECA_SHARED_OBJECT_FORWARD_DECL(teca_threaded_programmable_algorithm) + +#ifdef SWIG +typedef void* report_callback_t; +typedef void* request_callback_t; +typedef void* execute_callback_t; +typedef void* threaded_execute_callback_t; +#else +/// A callable implementing the report phase of pipeline execution +using report_callback_t = std::function&)>; + +/// A callable implementing the request phase of pipeline execution +using request_callback_t = std::function( + unsigned int, const std::vector &, + const teca_metadata &)>; + +/// A callable implementing the execute phase of pipeline execution +using execute_callback_t = std::function &, - const teca_metadata &) + const teca_metadata &)>; -see also: +/// A callable implementing the streaming execute phase of pipeline execution +using threaded_execute_callback_t = std::function &, + const teca_metadata &, int)>; +#endif -set_number_of_input_connections -set_number_of_output_ports -set_report_callback -set_request_callback -set_execute_callback -*/ +/// An algorithm implemented with user provided callbacks. +/** + * The user can provide a callback for each of the three phases + * of pipeline execution. The number of input and output ports + * can also be set for filters (1 or more inputs, 1 or more outputs) + * sources, (no inputs, 1 or more outputs), or sinks (1 or more + * inputs, no outputs). + * + * 1) report phase. the report callback returns metadata + * describing data that can be produced. The report callback + * is optional. It's only needed if the algorithm will produce + * new data or transform metadata. + * + * the report callback must be callable with signature: + * teca_metadata(unsigned int) + * + * 2) request phase. the request callback generates a vector + * of requests(metadata objects) that inform the upstream of + * what data to generate. The request callback is optional. + * It's only needed if the algorithm needs data from the + * upstream or transform metadata. + * + * the request callback must be callable with the signature: + * std::vector( + * unsigned int, + * const std::vector &, + * const teca_metadata &) + * + * 3) execute phase. the execute callback is used to do useful + * work on incoming or outgoing data. Examples include + * generating new datasets, processing datasets, reading + * and writing data to/from disk, and so on. The execute + * callback is optional. 
+ * + * the execute callback must be callable with the signature: + * const_p_teca_dataset( + * unsigned int, const std::vector &, + * const teca_metadata &) + * + * see also: + * + * set_number_of_input_connections + * set_number_of_output_ports + * set_report_callback + * set_request_callback + * set_execute_callback + */ class teca_programmable_algorithm : public teca_algorithm { public: diff --git a/core/teca_programmable_algorithm_fwd.h b/core/teca_programmable_algorithm_fwd.h deleted file mode 100644 index 626fcfd57..000000000 --- a/core/teca_programmable_algorithm_fwd.h +++ /dev/null @@ -1,32 +0,0 @@ -#ifndef teca_program_algorithm_fwd_h -#define teca_program_algorithm_fwd_h - -#include "teca_shared_object.h" -#include "teca_metadata.h" -#include "teca_dataset_fwd.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_programmable_algorithm) -TECA_SHARED_OBJECT_FORWARD_DECL(teca_threaded_programmable_algorithm) - -#ifdef SWIG -typedef void* report_callback_t; -typedef void* request_callback_t; -typedef void* execute_callback_t; -typedef void* threaded_execute_callback_t; -#else -using report_callback_t = std::function&)>; - -using request_callback_t = std::function( - unsigned int, const std::vector &, - const teca_metadata &)>; - -using execute_callback_t = std::function &, - const teca_metadata &)>; - -using threaded_execute_callback_t = std::function &, - const teca_metadata &, int)>; -#endif -#endif diff --git a/core/teca_programmable_reduce.h b/core/teca_programmable_reduce.h index a0e14dc99..f4bade029 100644 --- a/core/teca_programmable_reduce.h +++ b/core/teca_programmable_reduce.h @@ -1,23 +1,39 @@ #ifndef teca_programmable_reduce_h #define teca_programmable_reduce_h -#include "teca_programmable_reduce_fwd.h" -#include "teca_programmable_algorithm_fwd.h" -#include "teca_index_reduce.h" -#include "teca_dataset_fwd.h" +#include "teca_dataset.h" #include "teca_metadata.h" +#include "teca_shared_object.h" +#include "teca_programmable_algorithm.h" +#include "teca_index_reduce.h" #include #include +#include + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_programmable_reduce) + +#ifdef SWIG +typedef void* reduce_callback_t; +typedef void* finalize_callback_t; +#else +/// A callable that can reduce two datasets into one. +using reduce_callback_t = std::function; + +/// A callable that can finalize the reduction. +using finalize_callback_t = std::function; +#endif -// callbacks implement a user defined reduction over time steps +/// Callbacks implement a user defined reduction over time steps. /** -callbacks implement a reduction on teca_datasets over time steps. -user provides reduce callable that takes 2 datasets and produces -a thrid reduced dataset. callbacks should be threadsafe as this is -a parallel operation. see teca_index_reduce for details of -parallelization. -*/ + * Callbacks implement a reduction on teca_datasets over time steps. + * User provides reduce callable that takes 2 datasets and produces + * a third reduced dataset. Callbacks should be threadsafe as this is + * a parallel operation. See teca_index_reduce for details of + * parallelization. 
+ */ class teca_programmable_reduce : public teca_index_reduce { public: @@ -26,7 +42,7 @@ class teca_programmable_reduce : public teca_index_reduce ~teca_programmable_reduce(){} // set the implementation name, this is used in logging to - // identify the specific instance of programmable redeuce + // identify the specific instance of programmable reduce int set_name(const std::string &name); const char *get_class_name() const override diff --git a/core/teca_programmable_reduce_fwd.h b/core/teca_programmable_reduce_fwd.h deleted file mode 100644 index e17706fae..000000000 --- a/core/teca_programmable_reduce_fwd.h +++ /dev/null @@ -1,20 +0,0 @@ -#ifndef teca_program_reduce_fwd_h -#define teca_program_reduce_fwd_h - -#include "teca_shared_object.h" -#include "teca_dataset_fwd.h" -#include - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_programmable_reduce) - -#ifdef SWIG -typedef void* reduce_callback_t; -typedef void* finalize_callback_t; -#else -using reduce_callback_t = std::function; - -using finalize_callback_t = std::function; -#endif -#endif diff --git a/core/teca_shared_object.h b/core/teca_shared_object.h index 015c7d5af..739561127 100644 --- a/core/teca_shared_object.h +++ b/core/teca_shared_object.h @@ -1,14 +1,19 @@ #ifndef teca_shared_object_h #define teca_shared_object_h +/// @file + #include // convenience macro. every teca_algrotihm/dataset // should have the following forward declarations + #ifdef SWIG + // SWIG doesn't handle alias templates yet. OK for the // shared object forward but the shared object template // forward has no direct mapping into c++03. + #define TECA_SHARED_OBJECT_FORWARD_DECL(_cls) \ class _cls; \ typedef std::shared_ptr<_cls> p_##_cls; \ @@ -16,19 +21,28 @@ #define TECA_SHARED_OBJECT_TEMPLATE_FORWARD_DECL(_cls) \ template class _cls; + #else + #define TECA_SHARED_OBJECT_FORWARD_DECL(_cls) \ class _cls; \ + \ + /** a shared pointer to an instance of _cls */ \ using p_##_cls = std::shared_ptr<_cls>; \ + \ + /** A shared pointer to a const instance of _cls */ \ using const_p_##_cls = std::shared_ptr; #define TECA_SHARED_OBJECT_TEMPLATE_FORWARD_DECL(_cls) \ template class _cls; \ \ + /** a shared pointer to an instance of _cls */ \ template \ using p_##_cls = std::shared_ptr<_cls>; \ \ + /** A shared pointer to a const instance of _cls */ \ template \ using const_p_##_cls = std::shared_ptr>; + #endif #endif diff --git a/core/teca_string_util.cxx b/core/teca_string_util.cxx index d1288eb29..39eb1b754 100644 --- a/core/teca_string_util.cxx +++ b/core/teca_string_util.cxx @@ -85,5 +85,30 @@ int tokenize(char *istr, char delim, int n_cols, char **ostr) return 0; } +// ************************************************************************** +void remove_post_fix(std::set &arrays, std::string post_fix) +{ + size_t postfix_len = post_fix.length(); + + std::set::iterator arrays_it; + for (arrays_it=arrays.begin(); arrays_it!=arrays.end(); ++arrays_it) + { + std::string array_var = *arrays_it; + size_t array_var_len = array_var.length(); + + if (array_var_len > postfix_len) + { + size_t postfix_pos = array_var.find(post_fix, + array_var_len - postfix_len); + if (postfix_pos != std::string::npos) + { + array_var.erase(array_var_len - postfix_len, postfix_len); + + arrays.erase(arrays_it); + arrays.insert(array_var); + } + } + } } +} diff --git a/core/teca_string_util.h b/core/teca_string_util.h index e1d7ff54f..14d47897d 100644 --- a/core/teca_string_util.h +++ b/core/teca_string_util.h @@ -1,6 +1,8 @@ #ifndef teca_string_util_h #define teca_string_util_h +/// @file + 
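// [Editorial note] A sketch of the name=value parsing utilities declared later
// in this header. The functions take a mutable character buffer; the input
// string and variable names are illustrative:
//
//     char nv_pair[] = "n_threads = 4";
//     long n = 0;
//     if (teca_string_util::extract_value<long>(nv_pair, n))
//     {
//         // not a "name = value" pair, or the conversion failed
//     }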
#include "teca_common.h" #include @@ -8,25 +10,30 @@ #include #include #include +#include +/// Codes for dealing with string processing namespace teca_string_util { -// convert the characters between the first and second double -// quote to a std::string. Escaped characters are skipped. Return -// 0 if successful. +/** Convert the characters between the first and second double + * quote to a std::string. Escaped characters are skipped. Return + * 0 if successful. + */ int extract_string(const char *istr, std::string &field); -// scan the input string (istr) for the given a delimiter (delim). push a pointer -// to the first non-delimiter character and the first character after each -// instance of the delimiter. return zero if successful. when successful there -// will be at least one value. +/** Scan the input string (istr) for the given a delimiter (delim). push a pointer + * to the first non-delimiter character and the first character after each + * instance of the delimiter. return zero if successful. when successful there + * will be at least one value. + */ int tokenize(char *istr, char delim, int n_cols, char **ostr); -// scan the input string (istr) for the given a delimiter (delim). push a point -// to the first non-delimiter character and the first character after each -// instance of the delimiter. return zero if successful. when successful there -// will be at least one value. +/** Scan the input string (istr) for the given a delimiter (delim). push a point + * to the first non-delimiter character and the first character after each + * instance of the delimiter. return zero if successful. when successful there + * will be at least one value. + */ template > int tokenize(char *istr, char delim, container_t &ostr) { @@ -62,8 +69,9 @@ int tokenize(char *istr, char delim, container_t &ostr) return 0; } -// skip space, tabs, and new lines. return non-zero if the end of the string -// is reached before a non-pad character is encountered +/** Skip space, tabs, and new lines. return non-zero if the end of the string + * is reached before a non-pad character is encountered + */ inline int skip_pad(char *&buf) { @@ -73,7 +81,7 @@ int skip_pad(char *&buf) return *buf == '\0' ? -1 : 0; } -// return 0 if the first non-pad character is # +/// return 0 if the first non-pad character is # inline int is_comment(char *buf) { @@ -83,15 +91,17 @@ int is_comment(char *buf) return 0; } +/// A traits class for scanf conversion codes. 
template struct scanf_tt {}; -#define DECLARE_SCANF_TT(_CPP_T, _FMT_STR) \ -template<> \ -struct scanf_tt<_CPP_T> \ -{ \ - static \ - const char *format() { return _FMT_STR; } \ +#define DECLARE_SCANF_TT(_CPP_T, _FMT_STR) \ +template<> \ +/** A traits class for scanf conversion codes, specialized fo _CPP_T */ \ +struct scanf_tt<_CPP_T> \ +{ \ + static \ + const char *format() { return _FMT_STR; } \ }; DECLARE_SCANF_TT(float," %g") DECLARE_SCANF_TT(double," %lg") @@ -107,63 +117,66 @@ DECLARE_SCANF_TT(unsigned long, " %lu") DECLARE_SCANF_TT(unsigned long long, "%llu") DECLARE_SCANF_TT(std::string, " \"%128s") +/// A traits class for conversion from text to numbers template struct string_tt {}; -#define DECLARE_STR_CONVERSION_I(_CPP_T, _FUNC) \ -template <> \ -struct string_tt<_CPP_T> \ -{ \ - static const char *type_name() { return # _CPP_T; } \ - \ - static int convert(char *str, _CPP_T &val) \ - { \ - errno = 0; \ - char *endp = nullptr; \ - _CPP_T tmp = _FUNC(str, &endp, 0); \ - if (errno != 0) \ - { \ - TECA_ERROR("Failed to convert string \"" \ - << str << "\" to a nunber." << strerror(errno)) \ - return -1; \ - } \ - else if (endp == str) \ - { \ - TECA_ERROR("Failed to convert string \"" \ - << str << "\" to a nunber. Invalid string.") \ - return -1; \ - } \ - val = tmp; \ - return 0; \ - } \ +#define DECLARE_STR_CONVERSION_I(_CPP_T, _FUNC) \ +/** A traits class for conversion from text to numbers, specialized for _CPP_T */ \ +template <> \ +struct string_tt<_CPP_T> \ +{ \ + static const char *type_name() { return # _CPP_T; } \ + \ + static int convert(char *str, _CPP_T &val) \ + { \ + errno = 0; \ + char *endp = nullptr; \ + _CPP_T tmp = _FUNC(str, &endp, 0); \ + if (errno != 0) \ + { \ + TECA_ERROR("Failed to convert string \"" \ + << str << "\" to a nunber." << strerror(errno)) \ + return -1; \ + } \ + else if (endp == str) \ + { \ + TECA_ERROR("Failed to convert string \"" \ + << str << "\" to a nunber. Invalid string.") \ + return -1; \ + } \ + val = tmp; \ + return 0; \ + } \ }; -#define DECLARE_STR_CONVERSION_F(_CPP_T, _FUNC) \ -template <> \ -struct string_tt<_CPP_T> \ -{ \ - static const char *type_name() { return # _CPP_T; } \ - \ - static int convert(const char *str, _CPP_T &val) \ - { \ - errno = 0; \ - char *endp = nullptr; \ - _CPP_T tmp = _FUNC(str, &endp); \ - if (errno != 0) \ - { \ - TECA_ERROR("Failed to convert string \"" \ - << str << "\" to a nunber." << strerror(errno)) \ - return -1; \ - } \ - else if (endp == str) \ - { \ - TECA_ERROR("Failed to convert string \"" \ - << str << "\" to a nunber. Invalid string.") \ - return -1; \ - } \ - val = tmp; \ - return 0; \ - } \ +#define DECLARE_STR_CONVERSION_F(_CPP_T, _FUNC) \ +/** A traits class for conversion from text to numbers, specialized for _CPP_T */ \ +template <> \ +struct string_tt<_CPP_T> \ +{ \ + static const char *type_name() { return # _CPP_T; } \ + \ + static int convert(const char *str, _CPP_T &val) \ + { \ + errno = 0; \ + char *endp = nullptr; \ + _CPP_T tmp = _FUNC(str, &endp); \ + if (errno != 0) \ + { \ + TECA_ERROR("Failed to convert string \"" \ + << str << "\" to a nunber." << strerror(errno)) \ + return -1; \ + } \ + else if (endp == str) \ + { \ + TECA_ERROR("Failed to convert string \"" \ + << str << "\" to a nunber. 
Invalid string.") \ + return -1; \ + } \ + val = tmp; \ + return 0; \ + } \ }; DECLARE_STR_CONVERSION_F(float, strtof) @@ -174,6 +187,7 @@ DECLARE_STR_CONVERSION_I(int, strtol) DECLARE_STR_CONVERSION_I(long, strtoll) DECLARE_STR_CONVERSION_I(long long, strtoll) +/// A traits class for conversion from text to numbers, specialized for bool template <> struct string_tt { @@ -206,6 +220,7 @@ struct string_tt } }; +/// A traits class for conversion from text to numbers, specialized for std::string template <> struct string_tt { @@ -218,8 +233,9 @@ struct string_tt } }; - -// watch out for memory leak, val needs to be free'd +/** A traits class for conversion from text to numbers, specialized for char* + * watch out for memory leak, val needs to be free'd + */ template <> struct string_tt { @@ -232,9 +248,10 @@ struct string_tt } }; -// extract the value in a "name = value" pair. -// an error occurs if splitting the input on '=' doesn't produce 2 tokens -// or if the conversion to val_t fails. returns 0 if successful. +/** Extract the value in a "name = value" pair. + * an error occurs if splitting the input on '=' doesn't produce 2 tokens + * or if the conversion to val_t fails. returns 0 if successful. + */ template int extract_value(char *l, val_t &val) { @@ -256,6 +273,18 @@ int extract_value(char *l, val_t &val) return 0; } +/** Given a collection of strings, where some of the strings end with a common + * substring, the post-fix, this function visits each string in the collection + * and removes the post-fix from each string that it is found in. + */ +void remove_post_fix(std::set &names, std::string post_fix); + +/// When passed the string "" return empty string otherwise return the passed string +inline std::string emptystr(const std::string &in) +{ + return (in == "\"\"" ? std::string() : in); +} + } #endif diff --git a/core/teca_system_util.h b/core/teca_system_util.h index 2139501ef..dd7946c25 100644 --- a/core/teca_system_util.h +++ b/core/teca_system_util.h @@ -1,21 +1,25 @@ #ifndef teca_system_util_h #define teca_system_util_h +/// @file + #include "teca_common.h" #include "teca_string_util.h" #include +/// Codes for dealing with low level system API's namespace teca_system_util { -// initialize val with the environment variable named by var converted to a -// numeric type. Only floating point and signed integers are implemented. For -// unsigned types, check that the return is greater or equal to zero. -// -// returns: -// 0 if the variable was found and val was initialized from it -// 1 if the varibale was not found -// -1 if the variable was found but conversion from string failed +/** initialize val with the environment variable named by var converted to a + * numeric type. Only floating point and signed integers are implemented. For + * unsigned types, check that the return is greater or equal to zero. + * + * returns: + * 0 if the variable was found and val was initialized from it + * 1 if the varibale was not found + * -1 if the variable was found but conversion from string failed + */ template int get_environment_variable(const char *var, T &val) { @@ -33,14 +37,16 @@ int get_environment_variable(const char *var, T &val) return 1; } -// extract the value of the named command line argument. -// return 0 if successful. If require is not zero then an error -// will be reported if the argument is not present. +/** extract the value of the named command line argument. return 0 if + * successful. 
If require is not zero then an error will be reported if the + * argument is not present. + */ int get_command_line_option(int argc, char **argv, const char *arg_name, int require, std::string &arg_val); -// check for the presence of the name command line option. -// return non-zero if it is found. +/** check for the presence of the name command line option. return non-zero if + * it is found. + */ int command_line_option_check(int argc, char **argv, const char *arg_name); } diff --git a/core/teca_thread_pool.h b/core/teca_thread_pool.h index 55721111b..9c31bf704 100644 --- a/core/teca_thread_pool.h +++ b/core/teca_thread_pool.h @@ -2,7 +2,7 @@ #define teca_thread_pool_h #include "teca_common.h" -#include "teca_algorithm_fwd.h" +#include "teca_algorithm.h" #include "teca_thread_util.h" #include "teca_threadsafe_queue.h" #include "teca_mpi.h" @@ -26,8 +26,7 @@ class teca_thread_pool; template using p_teca_thread_pool = std::shared_ptr>; -// a class to manage a fixed size pool of threads that dispatch -// I/O work +/// A class to manage a fixed size pool of threads that dispatch I/O work. template class teca_thread_pool { @@ -113,8 +112,16 @@ void teca_thread_pool::create_threads(MPI_Comm comm, int n_threads = n_requested; std::deque core_ids; - teca_thread_util::thread_parameters(comm, -1, - n_requested, bind, verbose, n_threads, core_ids); + + if (teca_thread_util::thread_parameters(comm, -1, + n_requested, bind, verbose, n_threads, core_ids)) + { + TECA_WARNING("Failed to detetermine thread parameters." + " Falling back to 1 thread, affinity disabled.") + + n_threads = 1; + bind = false; + } // allocate the threads for (int i = 0; i < n_threads; ++i) diff --git a/core/teca_thread_util.cxx b/core/teca_thread_util.cxx index 3a7fe5fd7..e0c2c46e7 100644 --- a/core/teca_thread_util.cxx +++ b/core/teca_thread_util.cxx @@ -296,7 +296,7 @@ int thread_parameters(MPI_Comm comm, int base_core_id, int n_requested, (void)affinity; if (n_requested < 1) { - TECA_WARNING("Cannot autmatically detect threading parameters " + TECA_WARNING("Can not automatically detect threading parameters " "on this platform. The default is 1 thread per process.") n_threads = 1; } @@ -368,14 +368,17 @@ int thread_parameters(MPI_Comm comm, int base_core_id, int n_requested, } // if the user runs more MPI ranks than cores some of the ranks - // will have no cores to use. fallback to 1 thread on core 0 - if (n_threads < 1) + // will have no cores to use. + if (n_procs > cores_per_node) { + TECA_WARNING(<< n_procs << " MPI ranks running on this node but only " + << cores_per_node << " CPU cores are available. Performance will" + " be degraded.") + n_threads = 1; - affinity.push_back(0); - TECA_WARNING("CPU cores are unavailable, performance will be degraded. " - "This can occur when running more MPI ranks than there are CPU " - "cores. Launching 1 thread on core 0.") + affinity.push_back(base_core_id); + + return -1; } // stop now if we are not binding threads to cores @@ -401,7 +404,7 @@ int thread_parameters(MPI_Comm comm, int base_core_id, int n_requested, // there are enough cores that each thread can have it's own core // mark the cores which have the root thread as used so that we skip them. - // if we always did this in the fully apcked case we'd always be assigning + // if we always did this in the fully packed case we'd always be assigning // hyperthreads off core. it is better to keep them local. 
if (((n_threads+1)*n_procs) < cores_per_node) { diff --git a/core/teca_thread_util.h b/core/teca_thread_util.h index 44fb40f13..a0f45ce81 100644 --- a/core/teca_thread_util.h +++ b/core/teca_thread_util.h @@ -1,62 +1,66 @@ #ifndef teca_thread_utils_h #define teca_thread_utils_h +/// @file + #include "teca_common.h" #include "teca_mpi.h" #include +/// Codes for dealing with threading namespace teca_thread_util { -// load balances threads across an MPI communication space such that on the -// individual nodes physical cores each receive the same number of threads. -// This is an MPI collective call. Building the affinity map relies on -// features available only in _GNU_SOURCE. On systems where these features are -// unavailable, when automated detection of the number of threads is requested, -// the call will fail and the n_threads will be set to 1, -// -// comm - an MPI communcation space to load balance threads across. -// the communicator is used to coordinate affinity mapping such that -// each rank can allocate a number of threads bound to unique cores. -// -// base_core_id - identifies the core in use by this MPI rank's main -// thread. if -1 is passed this will be automatically -// determined. -// -// n_requested - the number of requested threads per rank. Passing a value of -// -1 results in use of all the cores on the node such that each -// physical core is assigned exactly 1 thread. Note that for -// performance reasons hyperthreads are not used here. The -// suggested number of threads is retruned in n_threads, and the -// returned affinity map specifies which core the thread should -// be bound to to acheive this. Passing n_requested >= 1 -// specifies a run time override. This indicates that caller -// wants to use a specific number of threads, rather than one per -// physical core. In this case the affinity map is also -// constructed. -// -// bind - if true extra work is done to determine an affinity map such -// that each thread can be bound to a unique core on the node. -// -// verbose - prints a report decribing the affinity map. -// -// n_threads - if n_requested is -1, this will be set to the number of threads -// one can use such that there is one thread per phycial core -// taking into account all ranks running on the node. if -// n_requested is >= 1 n_threads will be set to n_requested. This -// allows a run time override for cases when the caller knows how -// she wants to schedule things. if an error occurs and n_requested -// is -1 this will be set to 1. -// -// affinity - an affinity map, describing for each of n_threads, -// a core id that the thread can be bound to. if n_requested is -1 -// then the map will conatin an entry for each of n_threads where -// each of the threads is assigned a unique phyical core. when -// n_requested is >= 1 the map contains an enrty for each of the -// n_requested threads such that when more threads are requested -// than cores each core is assigned approximately the same number of -// threads. -// -// return 0 on success +/** load balances threads across an MPI communication space such that on the + * individual nodes physical cores each receive the same number of threads. + * This is an MPI collective call. Building the affinity map relies on + * features available only in _GNU_SOURCE. 
On systems where these features are
+ * unavailable, when automated detection of the number of threads is requested,
+ * the call will fail and n_threads will be set to 1.
+ *
+ * @param[in] comm an MPI communication space to load balance threads across.
+ * the communicator is used to coordinate affinity mapping such that
+ * each rank can allocate a number of threads bound to unique cores.
+ *
+ * @param[in] base_core_id identifies the core in use by this MPI rank's main
+ * thread. if -1 is passed this will be automatically
+ * determined.
+ *
+ * @param[in] n_requested the number of requested threads per rank. Passing a value of
+ * -1 results in use of all the cores on the node such that each
+ * physical core is assigned exactly 1 thread. Note that for
+ * performance reasons hyperthreads are not used here. The
+ * suggested number of threads is returned in n_threads, and the
+ * returned affinity map specifies which core the thread should
+ * be bound to in order to achieve this. Passing n_requested >= 1
+ * specifies a run time override. This indicates that the caller
+ * wants to use a specific number of threads, rather than one per
+ * physical core. In this case the affinity map is also
+ * constructed.
+ *
+ * @param[in] bind if true extra work is done to determine an affinity map such
+ * that each thread can be bound to a unique core on the node.
+ *
+ * @param[in] verbose prints a report describing the affinity map.
+ *
+ * @param[in,out] n_threads if n_requested is -1, this will be set to the number of threads
+ * one can use such that there is one thread per physical core
+ * taking into account all ranks running on the node. if
+ * n_requested is >= 1 n_threads will be set to n_requested. This
+ * allows a run time override for cases when the caller knows how
+ * they want to schedule things. if an error occurs and n_requested
+ * is -1 this will be set to 1.
+ *
+ * @param[out] affinity an affinity map, describing for each of n_threads,
+ * a core id that the thread can be bound to. if n_requested is -1
+ * then the map will contain an entry for each of n_threads where
+ * each of the threads is assigned a unique physical core. when
+ * n_requested is >= 1 the map contains an entry for each of the
+ * n_requested threads such that when more threads are requested
+ * than cores each core is assigned approximately the same number of
+ * threads.
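+ *
+ * A minimal usage sketch (the element type of the affinity deque is assumed
+ * to be int here; names are illustrative):
+ *
+ * @code
+ * int n_threads = -1;
+ * std::deque<int> affinity;
+ * if (teca_thread_util::thread_parameters(MPI_COMM_WORLD, -1, -1,
+ *     true, false, n_threads, affinity))
+ * {
+ *     // detection failed, fall back to a single unbound thread
+ *     n_threads = 1;
+ * }
+ * @endcode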
+ * + * @returns 0 on success + */ int thread_parameters(MPI_Comm comm, int base_core_id, int n_requested, bool bind, bool verbose, int &n_threads, std::deque &affinity); }; diff --git a/core/teca_threaded_algorithm.cxx b/core/teca_threaded_algorithm.cxx index 42848e1ea..0578aef3e 100644 --- a/core/teca_threaded_algorithm.cxx +++ b/core/teca_threaded_algorithm.cxx @@ -73,7 +73,7 @@ void teca_threaded_algorithm_internals::thread_pool_resize(MPI_Comm comm, // -------------------------------------------------------------------------- -teca_threaded_algorithm::teca_threaded_algorithm() : verbose(0), +teca_threaded_algorithm::teca_threaded_algorithm() : bind_threads(1), stream_size(-1), poll_interval(1000000), internals(new teca_threaded_algorithm_internals) { @@ -95,20 +95,22 @@ void teca_threaded_algorithm::get_properties_description( opts.add_options() TECA_POPTS_GET(int, prefix, bind_threads, - "bind software threads to hardware cores (1)") + "bind software threads to hardware cores") TECA_POPTS_GET(int, prefix, verbose, - "print a run time report of settings (0)") + "print a run time report of settings") TECA_POPTS_GET(int, prefix, thread_pool_size, "number of threads in pool. When n == -1, 1 thread per core is " - "created (-1)") + "created") TECA_POPTS_GET(int, prefix, stream_size, "number of datasests to pass per execute call. -1 means wait " - "for all. (-1)") + "for all.") TECA_POPTS_GET(long, prefix, poll_interval, "number of nanoseconds to wait between scans of the thread pool " - "for completed tasks (1.0e6)") + "for completed tasks") ; + this->teca_algorithm::get_properties_description(prefix, opts); + global_opts.add(opts); } @@ -116,6 +118,8 @@ void teca_threaded_algorithm::get_properties_description( void teca_threaded_algorithm::set_properties(const std::string &prefix, variables_map &opts) { + this->teca_algorithm::set_properties(prefix, opts); + TECA_POPTS_SET(opts, int, prefix, bind_threads) TECA_POPTS_SET(opts, int, prefix, verbose) diff --git a/core/teca_threaded_algorithm.h b/core/teca_threaded_algorithm.h index 7f02f670a..77451662b 100644 --- a/core/teca_threaded_algorithm.h +++ b/core/teca_threaded_algorithm.h @@ -2,9 +2,11 @@ #define teca_threaded_algorithm_h #include "teca_algorithm.h" -#include "teca_threaded_algorithm_fwd.h" -#include "teca_algorithm_output_port.h" #include "teca_dataset.h" +#include "teca_shared_object.h" + +#include +#include template class teca_thread_pool; @@ -12,24 +14,35 @@ class teca_thread_pool; class teca_metadata; class teca_threaded_algorithm_internals; -#include -#include +TECA_SHARED_OBJECT_FORWARD_DECL(teca_threaded_algorithm) -// declare the thread pool type +/// Task type for tasks returing a pointer to teca_dataset using teca_data_request_task = std::packaged_task; class teca_data_request; + +/// A thread pool for processing teca_data_request_task using teca_data_request_queue = teca_thread_pool; +/// A pointer to teca_data_request_queue using p_teca_data_request_queue = std::shared_ptr; +/** Allocate and initialize a new thread pool. + * comm [in] The communicator to allocate thread across + * n [in] The number of threads to create per MPI rank. Use -1 to + * map one thread per physical core on each node. + * bind [in] If set then thread will be bound to a specific core. + * verbose [in] If set then the mapping is sent to the stderr + */ p_teca_data_request_queue new_teca_data_request_queue(MPI_Comm comm, int n, bool bind, bool verbose); -// this is the base class defining a threaded algorithm. 
-// the stratgey employed is to parallelize over upstream -// data requests using a thread pool. +/// This is the base class defining a threaded algorithm. +/** + * The strategy employed is to parallelize over upstream + * data requests using a thread pool. + */ class teca_threaded_algorithm : public teca_algorithm { public: @@ -43,29 +56,46 @@ class teca_threaded_algorithm : public teca_algorithm TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION() TECA_SET_ALGORITHM_PROPERTIES() - // set/get the number of threads in the pool. setting - // to -1 results in a thread per core factoring in all MPI - // ranks running on the node. the default is -1. + /** Set the number of threads in the pool. setting to -1 results in a + * thread per core factoring in all MPI ranks running on the node. + */ void set_thread_pool_size(int n_threads); - unsigned int get_thread_pool_size() const noexcept; - - // set/get the verbosity level. - TECA_ALGORITHM_PROPERTY(int, verbose); - - // set/get thread affinity mode. When 0 threads are not bound - // CPU cores, allowing for migration among all cores. This will - // likely degrade performance. Default is 1. - TECA_ALGORITHM_PROPERTY(int, bind_threads); - // set the smallest number of datasets to gather per call to - // execute. the default (-1) results in all datasets being - // gathered. In practice more datasets will be returned if - // ready - TECA_ALGORITHM_PROPERTY(int, stream_size); + /// Get the number of threads in the pool. + unsigned int get_thread_pool_size() const noexcept; - // set the duration in nano seconds to wait between checking - // for completed tasks - TECA_ALGORITHM_PROPERTY(long long, poll_interval); + /** @name verbose + * set/get the verbosity level. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(int, verbose) + ///@} + + /** @name bind_threads + * set/get thread affinity mode. When 0 threads are not bound CPU cores, + * allowing for migration among all cores. This will likely degrade + * performance. Default is 1. + */ + ///@{ + TECA_ALGORITHM_PROPERTY(int, bind_threads) + ///@} + + /** @name stream_size + * set the smallest number of datasets to gather per call to execute. the + * default (-1) results in all datasets being gathered. In practice more + * datasets will be returned if ready + */ + ///@{ + TECA_ALGORITHM_PROPERTY(int, stream_size) + ///@} + + /** @name poll_interval + * set the duration in nanoseconds to wait between checking for completed + * tasks + */ + ///@{ + TECA_ALGORITHM_PROPERTY(long long, poll_interval) + ///@} // explicitly set the thread pool to submit requests to void set_data_request_queue(const p_teca_data_request_queue &queue); @@ -88,12 +118,12 @@ class teca_threaded_algorithm : public teca_algorithm const teca_metadata &request) override; // driver function that manages execution of the given - // requst on the named port. each upstream request issued + // request on the named port. each upstream request issued // will be executed by the thread pool. 
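    // when streaming (stream_size >= 1) the gathered datasets are passed to
    // execute incrementally, at least stream_size at a time, rather than
    // waiting for all of them.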
const_p_teca_dataset request_data(teca_algorithm_output_port &port, const teca_metadata &request) override; + private: - int verbose; int bind_threads; int stream_size; long long poll_interval; diff --git a/core/teca_threaded_algorithm_fwd.h b/core/teca_threaded_algorithm_fwd.h deleted file mode 100644 index 5d3eb6fef..000000000 --- a/core/teca_threaded_algorithm_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_threaded_algorithm_fwd_h -#define teca_threaded_algorithm_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_threaded_algorithm) - -#endif diff --git a/core/teca_threaded_programmable_algorithm.h b/core/teca_threaded_programmable_algorithm.h index a120a3a9c..444748b0a 100644 --- a/core/teca_threaded_programmable_algorithm.h +++ b/core/teca_threaded_programmable_algorithm.h @@ -2,67 +2,66 @@ #define teca_threaded_programmable_algorithm_h #include "teca_metadata.h" +#include "teca_dataset.h" #include "teca_threaded_algorithm.h" -#include "teca_dataset_fwd.h" +#include "teca_programmable_algorithm.h" -#include "teca_programmable_algorithm_fwd.h" - -/// an algorithm implemented with user provided callbacks +/// An threaded algorithm implemented with user provided callbacks. /** -This version of the teca_programmable_algorithm is threaded. A thread pool -(call set_thread_pool_size to initialize) executes the upstream pipeline -asynchronously for each request made. Hence, this version of the prpogrammable -algorithm is most useful when there are multiple requests to be processed. Data -from the set of requests can be processed incrementally when streaming (see -set_stream_size to initialize). If one doesn't need these features it is -better to use the teca_programmable_algorithm instead. See -teca_threaded_algorithm for more details about threaded execution. - -The user can provide a callback for each of the three phases -of pipeline execution. The number of input and output ports -can also be set for filters (1 or more inputs, 1 or more outputs) -sources, (no inputs, 1 or more outputs), or sinks (1 or more -inputs, no outputs). - -1) report phase. the report callback returns metadata - describing data that can be produced. The report callback - is optional. It's only needed if the algorithm will produce - new data or transform metadata. - - the report callback must be callable with signature: - teca_metadata(unsigned int) - -2) request phase. the request callback generates a vector of - requests(metadata objects) that inform the upstream of - what data to generate. The request callback is optional. - It's only needed if the algorithm needs data from the - upstream or transform metadata. - - the request callback must be callable with the signature: - std::vector( - unsigned int, - const std::vector &, - const teca_metadata &) - -3) execute phase. the execute callback is used to do useful - work on incoming or outgoing data. Examples include - generating new datasets, processing datasets, reading - and writing data to/from disk, and so on. The execute - callback is optional. - - the execute callback must be callable with the signature: - const_p_teca_dataset( - unsigned int, const std::vector &, - const teca_metadata &, int) - -see also: - -set_number_of_input_connections -set_number_of_output_ports -set_report_callback -set_request_callback -set_execute_callback -*/ + * This version of the teca_programmable_algorithm is threaded. 
A thread pool + * (call set_thread_pool_size to initialize) executes the upstream pipeline + * asynchronously for each request made. Hence, this version of the + * programmable algorithm is most useful when there are multiple requests to + * be processed. Data from the set of requests can be processed incrementally + * when streaming (see set_stream_size to initialize). If one doesn't need + * these features it is better to use the teca_programmable_algorithm instead. + * See teca_threaded_algorithm for more details about threaded execution. + * + * The user can provide a callback for each of the three phases + * of pipeline execution. The number of input and output ports + * can also be set for filters (1 or more inputs, 1 or more outputs) + * sources, (no inputs, 1 or more outputs), or sinks (1 or more + * inputs, no outputs). + * + * 1) report phase. the report callback returns metadata + * describing data that can be produced. The report callback + * is optional. It's only needed if the algorithm will produce + * new data or transform metadata. + * + * the report callback must be callable with signature: + * teca_metadata(unsigned int) + * + * 2) request phase. the request callback generates a vector of + * requests(metadata objects) that inform the upstream of + * what data to generate. The request callback is optional. + * It's only needed if the algorithm needs data from the + * upstream or transform metadata. + * + * the request callback must be callable with the signature: + * std::vector( + * unsigned int, + * const std::vector &, + * const teca_metadata &) + * + * 3) execute phase. the execute callback is used to do useful + * work on incoming or outgoing data. Examples include + * generating new datasets, processing datasets, reading + * and writing data to/from disk, and so on. The execute + * callback is optional. + * + * the execute callback must be callable with the signature: + * const_p_teca_dataset( + * unsigned int, const std::vector &, + * const teca_metadata &, int) + * + * see also: + * + * set_number_of_input_connections + * set_number_of_output_ports + * set_report_callback + * set_request_callback + * set_execute_callback + */ class teca_threaded_programmable_algorithm : public teca_threaded_algorithm { public: @@ -80,7 +79,7 @@ class teca_threaded_programmable_algorithm : public teca_threaded_algorithm using teca_algorithm::set_number_of_input_connections; using teca_algorithm::set_number_of_output_ports; - // set the number of threads. The default is -1. + // set the number of threads. The default is -1. using teca_threaded_algorithm::set_thread_pool_size; // set the stream size. the default -1 disables streaming. diff --git a/core/teca_threadsafe_queue.h b/core/teca_threadsafe_queue.h index 27d10cdae..a15769686 100644 --- a/core/teca_threadsafe_queue.h +++ b/core/teca_threadsafe_queue.h @@ -5,6 +5,7 @@ #include #include +/// A thread safe queue template class teca_threadsafe_queue { diff --git a/core/teca_type_select.h b/core/teca_type_select.h index c480465d6..a372f706d 100644 --- a/core/teca_type_select.h +++ b/core/teca_type_select.h @@ -1,28 +1,45 @@ #ifndef teca_type_elevate_h #define teca_type_elevate_h +/// @file + +/// Select a type based on input type(s) namespace teca_type_select { -// given two arguments, an elevate cast, selects -// the type of or casts to the higher precision -// type. note that given a signed and unsigned -// argument, signed type is selected. +/// Select the higher precision type. 
+/** Given two arguments, an elevate cast, selects the type of or casts to the + * higher precision type. note that given a signed and unsigned argument, + * signed type is selected. + * + * @tparam t1 first input type + * @tparam t2 second input type + */ template struct elevate {}; -// given two areuments, a decay cast, selects the -// type of or casts to the lower precision -// type. note that given a signed and unsigned -// argument, unsigned type is selected. +/// Select the lower precision type. +/** Given two arguments, a decay cast, selects the type of or casts to the lower + * precision type. note that given a signed and unsigned argument, unsigned + * type is selected. + * + * @tparam t1 first input type + * @tparam t2 second input type + */ template struct decay {}; #define teca_type_select(_class, _ret, _t1, _t2) \ +/** Given _t1 and _t2 _class to _ret */ \ template <> \ struct _class<_t1, _t2> \ { \ + /** _class result type */ \ using type = _ret; \ + \ + /** cast to _ret */ \ static _ret cast(_t1 arg){ return arg; } \ + \ + /** name of the _class result type */ \ static constexpr const char *type_name() \ { return #_ret; } \ }; diff --git a/core/teca_uuid.h b/core/teca_uuid.h index e8ba10eca..09002f755 100644 --- a/core/teca_uuid.h +++ b/core/teca_uuid.h @@ -5,7 +5,7 @@ #include -// a universally uniquer identifier +/// A universally uniquer identifier. class teca_uuid : public boost::uuids::uuid { public: diff --git a/core/teca_variant_array.h b/core/teca_variant_array.h index e68869138..4d34243b2 100644 --- a/core/teca_variant_array.h +++ b/core/teca_variant_array.h @@ -1,6 +1,8 @@ #ifndef teca_variant_array_h #define teca_variant_array_h +/// @file + #include #include #include @@ -14,27 +16,273 @@ #include "teca_common.h" #include "teca_binary_stream.h" -#include "teca_variant_array_fwd.h" #include "teca_bad_cast.h" +#include "teca_shared_object.h" + +TECA_SHARED_OBJECT_FORWARD_DECL(teca_variant_array) +TECA_SHARED_OBJECT_TEMPLATE_FORWARD_DECL(teca_variant_array_impl) + +#ifndef SWIG +using teca_string_array = teca_variant_array_impl; +using p_teca_string_array = std::shared_ptr>; +using const_p_teca_string_array = std::shared_ptr>; + +using teca_float_array = teca_variant_array_impl; +using p_teca_float_array = std::shared_ptr>; +using const_p_teca_float_array = std::shared_ptr>; + +using teca_double_array = teca_variant_array_impl; +using p_teca_double_array = std::shared_ptr>; +using const_p_teca_double_array = std::shared_ptr>; + +using teca_char_array = teca_variant_array_impl; +using p_teca_char_array = std::shared_ptr>; +using const_p_teca_char_array = std::shared_ptr>; + +using teca_unsigned_char_array = teca_variant_array_impl; +using p_teca_unsigned_char_array = std::shared_ptr>; +using const_p_teca_unsigned_char_array = std::shared_ptr>; + +using teca_short_array = teca_variant_array_impl; +using p_teca_short_array = std::shared_ptr>; +using const_p_teca_short_array = std::shared_ptr>; + +using teca_unsigned_short_array = teca_variant_array_impl; +using p_teca_unsigned_short_array = std::shared_ptr>; +using const_p_teca_unsigned_short_array = std::shared_ptr>; + +using teca_int_array = teca_variant_array_impl; +using p_teca_int_array = std::shared_ptr>; +using const_p_teca_int_array = std::shared_ptr>; + +using teca_unsigned_int_array = teca_variant_array_impl; +using p_teca_unsigned_int_array = std::shared_ptr>; +using const_p_teca_unsigned_int_array = std::shared_ptr>; + +using teca_long_array = teca_variant_array_impl; +using p_teca_long_array = 
std::shared_ptr>; +using const_p_teca_long_array = std::shared_ptr>; + +using teca_unsigned_long_array = teca_variant_array_impl; +using p_teca_unsigned_long_array = std::shared_ptr>; +using const_p_teca_unsigned_long_array = std::shared_ptr>; + +using teca_long_long_array = teca_variant_array_impl; +using p_teca_long_long_array = std::shared_ptr>; +using const_p_teca_long_long_array = std::shared_ptr>; + +using teca_unsigned_long_long_array = teca_variant_array_impl; +using p_teca_unsigned_long_long_array = std::shared_ptr>; +using const_p_teca_unsigned_long_long_array = std::shared_ptr>; + +using teca_size_t_array = teca_variant_array_impl; +using p_teca_size_t_array = std::shared_ptr>; +using const_p_teca_size_t_array = std::shared_ptr>; +#endif + +/** this is a convenience macro to be used to declare a static + * New method that will be used to construct new objects in + * shared_ptr's. This manages the details of interoperability + * with std C++11 shared pointer + */ +#define TECA_VARIANT_ARRAY_STATIC_NEW(T, t) \ + \ +/** Allocate a T */ \ +static std::shared_ptr> New() \ +{ \ + return std::shared_ptr>(new T); \ +} \ + \ +/** Allocate a T of size n */ \ +static std::shared_ptr> New(size_t n) \ +{ \ + return std::shared_ptr>(new T(n)); \ +} \ + \ +/** Allocate a T of size n initialized with v */ \ +static std::shared_ptr> New(size_t n, const t &v) \ +{ \ + return std::shared_ptr>(new T(n, v)); \ +} \ + \ +/** Allocate a T initialized with n values from vals */ \ +static std::shared_ptr> New(const t *vals, size_t n) \ +{ \ + return std::shared_ptr>(new T(vals, n)); \ +} \ + \ +using teca_variant_array::shared_from_this; \ + \ +std::shared_ptr shared_from_this() \ +{ \ + return std::static_pointer_cast(shared_from_this()); \ +} \ + \ +std::shared_ptr shared_from_this() const \ +{ \ + return std::static_pointer_cast(shared_from_this()); \ +} + + + -// tag for ops on POD data + + + + +/// @cond +/// A tag for dispatching operations on POD data template struct pod_dispatch : std::integral_constant::value> {}; -// tag for ops on classes +/// A tag for disp[atching operations on classes template struct object_dispatch : std::integral_constant::value> {}; +/// @endcond + +/** Executes the code in body if p is a tt + * @param tt derived container + * @param nt contained type + * @param p base class pointer + * @param body the code to execute if the type matches + * + * The following aliases are provided to know the type within the code to execute. + * + * using TT = tt; + * using NT = nt; + * + */ +#define TEMPLATE_DISPATCH_CASE(tt, nt, p, body) \ + if (dynamic_cast*>(p)) \ + { \ + using TT = tt; \ + using NT = nt; \ + body \ + } + +/** Executes the code in body if p is a tt an idnetifier disambiguates type + * aliases when nested + * + * @param tt derived container + * @param nt contained type + * @param p base class pointer + * @param i identifier + * @param body the code to execute if the type matches + * + * The following aliases are provided to know the type within the code to execute. 
+ * + * using TT##i = tt; + * using NT##i = nt; + * + */ +#define NESTED_TEMPLATE_DISPATCH_CASE(tt, nt, p, i, body) \ + if (dynamic_cast*>(p)) \ + { \ + using TT##i = tt; \ + using NT##i = nt; \ + body \ + } + +/// Executes the code in body if p is a t where nt is a floating point type +#define TEMPLATE_DISPATCH_FP(t, p, body) \ + TEMPLATE_DISPATCH_CASE(t, float, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, double, p, body) + +/// Executes the code in body if p is a t where nt is a signed inetegral type +#define TEMPLATE_DISPATCH_SI(t, p, body) \ + TEMPLATE_DISPATCH_CASE(t, long long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, short int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, char, p, body) + +/// Executes the code in body if p is a t where nt is either a signed integral or floating point type +#define TEMPLATE_DISPATCH_FP_SI(t, p, body) \ + TEMPLATE_DISPATCH_CASE(t, float, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, double, p, body) \ + else TEMPLATE_DISPATCH_SI(t, p, body) + +/// Executes the code in body if p is a t where nt is an integral type +#define TEMPLATE_DISPATCH_I(t, p, body) \ + TEMPLATE_DISPATCH_CASE(t, long long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, unsigned long long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, unsigned int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, unsigned long, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, short int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, short unsigned int, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, char, p, body) \ + else TEMPLATE_DISPATCH_CASE(t, unsigned char, p, body) + +/** A macro for accessing the typed contents of a teca_variant_array + * @param t container type + * @param p pointer to an instance to match on + * @param body code to execute on match + * + * See #TEMPLATE_DISPATCH_CASE for details. + */ +#define TEMPLATE_DISPATCH(t, p, body) \ + TEMPLATE_DISPATCH_FP(t, p, body) \ + else TEMPLATE_DISPATCH_I(t, p, body) + +/** A macro for accessing the floating point typed contents of a teca_variant_array + * @param t container type + * @param p pointer to an instance to match on + * @param i an indentifier to use with type aliases + * @param body code to execute on match + * + * See #NESTED_TEMPLATE_DISPATCH_CASE for details. + */ +#define NESTED_TEMPLATE_DISPATCH_FP(t, p, i, body) \ + NESTED_TEMPLATE_DISPATCH_CASE(t, float, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, double, p, i, body) + +/** A macro for accessing the inetgral typed contents of a teca_variant_array + * @param t container type + * @param p pointer to an instance to match on + * @param i an indentifier to use with type aliases + * @param body code to execute on match + * + * See #NESTED_TEMPLATE_DISPATCH_CASE for details. 
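+ *
+ * For example, a sketch that sums an array whose integral element type is
+ * resolved at run time (the array contents here are illustrative):
+ *
+ * @code
+ * p_teca_variant_array a = teca_int_array::New(16, 1);
+ * long long total = 0;
+ * NESTED_TEMPLATE_DISPATCH_I(teca_variant_array_impl, a.get(), _A,
+ *     const NT_A *pa = static_cast<TT_A*>(a.get())->get();
+ *     for (size_t i = 0; i < a->size(); ++i)
+ *         total += pa[i];
+ *     )
+ * @endcode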
+ */ +#define NESTED_TEMPLATE_DISPATCH_I(t, p, i, body) \ + NESTED_TEMPLATE_DISPATCH_CASE(t, long long, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned long long, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, long, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, int, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned int, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned long, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, short int, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, short unsigned int, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, char, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned char, p, i, body) -/// type agnostic container for array based data -/** -type agnostic container for array based data. -*/ +/** \def NESTED_TEMPLATE_DISPATCH(t, p, i, body) + * A macro for accessing the typed contents of a teca_variant_array + * @param t container type + * @param p pointer to an instance to match on + * @param i an indentifier to use with type aliases + * @param body code to execute on match + * + * See #NESTED_TEMPLATE_DISPATCH_CASE for details. + */ +#define NESTED_TEMPLATE_DISPATCH(t, p, i, body) \ + NESTED_TEMPLATE_DISPATCH_FP(t, p, i, body) \ + else NESTED_TEMPLATE_DISPATCH_I(t, p, i, body) + + + +/// A type agnostic container for array based data. +/** See #TEMPLATE_DISPATCH and #NESTED_TEMPLATE_DISPATCH for details on how to + * apply type specific code to an instance of teca_variant_array. + */ class teca_variant_array : public std::enable_shared_from_this { public: @@ -55,12 +303,12 @@ class teca_variant_array : public std::enable_shared_from_thisswap(other); return *this; } - // virtual constructor. return a new'ly allocated + // virtual constructor. return a newly allocated // empty object of the same type. virtual p_teca_variant_array new_instance() const = 0; virtual p_teca_variant_array new_instance(size_t n) const = 0; - // virtual copy construct. return a new'ly allocated object, + // virtual copy construct. return a newly allocated object, // initialized copy from this. caller must delete. virtual p_teca_variant_array new_copy() const = 0; virtual p_teca_variant_array new_copy(size_t start, size_t end) const = 0; @@ -119,7 +367,7 @@ class teca_variant_array : public std::enable_shared_from_thisappend(*other.get()); } // swap the contents of this and the other object. - // an excpetion is thrown when no conversion + // an exception is thrown when no conversion // between the two types exists. virtual void swap(teca_variant_array &other) = 0; void swap(const p_teca_variant_array &other) @@ -232,7 +480,7 @@ class teca_variant_array : public std::enable_shared_from_this @@ -259,86 +507,98 @@ struct pack_object !std::is_pointer::value && !pack_object_ptr::value> {}; +/// @endcond - -// implementation of our type agnostic container -// for simple arrays +/** @brief + * The concrete implementation of our type agnostic container for contiguous + * arrays. + */ template class teca_variant_array_impl : public teca_variant_array { public: - // construct + /** @name Array constructors + * Constructs a new instance containing the templated type. + */ + ///@{ TECA_VARIANT_ARRAY_STATIC_NEW(teca_variant_array_impl, T) - // destruct - virtual ~teca_variant_array_impl() noexcept; - - // virtual constructor + /// Returns a new instance initialized with a copy of this one. 
p_teca_variant_array new_copy() const override; + + /// Returns a new instance initialized with a copy of a subset of this one. p_teca_variant_array new_copy(size_t start, size_t end) const override; + + /// Returns a new instance of the same type. p_teca_variant_array new_instance() const override; + + /// Returns a new instance of the same type sized to hold n elements. p_teca_variant_array new_instance(size_t n) const override; + ///@} - // return the name of the class in a human readable form + virtual ~teca_variant_array_impl() noexcept; + + /// Returns the name of the class in a human readable form std::string get_class_name() const override; - // intialize with T() + /// Initialize all elements with T() void initialize() override; - // copy + /// Copy from the other array const teca_variant_array_impl & operator=(const teca_variant_array_impl &other); + /// Copy from the other array template const teca_variant_array_impl & operator=(const teca_variant_array_impl &other); - // move + /// Move the contents of the other array teca_variant_array_impl(teca_variant_array_impl &&other); + /// Move the contents of the other array const teca_variant_array_impl & operator=(teca_variant_array_impl &&other); - // get the ith value + /// Get the ith value T &get(unsigned long i) { return m_data[i]; } + /// Get the ith value const T &get(unsigned long i) const { return m_data[i]; } - // get the ith value + /// Get the ith value template void get(unsigned long i, U &val) const; - // get a range of values decribed by [start end] + // get a range of values described by [start end] // inclusive template void get(size_t start, size_t end, U *vals) const; - // copy the data out into the passed in vector + /// Copy the data out into the passed in vector template void get(std::vector &val) const; - // pointer to the data + /// Get a pointer to the data T *get(){ return &m_data[0]; } const T *get() const { return &m_data[0]; } - // set the ith value + /// Set the ith value template void set(unsigned long i, const U &val); - // set a range opf values described by [start end] - // inclusive + /// Set a range of values described by [start end] inclusive template void set(size_t start, size_t end, const U *vals); - // copy data, replacing contents with the passed in - // vector + /// Copy data, replacing contents with the passed in vector template void set(const std::vector &val); - // insert from the passed in vector at the back + /// Insert from the passed in vector at the back template void append(const std::vector &val); @@ -346,54 +606,57 @@ class teca_variant_array_impl : public teca_variant_array template void append(const U &val); - // get the current size of the data + /// Get the current size of the data virtual unsigned long size() const noexcept override; - // resize the data + /// Resize the data virtual void resize(unsigned long n) override; void resize(unsigned long n, const T &val); - // reserve space + /// Reserve space virtual void reserve(unsigned long n) override; - // clear the data + /// Clear the data virtual void clear() noexcept override; - // copy. This method is not virtual so that - // string can be handled as a special case in - // the base class. + /** copy. This method is not virtual so that string can be handled as a + * special case in the base class. + */ void copy(const teca_variant_array &other); - // append. This method is not virtual so that - // string can be handled as a special case in - // the base class. + /** append. 
This method is not virtual so that + * string can be handled as a special case in the base class. + */ void append(const teca_variant_array &other); - // virtual swap + /// virtual swap void swap(teca_variant_array &other) override; - // virtual equavalince test + /// virtual equivalence test bool equal(const teca_variant_array &other) const override; - // serialize to/from stream + /// Serialize to the stream int to_stream(teca_binary_stream &s) const override { this->to_binary(s); return 0; } + /// Deserialize from the stream int from_stream(teca_binary_stream &s) override { this->from_binary(s); return 0; } + /// Serialize to the stream int to_stream(std::ostream &s) const override { this->to_ascii(s); return 0; } + /// Deserialize from the stream int from_stream(std::ostream &s) override { this->from_ascii(s); @@ -448,7 +711,7 @@ class teca_variant_array_impl : public teca_variant_array void from_binary(teca_binary_stream &s, typename std::enable_if::value, U>::type* = 0); - // tag dispatch array of poniter to other objects + // tag dispatch array of pointer to other objects template void to_binary(teca_binary_stream &s, typename std::enable_if::value, U>::type* = 0) @@ -488,7 +751,7 @@ class teca_variant_array_impl : public teca_variant_array void from_ascii(std::ostream &s, typename std::enable_if::value, U>::type* = 0); - // for serializaztion + // for serialization unsigned int type_code() const noexcept override; private: std::vector m_data; @@ -497,119 +760,9 @@ class teca_variant_array_impl : public teca_variant_array template friend class teca_variant_array_impl; }; - #pragma GCC diagnostic ignored "-Wunknown-pragmas" #pragma GCC diagnostic ignored "-Wunused-local-typedefs" -// tt - derived container -// nt - contained type -// tt - complete derived type -// p - base class pointer -// body - code to execute -#define TEMPLATE_DISPATCH_CASE(tt, nt, p, body) \ - if (dynamic_cast*>(p)) \ - { \ - using TT = tt; \ - using NT = nt; \ - body \ - } - -// tt - derived container -// nt - contained type -// tt - complete derived type -// p - base class pointer -// i - id suffix -// body - code to execute -#define NESTED_TEMPLATE_DISPATCH_CASE(tt, nt, p, i, body) \ - if (dynamic_cast*>(p)) \ - { \ - using TT##i = tt; \ - using NT##i = nt; \ - body \ - } - -// variant that limits dispatch to floating point types -// for use in numerical compuatation where integer types -// are not supported (ie, math operations from std library) -#define TEMPLATE_DISPATCH_FP(t, p, body) \ - TEMPLATE_DISPATCH_CASE(t, float, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, double, p, body) - -// variant that limits dispatch to signed integer types -// for use in numerical compuatation where signed integer types -// are not supported -#define TEMPLATE_DISPATCH_SI(t, p, body) \ - TEMPLATE_DISPATCH_CASE(t, long long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, short int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, char, p, body) - -// variant that limits dispatch to floating point types -// for use in numerical compuatation where integer types -// are not supported (ie, math operations from std library) -#define TEMPLATE_DISPATCH_FP_SI(t, p, body) \ - TEMPLATE_DISPATCH_CASE(t, float, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, double, p, body) \ - else TEMPLATE_DISPATCH_SI(t, p, body) - -// variant that limits dispatch to integer types -// for use in numerical compuatation where floating point types -// are not supported 
-#define TEMPLATE_DISPATCH_I(t, p, body) \ - TEMPLATE_DISPATCH_CASE(t, long long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, unsigned long long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, unsigned int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, unsigned long, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, short int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, short unsigned int, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, char, p, body) \ - else TEMPLATE_DISPATCH_CASE(t, unsigned char, p, body) - -// macro for helping downcast to POD types -// don't add classes to this. -// t - derived container type -// p - pointer to base class -// body - code to execute on match -#define TEMPLATE_DISPATCH(t, p, body) \ - TEMPLATE_DISPATCH_FP(t, p, body) \ - else TEMPLATE_DISPATCH_I(t, p, body) - -// variant that limits dispatch to floating point types -// for use in numerical compuatation where integer types -// are not supported (ie, math operations from std library) -#define NESTED_TEMPLATE_DISPATCH_FP(t, p, i, body) \ - NESTED_TEMPLATE_DISPATCH_CASE(t, float, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, double, p, i, body) - -// variant that limits dispatch to integer types -// for use in numerical compuatation where integer types -// are not supported (ie, math operations from std library) -#define NESTED_TEMPLATE_DISPATCH_I(t, p, i, body) \ - NESTED_TEMPLATE_DISPATCH_CASE(t, long long, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned long long, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, long, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, int, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned int, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned long, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, short int, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, short unsigned int, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, char, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_CASE(t, unsigned char, p, i, body) - -// macro for helping downcast to POD types -// don't add classes to this. -// t - templated derived type -// p - base class pointer -// i - id for nesting -// body - code to execute on match -#define NESTED_TEMPLATE_DISPATCH(t, p, i, body) \ - NESTED_TEMPLATE_DISPATCH_FP(t, p, i, body) \ - else NESTED_TEMPLATE_DISPATCH_I(t, p, i, body) - - // -------------------------------------------------------------------------- template void teca_variant_array::get_dispatch(std::vector &vals, @@ -1243,6 +1396,7 @@ void teca_variant_array_impl::from_ascii( // TODO } +/// @cond template struct teca_variant_array_code {}; @@ -1256,7 +1410,7 @@ struct teca_variant_array_type {}; template <> \ struct teca_variant_array_code \ { \ - static unsigned int get() noexcept \ + static constexpr unsigned int get() \ { return v; } \ }; \ template <> \ @@ -1269,6 +1423,9 @@ template <> \ struct teca_variant_array_type \ { \ using type = T; \ + \ + static constexpr const char *name() \ + { return #T; } \ }; #define TECA_VARIANT_ARRAY_FACTORY_NEW(_v) \ @@ -1293,7 +1450,9 @@ TECA_VARIANT_ARRAY_TT_SPEC(double, 12) TECA_VARIANT_ARRAY_TT_SPEC(std::string, 13) TECA_VARIANT_ARRAY_TT_SPEC(teca_metadata, 14) TECA_VARIANT_ARRAY_TT_SPEC(p_teca_variant_array, 15) +/// @endcond +/// Creates an instance of teca_variant_array_impl where T is determined from the type code. 
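+///
+/// For example, a minimal sketch that reconstructs an array from a serialized
+/// type code (variable names are illustrative):
+///
+/// @code
+/// unsigned int code = teca_variant_array_code<double>::get();
+/// p_teca_variant_array a = teca_variant_array_factory::New(code);
+/// @endcode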
struct teca_variant_array_factory { static p_teca_variant_array New(unsigned int type_code) @@ -1324,6 +1483,7 @@ struct teca_variant_array_factory } }; +/// @cond #define CODE_DISPATCH_CASE(_v, _c, _code) \ if (_v == _c) \ { \ @@ -1357,6 +1517,7 @@ struct teca_variant_array_factory CODE_DISPATCH_I(_v, _code) \ else CODE_DISPATCH_FP(_v, _code) +/// @endcond // -------------------------------------------------------------------------- template diff --git a/core/teca_variant_array_fwd.h b/core/teca_variant_array_fwd.h deleted file mode 100644 index 734f640c5..000000000 --- a/core/teca_variant_array_fwd.h +++ /dev/null @@ -1,107 +0,0 @@ -#ifndef teca_variant_array_fwd_h -#define teca_variant_array_fwd_h - -#include -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_variant_array) -TECA_SHARED_OBJECT_TEMPLATE_FORWARD_DECL(teca_variant_array_impl) - -#ifndef SWIG -// convenience defs for POD types -// these should not be used in API, use teca_variant_array instead -using teca_string_array = teca_variant_array_impl; -using p_teca_string_array = std::shared_ptr>; -using const_p_teca_string_array = std::shared_ptr>; - -using teca_float_array = teca_variant_array_impl; -using p_teca_float_array = std::shared_ptr>; -using const_p_teca_float_array = std::shared_ptr>; - -using teca_double_array = teca_variant_array_impl; -using p_teca_double_array = std::shared_ptr>; -using const_p_teca_double_array = std::shared_ptr>; - -using teca_char_array = teca_variant_array_impl; -using p_teca_char_array = std::shared_ptr>; -using const_p_teca_char_array = std::shared_ptr>; - -using teca_unsigned_char_array = teca_variant_array_impl; -using p_teca_unsigned_char_array = std::shared_ptr>; -using const_p_teca_unsigned_char_array = std::shared_ptr>; - -using teca_short_array = teca_variant_array_impl; -using p_teca_short_array = std::shared_ptr>; -using const_p_teca_short_array = std::shared_ptr>; - -using teca_unsigned_short_array = teca_variant_array_impl; -using p_teca_unsigned_short_array = std::shared_ptr>; -using const_p_teca_unsigned_short_array = std::shared_ptr>; - -using teca_int_array = teca_variant_array_impl; -using p_teca_int_array = std::shared_ptr>; -using const_p_teca_int_array = std::shared_ptr>; - -using teca_unsigned_int_array = teca_variant_array_impl; -using p_teca_unsigned_int_array = std::shared_ptr>; -using const_p_teca_unsigned_int_array = std::shared_ptr>; - -using teca_long_array = teca_variant_array_impl; -using p_teca_long_array = std::shared_ptr>; -using const_p_teca_long_array = std::shared_ptr>; - -using teca_unsigned_long_array = teca_variant_array_impl; -using p_teca_unsigned_long_array = std::shared_ptr>; -using const_p_teca_unsigned_long_array = std::shared_ptr>; - -using teca_long_long_array = teca_variant_array_impl; -using p_teca_long_long_array = std::shared_ptr>; -using const_p_teca_long_long_array = std::shared_ptr>; - -using teca_unsigned_long_long_array = teca_variant_array_impl; -using p_teca_unsigned_long_long_array = std::shared_ptr>; -using const_p_teca_unsigned_long_long_array = std::shared_ptr>; - -using teca_size_t_array = teca_variant_array_impl; -using p_teca_size_t_array = std::shared_ptr>; -using const_p_teca_size_t_array = std::shared_ptr>; -#endif - -// this is a convenience macro to be used to declare a static -// New method that will be used to construct new objects in -// shared_ptr's. 
This manages the details of interoperability -// with std C++11 shared pointer -#define TECA_VARIANT_ARRAY_STATIC_NEW(T, t) \ - \ -static std::shared_ptr> New() \ -{ \ - return std::shared_ptr>(new T); \ -} \ - \ -static std::shared_ptr> New(size_t n) \ -{ \ - return std::shared_ptr>(new T(n)); \ -} \ - \ -static std::shared_ptr> New(size_t n, const t &v) \ -{ \ - return std::shared_ptr>(new T(n, v)); \ -} \ - \ -static std::shared_ptr> New(const t *vals, size_t n) \ -{ \ - return std::shared_ptr>(new T(vals, n)); \ -} \ - \ -using teca_variant_array::shared_from_this; \ - \ -std::shared_ptr shared_from_this() \ -{ \ - return std::static_pointer_cast(shared_from_this()); \ -} \ - \ -std::shared_ptr shared_from_this() const \ -{ \ - return std::static_pointer_cast(shared_from_this()); \ -} -#endif diff --git a/data/CMakeLists.txt b/data/CMakeLists.txt index 22c186805..72532f094 100644 --- a/data/CMakeLists.txt +++ b/data/CMakeLists.txt @@ -9,6 +9,7 @@ set(teca_data_srcs teca_arakawa_c_grid.cxx teca_array_attributes.cxx teca_array_collection.cxx + teca_calendar_util.cxx teca_cartesian_mesh.cxx teca_coordinate_util.cxx teca_curvilinear_mesh.cxx diff --git a/data/teca_arakawa_c_grid.h b/data/teca_arakawa_c_grid.h index f7e695a62..8d08eb446 100644 --- a/data/teca_arakawa_c_grid.h +++ b/data/teca_arakawa_c_grid.h @@ -11,56 +11,60 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_arakawa_c_grid) -/// data on an Arkawa C Grid -// -// The C grid is defined by combinations of horizontal and vertical centerings. -// -// The horzontal centerings occur at so called mass or M points, U points, and -// V points. These centerings are depicted in the following diagram: -// -// *-------V-------* -// | | -// | | -// | | -// U M U -// | | -// | | -// | | -// *-------V-------* -// -// The horizontal coordinates are stored in 2d arrays. Assuming the mass -// corrinate arrays have dimension [nx, ny], then the U coordinate arrays have -// dimension [nx + 1, ny], and the V coordinate arrays have dimension -// [nx, ny + 1]. -// -// The vertical centerings occur at so called mass and w points -// -// *-------W-------* -// | | -// | | -// | | -// | M | -// | | -// | | -// | | -// *-------W-------* -// -// The vertical coordinates are stored in 1d arrays. Assuming the M vertical -// coordinate has the dimension [nz], then the W coordinate has dimension -// [nz + 1]. -// -// The 3d mesh dimensions can be obtained from mesh metadata, as well as coordinate -// array names, and array attributes describing the data type, units, etc. -// -// Variables may exist on one of a number of permutations of horizontal and -// vertical centerings, array attributes contains the centering metadata. -// -// See also: -// "A Description of the Advanced Research WRF Model Version 4", -// NCAR/TN-556+STR -// -// "Grids in Numerical Weather and Climate Models" -// http://dx.doi.org/10.5772/55922 +/// A representation of mesh based data on an Arkawa C Grid. +/** + * The Arakawa C grid is defined by various combinations of horizontal and + * vertical centerings. + * + * The horizontal centerings occur at so called mass or M points, U points, + * and V points. These centerings are depicted in the following diagram: + * + * > *-------V-------* + * > | | + * > | | + * > | | + * > U M U + * > | | + * > | | + * > | | + * > *-------V-------* + * + * The horizontal coordinates are stored in 2d arrays. 
Assuming the mass + * coordinate arrays have dimension [nx, ny], then the U coordinate arrays + * have dimension [nx + 1, ny], and the V coordinate arrays have dimension + * [nx, ny + 1]. + * + * The vertical centerings occur at so called M points and W points. These + * centerings are depicted in the following diagram. + * + * > *-------W-------* + * > | | + * > | | + * > | | + * > | M | + * > | | + * > | | + * > | | + * > *-------W-------* + * + * The vertical coordinates are stored in 1d arrays. Assuming the M vertical + * coordinate has the dimension [nz], then the W coordinate has dimension + * [nz + 1]. + * + * The 3d mesh dimensions can be obtained from mesh metadata, as well as + * coordinate array names, and array attributes describing the data type, + * units, etc. + * + * Variables may exist on one of a number of permutations of horizontal and + * vertical centerings, array attributes contains the centering metadata. + * + * See also: + * "A Description of the Advanced Research WRF Model Version 4", + * NCAR/TN-556+STR + * + * "Grids in Numerical Weather and Climate Models" + * http://dx.doi.org/10.5772/55922 + */ class teca_arakawa_c_grid : public teca_mesh { public: @@ -75,7 +79,7 @@ class teca_arakawa_c_grid : public teca_mesh TECA_DATASET_METADATA(extent, unsigned long, 6) TECA_DATASET_METADATA(bounds, double, 6) - // flag set if the boundary in the given direction is perdiodic + // flag set if the boundary in the given direction is periodic TECA_DATASET_METADATA(periodic_in_x, int, 1) TECA_DATASET_METADATA(periodic_in_y, int, 1) TECA_DATASET_METADATA(periodic_in_z, int, 1) diff --git a/data/teca_array_attributes.cxx b/data/teca_array_attributes.cxx index b1b8fcd72..a1191bcbf 100644 --- a/data/teca_array_attributes.cxx +++ b/data/teca_array_attributes.cxx @@ -149,7 +149,7 @@ int teca_array_attributes::from(const teca_metadata &md) } // -------------------------------------------------------------------------- -void teca_array_attributes::to_stream(std::ostream &os) +void teca_array_attributes::to_stream(std::ostream &os) const { os << "type_code=" << type_code << ", centering=" << centering << ", size=" << size << ", units=\"" << units @@ -171,3 +171,49 @@ void teca_array_attributes::to_stream(std::ostream &os) os << "None"; } } + +// -------------------------------------------------------------------------- +const char *teca_array_attributes::centering_to_string(int cen) +{ + const char *cen_str = "invalid"; + switch (cen) + { + case cell_centering: + cen_str = "cell"; + break; + + case x_face_centering: + cen_str = "x-face"; + break; + + case y_face_centering: + cen_str = "y-face"; + break; + + case z_face_centering: + cen_str = "z-face"; + break; + + case x_edge_centering: + cen_str = "x-edge"; + break; + + case y_edge_centering: + cen_str = "y-edge"; + break; + + case z_edge_centering: + cen_str = "z-edge"; + break; + + case point_centering: + cen_str = "point"; + break; + + case no_centering: + cen_str = "none"; + break; + } + + return cen_str; +} diff --git a/data/teca_array_attributes.h b/data/teca_array_attributes.h index c7b976003..5052da669 100644 --- a/data/teca_array_attributes.h +++ b/data/teca_array_attributes.h @@ -6,26 +6,25 @@ #include #include -// a convenience container for conventional array attributes. -// the attributes listed here are used for CF I/O. 
-// -// type_code - storage type as defined by teca_variant_array::type_code() -// -// centering - one of: no_centering, point_centering, cell_centering, -// edge_centering, or face_centering -// -// size - number of elements in the array -// -// units - string describing the uints that the variable is in. -// -// long name - a more descriptive name -// -// description - text describing the data -// -// have_fill_value - set non-zero to indicate that a fill_value -// has been provided. -// -// fill_value - value used to identify missing or invalid data +/** @brief + * A convenience container for conventional array attributes necessary and/or + * useful when producing NetCDF CF format files using the teca_cf_writer. + * + * @details + * + * | Member | Description | + * | ------ | ----------- | + * | type_code | storage type as defined by teca_variant_array::type_code() | + * | centering | one of: no_centering, point_centering, cell_centering, | + * | | edge_centering, or face_centering | + * | size | number of elements in the array | + * | units | string describing the units that the variable is in. | + * | long name | a more descriptive name | + * | description | text describing the data | + * | have_fill_value | set non-zero to indicate that a fill_value has been | + * | | provided. | + * | fill_value | value used to identify missing or invalid data | + */ struct teca_array_attributes { teca_array_attributes() : type_code(0), @@ -44,7 +43,7 @@ struct teca_array_attributes teca_array_attributes(const teca_array_attributes &) = default; teca_array_attributes &operator=(const teca_array_attributes &) = default; - // converts from metadata object. + /// Convert a from metadata object. teca_array_attributes(const teca_metadata &md) : type_code(0), centering(0), size(0), units(), long_name(), description(), have_fill_value(0), fill_value(1.e20f) @@ -52,47 +51,47 @@ struct teca_array_attributes from(md); } - // convert from metadata object + /// Convert from metadata object. teca_array_attributes &operator=(const teca_metadata &md); - // converts to a metadata object + /// Converts to a metadata object. operator teca_metadata() const; - // adds current values to the metadata object + /// Adds current values to the metadata object int to(teca_metadata &md) const; - // adds current values to the metadata object, - // only if they don't exist + /// Adds the current values to the metadata object, only if they don't exist. int merge_to(teca_metadata &md) const; - // intializes values from the metadata object + /// Intializes values from the metadata object. int from(const teca_metadata &md); - // send to the stream in human readable form - void to_stream(std::ostream &os); - - // possible centrings - // - // for coordinate system with orthogonal axes x,y,z - // relative to cell centering: - // - // If A is one of x,y or z then A_face_centering data is located on the - // low A face i.e. shifted in the -A direction and arrays will be longer - // by 1 value in the A direction. - // - // If A is one of x,y or z then A_edge_centering data is located on the - // low side edge parallel to A corrdinate axis. i.e. shifted in the -B - // and -C directions and arrays will be longer by 1 value in the B and C - // directions. - // - // point_centering data is located on the low corner. i.e. shifted - // in the -A,-B, and -C directions and arrays will be longer - // by 1 value in the A, B and C directions. - // - // arrays that are not associated with geometric locations should - // be identified as no_centering. 
- // - // the default centering is cell centering. + /// Send to the stream in human readable form. + void to_stream(std::ostream &os) const; + + /** The possible mesh centrings. + * + * For coordinate system with orthogonal axes x,y,z relative to cell + * centering: + * + * > If A is one of x,y or z then A_face_centering data is located on the + * > low A face i.e. shifted in the -A direction and arrays will be longer + * > by 1 value in the A direction. + * > + * > If A is one of x,y or z then A_edge_centering data is located on the + * > low side edge parallel to A corrdinate axis. i.e. shifted in the -B + * > and -C directions and arrays will be longer by 1 value in the B and C + * > directions. + * > + * > point_centering data is located on the low corner. i.e. shifted + * > in the -A,-B, and -C directions and arrays will be longer + * > by 1 value in the A, B and C directions. + * + * Arrays that are not associated with geometric locations should + * be identified as no_centering. + * + * The default centering is cell centering. + */ enum { invalid_value = 0, @@ -107,6 +106,9 @@ struct teca_array_attributes no_centering = 0x1000, }; + /// convert the centering code to a string + static const char *centering_to_string(int cen); + using fill_value_t = std::variant #include #include -// a collection of named arrays -/** -A collection of named arrays -*/ +TECA_SHARED_OBJECT_FORWARD_DECL(teca_array_collection) + +/// A collection of named arrays. class teca_array_collection { public: - // construct on heap + + /// construct on heap static p_teca_array_collection New() { return p_teca_array_collection(new teca_array_collection()); } - // reset to empty state + /// reset to empty state void clear(); - // declare a set of arrays. requires name,type pairs - // for ex. define("c1",int(),"c2",float()) creates - // 2 arrays in the collection the first storing int's - // the second storing float's. + /** declare a set of arrays. requires name,type pairs for ex. + * define("c1",int(),"c2",float()) creates 2 arrays in the collection the + * first storing int the second storing float. + */ template void declare_set(nT &&a_name, aT a_type, oT &&...args); - // declare a single array + /// declare a single array template void declare(nT &&a_name, aT a_type); - // add, return the index of the new entry. - // or -1 if the array name already exists. + /** add, return the index of the new entry, or -1 if the array name already + * exists. + */ int append(p_teca_variant_array array); + + /** add, return the index of the new entry, or -1 if the array name already + * exists. + */ int append(const std::string &name, p_teca_variant_array array); - // set, return 0 on success. + /** replace the ith array, return 0 on success. the name of the array is + * not changed. + */ int set(unsigned int i, p_teca_variant_array array); + + /// add or replace the named array, returns 0 on success. 
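+    ///
+    /// A brief usage sketch (the array name and contents are illustrative):
+    /// @code
+    /// p_teca_array_collection col = teca_array_collection::New();
+    /// col->set("temperature", teca_double_array::New(100, 0.0));
+    /// p_teca_variant_array temp = col->get("temperature");
+    /// @endcode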
int set(const std::string &name, p_teca_variant_array array); - // remove + /// remove the ith array int remove(unsigned int i); + + /// remove the named array int remove(const std::string &name); - // number of + /// Return the number of arrays unsigned int size() const noexcept { return m_arrays.size(); } - // access by id + /// access an array by its by id p_teca_variant_array get(unsigned int i) { return m_arrays[i]; } + /// access an array by its by id const_p_teca_variant_array get(unsigned int i) const { return m_arrays[i]; } - // test for array + /// test for array bool has(const std::string &name) const; - // access by name + /// access an array by name p_teca_variant_array get(const std::string &name); + + /// access an array by name const_p_teca_variant_array get(const std::string &name) const; + /// access an array by name p_teca_variant_array operator[](const std::string &name) { return this->get(name); } + /// access an array by name const_p_teca_variant_array operator[](const std::string &name) const { return this->get(name); } - // access names + // Get the name of the ith array std::string &get_name(unsigned int i) { return m_names[i]; } + // Get the name of the ith array const std::string &get_name(unsigned int i) const { return m_names[i]; } - // return a unique string identifier + // Get the list of names + std::vector &get_names() + { return m_names; } + + // Get the list of names + const std::vector &get_names() const + { return m_names; } + + /// Return the name of the class std::string get_class_name() const { return "teca_array_collection"; } - // return an integer identifier uniquely naming the dataset type + /// return an integer identifier uniquely naming the dataset type int get_type_code() const { return -1; } - // copy + /// copy void copy(const const_p_teca_array_collection &other); + + /// shallow copy void shallow_copy(const p_teca_array_collection &other); - // append + /// append int append(const const_p_teca_array_collection &other); + + /// shallow append int shallow_append(const p_teca_array_collection &other); - // swap + /// swap void swap(p_teca_array_collection &other); - // serialize the data to/from the given stream - // for I/O or communication + /// serialize the data to the given stream for I/O or communication int to_stream(teca_binary_stream &s) const; + + /// serialize the data from the given stream for I/O or communication int from_stream(teca_binary_stream &s); - // stream to/from human readable representation + /// stream to a human readable representation int to_stream(std::ostream &) const; protected: diff --git a/data/teca_array_collection_fwd.h b/data/teca_array_collection_fwd.h deleted file mode 100644 index d014188c4..000000000 --- a/data/teca_array_collection_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_array_collection_fwd_h -#define teca_array_collection_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_array_collection) - -#endif diff --git a/data/teca_calendar_util.cxx b/data/teca_calendar_util.cxx new file mode 100644 index 000000000..5d8954faa --- /dev/null +++ b/data/teca_calendar_util.cxx @@ -0,0 +1,857 @@ +#include "teca_calendar_util.h" + +#include "teca_common.h" +#include "teca_variant_array.h" +#include "teca_coordinate_util.h" +#include "teca_calcalcs.h" + +#include + +// TODO - With 23:59:59, sometimes we select the next day. What is the right +// end-of-day time so that all use cases are satisfied without selecting the +// next day? 
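+//
+// END_OF_DAY gives the time of day used when locating the last time step of
+// an interval in the get_next_interval() implementations below.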
+#define END_OF_DAY_HH 23 +#define END_OF_DAY_MM 30 +#define END_OF_DAY_SS 0 +#define END_OF_DAY "23:30:00" + +// -------------------------------------------------------------------------- +std::ostream &operator<<(std::ostream &os, + const teca_calendar_util::time_point &tpt) +{ + os << "time[" << tpt.index << "] = " << tpt.time << ", \"" + << tpt.year << "-" << tpt.month << "-" + << tpt.day << " " << tpt.hour << ":" << tpt.minute + << ":" << tpt.second << "\""; + return os; +} + + + +namespace teca_calendar_util +{ + +// ************************************************************************** +long gregorian_number(long y, long m, long d) +{ + m = (m + 9) % 12; + y = y - m/10; + return 365*y + y/4 - y/100 + y/400 + (m*306 + 5)/10 + (d - 1); +} + +// ************************************************************************** +void date_from_gregorian_number(long g, long &y, long &m, long &d) +{ + y = (10000*g + 14780)/3652425; + long ddd = g - (365*y + y/4 - y/100 + y/400); + if (ddd < 0) + { + y = y - 1; + ddd = g - (365*y + y/4 - y/100 + y/400); + } + + long mi = (100*ddd + 52)/3060; + + m = (mi + 2)%12 + 1; + y = y + (mi + 2)/12; + d = ddd - (mi*306 + 5)/10 + 1; +} + +// ************************************************************************** +bool valid_gregorian_date(long y, long m, long d) +{ + long g = gregorian_number(y,m,d); + if (g < 578027) // 578027 = gergorian_number(1582,10,1); + return false; + + long yy, mm, dd; + date_from_gregorian_number(g, yy, mm, dd); + + if ((y != yy) || (m != mm) || (d != dd)) + return false; + + return true; +} + + +/// returns one of DJF,MAM,JJA,SON based on the month passed in +const char *get_season_name(int month) +{ + if ((month == 12) || ((month >= 1) && (month <= 2))) + { + return "DJF"; + } + else if ((month >= 3) && (month <= 5)) + { + return "MAM"; + } + else if ((month >= 6) && (month <= 8)) + { + return "JJA"; + } + else if ((month >= 9) && (month <= 11)) + { + return "SON"; + } + + TECA_ERROR("Failed to get the season name for month " << month) + return "invalid"; +} + +// -------------------------------------------------------------------------- +time_point::time_point(long i, double t, const std::string &units, + const std::string &calendar) : index(i), time(t), year(0), month(0), + day(0), hour(0), minute(0), second(0) + +{ + if (teca_calcalcs::date(t, &this->year, &this->month, &this->day, + &this->hour, &this->minute, &this->second, units.c_str(), + calendar.c_str())) + { + TECA_ERROR("Failed to convert the time value " << t + << " \"" << units << "\" in the \"" << calendar << "\"") + } +} + +// -------------------------------------------------------------------------- +bool season_iterator::is_valid() const +{ + if (!this->valid) + return false; + + // get the end of the current season + int ey = -1; + int em = -1; + int ed = -1; + if (this->get_season_end(this->year, this->month, ey, em, ed)) + { + TECA_ERROR("Failed to get season end") + return false; + } + + // verify that we have data for the current season + if ((ey > this->end.year) || + ((ey == this->end.year) && (em > this->end.month)) || + ((ey == this->end.year) && (em == this->end.month) && + (ed > this->end.day))) + { + return false; + } + + return true; +} + +// -------------------------------------------------------------------------- +int season_iterator::initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) +{ + this->time = t; + this->units = units; + this->calendar = 
calendar; + + if (t->size() == 0) + { + TECA_ERROR("The array of time values can't be empty") + return -1; + } + + if (first_step >= (long)t->size()) + { + TECA_ERROR("first_step " << first_step + << " output of bounds with " << t->size() << " time values") + return -1; + } + + if (last_step < 0) + last_step = t->size() - 1; + + if ((last_step < first_step) || (last_step >= (long)t->size())) + { + TECA_ERROR("invalid last_step " << last_step << " with first_step " + << first_step << " and " << t->size() << " time values") + return -1; + } + + // initialize the time range to iterate over + TEMPLATE_DISPATCH(const teca_variant_array_impl, + t.get(), + + const NT *p_t = dynamic_cast(t.get())->get(); + + this->begin = time_point(first_step, p_t[first_step], this->units, this->calendar); + this->end = time_point(last_step, p_t[last_step], this->units, this->calendar); + ) + + // skip ahead to the first season. + if (this->get_first_season(this->begin.year, + this->begin.month, this->year, this->month)) + { + TECA_ERROR("Failed to determine the first season") + return -1; + } + + this->valid = true; + + return 0; +} + + +// -------------------------------------------------------------------------- +int season_iterator::get_first_season(int y_in, int m_in, int &y_out, + int &m_out) const +{ + if ((m_in == 12) or (m_in == 3) or (m_in == 6) or (m_in == 9)) + { + y_out = y_in; + m_out = m_in; + return 0; + } + + return this->get_next_season(y_in, m_in, y_out, m_out); +} + +// -------------------------------------------------------------------------- +int season_iterator::get_season_end(int y_in, int m_in, int &y_out, + int &m_out, int &d_out) const +{ + if (m_in == 12) + { + y_out = y_in + 1; + m_out = 2; + } + else if ((m_in >= 1) and (m_in <= 2)) + { + y_out = y_in; + m_out = 2; + } + else if ((m_in >= 3) and (m_in <= 5)) + { + y_out = y_in; + m_out = 5; + } + else if ((m_in >= 6) and (m_in <= 8)) + { + y_out = y_in; + m_out = 8; + } + else if ((m_in >= 9) and (m_in <= 11)) + { + y_out = y_in; + m_out = 11; + } + else + { + TECA_ERROR("Failed to get the end of the season from month " + << m_in) + return -1; + } + + if (teca_calcalcs::days_in_month(this->calendar.c_str(), + this->units.c_str(), y_out, m_out, d_out)) + { + TECA_ERROR("Failed to get the last day of the month " + << y_out << " " << m_out) + return -1; + } + + return 0; +} + +// -------------------------------------------------------------------------- +int season_iterator::get_next_season(int y_in, int m_in, int &y_out, + int &m_out) const +{ + if (m_in == 12) + { + y_out = y_in + 1; + m_out = 3; + } + else if ((m_in >= 1) and (m_in <= 2)) + { + y_out = y_in; + m_out = 3; + } + else if ((m_in >= 3) and (m_in <= 5)) + { + y_out = y_in; + m_out = 6; + } + else if ((m_in >= 6) and (m_in <= 8)) + { + y_out = y_in; + m_out = 9; + } + else if ((m_in >= 9) and (m_in <= 11)) + { + y_out = y_in; + m_out = 12; + } + else + { + TECA_ERROR("Failed to get the next season from m_in " + << m_in) + return -1; + } + + return 0; +} + +// -------------------------------------------------------------------------- +int season_iterator::get_next_interval(time_point &first_step, + time_point &last_step) +{ + // get the end of the current season + int end_year = -1; + int end_month = -1; + int end_day = -1; + if (this->get_season_end(this->year, this->month, end_year, end_month, end_day)) + { + TECA_ERROR("Failed to get season end") + return -1; + } + + // verify that we have data for the current season + if ((end_year > this->end.year) || + ((end_year == 
this->end.year) && (end_month > this->end.month)) || + ((end_year == this->end.year) && (end_month == this->end.month) && + (end_day > this->end.day))) + { + return -1; + } + + // find the time step of the first day + int sy = this->year; + int sm = this->month; + + char t0[21] = {'\0'}; + snprintf(t0, 21, "%04d-%02d-01 00:00:00", this->year, this->month); + + unsigned long i0 = 0; + if (teca_coordinate_util::time_step_of(this->time, + false, true, this->calendar, this->units, t0, i0)) + { + TECA_ERROR("Failed to get the tme step of " << t0) + return -1; + } + + double ti = 0.0; + this->time->get(i0, ti); + first_step = time_point(i0, ti, this->year, this->month); + + // find the time step of the last day + char t1[21] = {'\0'}; + snprintf(t1, 21, "%04d-%02d-%02d " END_OF_DAY, end_year, end_month, end_day); + + unsigned long i1 = 0; + if (teca_coordinate_util::time_step_of(this->time, + true, true, this->calendar, this->units, t1, i1)) + { + TECA_ERROR("Failed to get the time step of " << t1) + return -1; + } + + this->time->get(i1, ti); + last_step = time_point(i1, ti, end_year, end_month, + end_day, END_OF_DAY_HH, END_OF_DAY_MM, END_OF_DAY_SS); + + // move to next season + if (this->get_next_season(sy, sm, this->year, this->month)) + { + TECA_ERROR("Failed to get the next season from " + << sy << "-" << sm) + return -1; + } + + if (!this->is_valid()) + this->valid = false; + + return 0; +} + +// -------------------------------------------------------------------------- +bool year_iterator::is_valid() const +{ + if (!this->valid) + return false; + + // check for more months to process + if (this->year > this->end.year) + { + return false; + } + + return true; +} + +// -------------------------------------------------------------------------- +int year_iterator::initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) +{ + this->time = t; + this->units = units; + this->calendar = calendar; + + if (t->size() == 0) + { + TECA_ERROR("The array of time values can't be empty") + return -1; + } + + if (first_step >= (long)t->size()) + { + TECA_ERROR("first_step " << first_step + << " output of bounds with " << t->size() << " time values") + return -1; + } + + if (last_step < 0) + last_step = t->size() - 1; + + if ((last_step < first_step) || (last_step >= (long)t->size())) + { + TECA_ERROR("invalid last_step " << last_step << " with first_step " + << first_step << " and " << t->size() << " time values") + return -1; + } + + // current time state + TEMPLATE_DISPATCH(const teca_variant_array_impl, + t.get(), + + const NT *p_t = dynamic_cast(t.get())->get(); + + this->begin = time_point(first_step, p_t[first_step], this->units, this->calendar); + this->end = time_point(last_step, p_t[last_step], this->units, this->calendar); + ) + + this->valid = true; + + this->year = this->begin.year; + + return 0; +} + +// -------------------------------------------------------------------------- +int year_iterator::get_next_interval(time_point &first_step, + time_point &last_step) +{ + // check for more months to process + if (!this->is_valid()) + return -1; + + // find the time step of the first day + char t0[21] = {'\0'}; + snprintf(t0, 21, "%04d-01-01 00:00:00", this->year); + + unsigned long i0 = 0; + if (teca_coordinate_util::time_step_of(this->time, + false, true, this->calendar, this->units, t0, i0)) + { + TECA_ERROR("Failed to locate a time step for " << t0) + return -1; + } + + double ti = 0.0; + this->time->get(i0, ti); 
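+    // record the index, time offset, and calendar date of the first day of
+    // the season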
+ first_step = time_point(i0, ti, this->year); + + // find the time step of the last day + int n_days = 0; + if (teca_calcalcs::days_in_month(this->calendar.c_str(), + this->units.c_str(), this->year, 12, n_days)) + { + TECA_ERROR("Failed to get the last day of the month " + << this->year << " 12") + return -1; + } + + char t1[21] = {'\0'}; + snprintf(t1, 21, "%04d-12-%02d " END_OF_DAY, this->year, n_days); + + unsigned long i1 = 0; + if (teca_coordinate_util::time_step_of(this->time, + true, true, this->calendar, this->units, t1, i1)) + { + TECA_ERROR("Failed to locate a time step for " << t1) + return -1; + } + + this->time->get(i1, ti); + last_step = time_point(i1, ti, this->year, 12, + n_days, END_OF_DAY_HH, END_OF_DAY_MM, END_OF_DAY_SS); + + // move to next year + this->year += 1; + + // if we're at the end of the sequence mark the iterator invalid + if (!this->is_valid()) + this->valid = false; + + return 0; +} + +// -------------------------------------------------------------------------- +bool month_iterator::is_valid() const +{ + if (!this->valid) + return false; + + // check for more months to process + if ((this->year > this->end.year) || + ((this->year == this->end.year) && + (this->month > this->end.month))) + { + return false; + } + + return true; +} + +// -------------------------------------------------------------------------- +int month_iterator::initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) +{ + this->time = t; + this->units = units; + this->calendar = calendar; + + if (t->size() == 0) + { + TECA_ERROR("The array of time values can't be empty") + return -1; + } + + if (first_step >= (long)t->size()) + { + TECA_ERROR("first_step " << first_step + << " output of bounds with " << t->size() << " time values") + return -1; + } + + if (last_step < 0) + last_step = t->size() - 1; + + if ((last_step < first_step) || (last_step >= (long)t->size())) + { + TECA_ERROR("invalid last_step " << last_step << " with first_step " + << first_step << " and " << t->size() << " time values") + return -1; + } + + // time point's to iterate between + TEMPLATE_DISPATCH(const teca_variant_array_impl, + t.get(), + + const NT *p_t = dynamic_cast(t.get())->get(); + + this->begin = time_point(first_step, p_t[first_step], this->units, this->calendar); + this->end = time_point(last_step, p_t[last_step], this->units, this->calendar); + ) + + this->valid = true; + + this->year = this->begin.year; + this->month = this->begin.month; + + return 0; +} + +// -------------------------------------------------------------------------- +int month_iterator::get_next_interval(time_point &first_step, + time_point &last_step) +{ + // check for more months to process + if (!this->is_valid()) + return -1; + + // find the time step of the first day + char t0[21] = {'\0'}; + snprintf(t0, 21, "%04d-%02d-01 00:00:00", this->year, this->month); + + unsigned long i0 = 0; + if (teca_coordinate_util::time_step_of(this->time, + false, true, this->calendar, this->units, t0, i0)) + { + TECA_ERROR("Failed to locate a time step for " << t0) + return -1; + } + + double ti = 0.0; + this->time->get(i0, ti); + first_step = time_point(i0, ti, this->year, this->month); + + // find the time step of the last day + int n_days = 0; + if (teca_calcalcs::days_in_month(this->calendar.c_str(), + this->units.c_str(), this->year, this->month, n_days)) + { + TECA_ERROR("Failed to get the last day of the month " + << this->year << " " << this->month) + 
return -1; + } + + char t1[21] = {'\0'}; + snprintf(t1, 21, "%04d-%02d-%02d " END_OF_DAY, this->year, this->month, n_days); + + unsigned long i1 = 0; + if (teca_coordinate_util::time_step_of(this->time, + true, true, this->calendar, this->units, t1, i1)) + { + TECA_ERROR("Failed to locate a time step for " << t1) + return -1; + } + + this->time->get(i1, ti); + last_step = time_point(i1, ti, this->year, this->month, + n_days, END_OF_DAY_HH, END_OF_DAY_MM, END_OF_DAY_SS); + + // move to next month + this->month += 1; + + // move to next year + if (this->month == 13) + { + this->month = 1; + this->year += 1; + } + + // if we're at the end of the sequence mark the iterator invalid + if (!this->is_valid()) + this->valid = false; + + return 0; +} + +// -------------------------------------------------------------------------- +bool day_iterator::is_valid() const +{ + if (!this->valid) + return false; + + // check for more days to process + if ((this->year > this->end.year) || + ((this->year == this->end.year) && (this->month > this->end.month)) || + ((this->year == this->end.year) && (this->month == this->end.month) && + (this->day > this->end.day))) + { + return false; + } + + return true; +} + +// -------------------------------------------------------------------------- +int day_iterator::initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) +{ + this->time = t; + this->units = units; + this->calendar = calendar; + + if (t->size() == 0) + { + TECA_ERROR("The array of time values can't be empty") + return -1; + } + + if (first_step >= (long)t->size()) + { + TECA_ERROR("first_step " << first_step + << " output of bounds with " << t->size() << " time values") + return -1; + } + + if (last_step < 0) + last_step = t->size() - 1; + + if ((last_step < first_step) || (last_step >= (long)t->size())) + { + TECA_ERROR("invalid last_step " << last_step << " with first_step " + << first_step << " and " << t->size() << " time values") + return -1; + } + + // current time state + TEMPLATE_DISPATCH(const teca_variant_array_impl, + t.get(), + + const NT *p_t = dynamic_cast(t.get())->get(); + + this->begin = time_point(first_step, p_t[first_step], this->units, this->calendar); + this->end = time_point(last_step, p_t[last_step], this->units, this->calendar); + ) + + this->valid = true; + + // current time state + this->year = this->begin.year; + this->month = this->begin.month; + this->day = this->begin.day; + + return 0; +} + +// -------------------------------------------------------------------------- +int day_iterator::get_next_interval(time_point &first_step, + time_point &last_step) +{ + // check for more days to process + if (!this->is_valid()) + return -1; + + // find the time step of the first hour of the day + char tstr0[21] = {'\0'}; + snprintf(tstr0, 21, "%04d-%02d-%02d 00:00:00", + this->year, this->month, this->day); + + unsigned long i0 = 0; + if (teca_coordinate_util::time_step_of(this->time, + false, true, this->calendar, this->units, tstr0, i0)) + { + TECA_ERROR("Failed to locate a time step for " << tstr0) + return -1; + } + + double ti = 0.0; + this->time->get(i0, ti); + first_step = time_point(i0, ti, this->year, this->month, this->day); + + // find the time step of the last hour of the day + char t1[21] = {'\0'}; + snprintf(t1, 21, "%04d-%02d-%02d " END_OF_DAY, + this->year, this->month, this->day); + + unsigned long i1 = 0; + if (teca_coordinate_util::time_step_of(this->time, + true, true, 
this->calendar, this->units, t1, i1)) + { + TECA_ERROR("Failed to locate a time step for " << t1) + return -1; + } + + this->time->get(i1, ti); + last_step = time_point(i1, ti, this->year, this->month, + this->day, END_OF_DAY_HH, END_OF_DAY_MM, END_OF_DAY_SS); + + // move to next day + int n_days = 0; + if (teca_calcalcs::days_in_month(this->calendar.c_str(), + this->units.c_str(), this->year, this->month, n_days)) + { + TECA_ERROR("Failed to get the last day of the month " + << this->year << " " << this->month) + return -1; + } + + this->day += 1; + + // move to next month + if (this->day > n_days) + { + this->month += 1; + this->day = 1; + } + + // move to next year + if (this->month == 13) + { + this->month = 1; + this->year += 1; + } + + // if we're at the end of the sequence mark the iterator invalid + if (!this->is_valid()) + this->valid = false; + + return 0; +} + +// -------------------------------------------------------------------------- +int interval_iterator::initialize(const teca_metadata &md) +{ + return this->initialize(md, 0, -1); +} + +// -------------------------------------------------------------------------- +int interval_iterator::initialize(const teca_metadata &md, + long first_step, long last_step) +{ + // get the time axis and calendar + teca_metadata attributes; + teca_metadata t_atts; + std::string calendar; + std::string units; + teca_metadata coords; + p_teca_variant_array t; + if (md.get("attributes", attributes) || attributes.get("time", t_atts) || + t_atts.get("calendar", calendar) || t_atts.get("units", units) || + md.get("coordinates", coords) || !(t = coords.get("t"))) + { + TECA_ERROR("Failed to get the time axis from the available metadata." + << (attributes.empty() ? "missing" : "has") << " attributes. " + << (t_atts.empty() ? "missing" : "has") << " time attributes. " + << (calendar.empty() ? "missing" : "has") << " calendar ." + << (units.empty() ? "missing" : "has") << " time units. " + << (coords.empty() ? "missing" : "has") << " coordinates. " + << (t ? 
"has" : "missing") << " time values.") + return -1; + } + + return this->initialize(t, units, calendar, first_step, last_step); +} + +// -------------------------------------------------------------------------- +p_interval_iterator interval_iterator_factory::New(const std::string &interval) +{ + if (interval == "daily") + { + return std::make_shared(); + } + else if (interval == "monthly") + { + return std::make_shared(); + } + else if (interval == "seasonal") + { + return std::make_shared(); + } + else if (interval == "yearly") + { + return std::make_shared(); + } + + TECA_ERROR("Failed to construct a \"" + << interval << "\" interval iterator") + return nullptr; +} + +// -------------------------------------------------------------------------- +p_interval_iterator interval_iterator_factory::New(int interval) +{ + if (interval == daily) + { + return std::make_shared(); + } + else if (interval == monthly) + { + return std::make_shared(); + } + else if (interval == seasonal) + { + return std::make_shared(); + } + else if (interval == yearly) + { + return std::make_shared(); + } + + TECA_ERROR("Failed to construct a \"" + << interval << "\" interval iterator") + return nullptr; +} + +} diff --git a/data/teca_calendar_util.h b/data/teca_calendar_util.h new file mode 100644 index 000000000..5d8255ad9 --- /dev/null +++ b/data/teca_calendar_util.h @@ -0,0 +1,387 @@ +#ifndef teca_calendar_h +#define teca_calendar_h + +/// @file + +#include "teca_variant_array.h" +#include "teca_metadata.h" + +#include +#include +#include +#include + +/// Codes dealing with calendaring +namespace teca_calendar_util +{ + +/** @name Gregorian calendar + * functions for date computations in gregorian calendar. to use convert the + * origin to a gergorian_number do the calculation and convert the number back + * into a date useing date_from_gregorian_number. for details about the math + * and an explanation of the errors see + * http://alcor.concordia.ca/~gpkatch/gdate-algorithm.html + */ +///@{ +/** return a date number for the given date that can be used in computations. + * input: + * + * > y : 4 digit year + * > m : 2 digit month + * > d : 2 digit day + * + */ +long gregorian_number(long y, long m, long d); + +/** input: + * + * > g : date number computed from gregorian_number + * + * returns: + * + * > y : 4 digit year + * > m : 2 digit month + * > d : 2 digit day + * + */ +void date_from_gregorian_number(long g, long &y, long &m, long &d); + +/** + * input: + * + * > y : 4 digit year + * > m : 2 digit month + * > d : 2 digit day + * + * returns: + * + * true if the date is valid in the gregorian calendar and our conversion + * algorithm. +*/ +bool valid_gregorian_date(long y, long m, long d); +///@} + + +/// returns one of DJF,MAM,JJA,SON based on the month passed in +const char *get_season_name(int month); + +/** brief + * A floating point time value and its corresponding year, month day, hour + * minute and second + */ +struct time_point +{ + time_point() : index(-1), time(0.0), year(0), month(1), day(1), + hour(0), minute(0), second(0.0) + {} + + /** Initialize explicitly. 
+ * @param[in] i the index of the time value + * @param[in] t the time value + * @param[in] YYYY the year + * @param[in] MM the month + * @param[in] DD the day + * @param[in] hh the hour + * @param[in] mm the minute + * @param[in] ss the second + */ + time_point(long i, double t, int YYYY=0, int MM=1, int DD=1, + int hh=0, int mm=0, double ss=0.0) : index(i), time(t), + year(YYYY), month(MM), day(DD), hour(hh), minute(mm), + second(ss) + {} + + + /** Initialize from a floating point time value. The calendar and units + * must be provided. + * @param[in] i the index of the time value + * @param[in] t the time value + * @param[in] units the units t is in + * @param[in] calendar the calendar system the units are in + */ + time_point(long i, double t, + const std::string &units, const std::string &calendar); + + long index; + double time; + int year; + int month; + int day; + int hour; + int minute; + double second; +}; + +/// An iterator over a series of time intervals +class interval_iterator +{ +public: + + interval_iterator() : time(), units(), calendar(), + begin(), end(), valid(false) + {} + + virtual ~interval_iterator() {} + + /** Initialize the iterator from a metadata object following the + * conventions defined by the teca_cf_reader. + * @returns 0 if successfully initialized + */ + virtual int initialize(const teca_metadata &md); + + /** Initialize the iterator from a metadata object following the + * conventions defined by the teca_cf_reader. + * @param[in] md a metadata object + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + virtual int initialize(const teca_metadata &md, + long first_step, long last_step); + + /** Initialize the iterator. + * @param[in] t An array of time values + * @param[in] units A string units of the time values + * @param[in] calendar A string name of the calendar system + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + virtual int initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) = 0; + + /// return true if there are more time steps in the sequence + virtual bool is_valid() const = 0; + + /** Get the next interval in the series. + * @param[out] first_step The first step in the next element of the series + * @param[out] last_step The last step in the next element of the series + * @returns 0 if successfully initialized + */ + virtual int get_next_interval(time_point &first_step, + time_point &last_step) = 0; + + /// @returns true if there are more intervals in the series + operator bool() const + { + return this->is_valid(); + } + + /// return the first time point in the series + const time_point &get_begin() const { return this->begin; } + + /// return the last time point in the series + const time_point &get_end() const { return this->end; } + +protected: + const_p_teca_variant_array time; + std::string units; + std::string calendar; + time_point begin; + time_point end; + bool valid; +}; + +/// Enumerate ranges of time steps bracketing seasons +/** + * An iterator over seasons (DJF, MAM, JJA, SON) between 2 time_point's. A + * pair of time steps bracketing the current season are returned at each + * iteration. 
Only full seasonal intervals are processed. If the input data + * doesn't start or end on a seasonal boundary, the data from the start to the + * first full season, and the data from the end of the last full season to the + * end is skipped. + */ +class season_iterator : public interval_iterator +{ +public: + season_iterator() : year(-1), month(-1) {} + + /// return true if there are more time steps in the sequence + bool is_valid() const override; + + /** Initialize the iterator. + * + * @param[in] t An array of time values + * @param[in] units A string units of the time values + * @param[in] calendar A string name of the calendar system + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + int initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) override; + + /** return a pair of time steps bracketing the current season. + * both returned time steps belong to the current season. + */ + int get_next_interval(time_point &first_step, + time_point &last_step) override; + +private: + /** given a year and month, checks that the values fall on a seasonal + * boundary. if not, returns the year and month of the start of the next + * season. + */ + int get_first_season(int y_in, int m_in, int &y_out, int &m_out) const; + + /** Given a year and month returns the year month and day of the end of the + * season. the input month need not be on a seasonal boundary. + */ + int get_season_end(int y_in, int m_in, + int &y_out, int &m_out, int &d_out) const; + + /** Given a year and month returns the year and month of the next season. + * the input momnth doesn't need to be on a seasonal boundary. + */ + int get_next_season(int y_in, int m_in, int &y_out, int &m_out) const; + +protected: + int year; + int month; +}; + +/// Enumerate ranges of time steps bracketing months +/** An iterator over all months between 2 time_point's. A pair + * of time steps bracketing the current month are returned at + * each iteration. + */ +class year_iterator : public interval_iterator +{ +public: + year_iterator() : year(-1) {} + + /// return true if there are more time steps in the sequence + bool is_valid() const override; + + /** Initialize the iterator. + * + * @param[in] t An array of time values + * @param[in] units A string units of the time values + * @param[in] calendar A string name of the calendar system + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + int initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) override; + + /** return a pair of time steps bracketing the current season. + * both returned time steps belong to the current season. + */ + int get_next_interval(time_point &first_step, + time_point &last_step) override; + +protected: + int year; +}; + +/// Enumerate ranges of time steps bracketing months +/** An iterator over all months between 2 time_point's. A pair + * of time steps bracketing the current month are returned at + * each iteration. 
+ */ +class month_iterator : public interval_iterator +{ +public: + month_iterator() : year(-1), month(-1) {} + + /// return true if there are more time steps in the sequence + bool is_valid() const override; + + /** Initialize the iterator. + * + * @param[in] t An array of time values + * @param[in] units A string units of the time values + * @param[in] calendar A string name of the calendar system + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + int initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) override; + + /** return a pair of time steps bracketing the current season. + * both returned time steps belong to the current season. + */ + int get_next_interval(time_point &first_step, + time_point &last_step) override; + +protected: + int year; + int month; +}; + +/// Enumerate ranges of time steps bracketing days +/** An iterator over all days between 2 time_point's. A pair + * of time steps bracketing the current day are returned at + * each iteration. + */ +class day_iterator : public interval_iterator +{ +public: + day_iterator() : year(-1), month(-1), day(-1) {} + + /// return true if there are more time steps in the sequence + bool is_valid() const override; + + /** Initialize the iterator. + * + * @param[in] t An array of time values + * @param[in] units A string units of the time values + * @param[in] calendar A string name of the calendar system + * @param[in] first_step the first step to include in the series or 0 to use all + * @param[in] last_step the last step to include in the series or -1 to use all + * @returns 0 if successfully initialized + */ + int initialize(const const_p_teca_variant_array &t, + const std::string &units, const std::string &calendar, + long first_step, long last_step) override; + + /** return a pair of time steps bracketing the current season. + * both returned time steps belong to the current season. + */ + int get_next_interval(time_point &first_step, + time_point &last_step) override; + +protected: + int year; + int month; + int day; +}; + + +using p_interval_iterator = std::shared_ptr; + +/// A factory for interval_iterator +class interval_iterator_factory +{ +public: + /** Allocate and return an instance of the named iterator + * @param[in] interval Name of the desired interval iterator. One of daily, + * monthly, seasonal, or yearly + * @returns an instance of interval_iterator + */ + static p_interval_iterator New(const std::string &interval); + + /// The available intervals + enum {invalid = 0, daily = 2, monthly = 3, seasonal = 4, yearly = 5}; + + /** Allocate and return an instance of the named iterator + * @param[in] interval Id of the desired interval iterator. 
One of daily, + * monthly, seasonal, or yearly + * @returns an instance of interval_iterator + */ + static p_interval_iterator New(int interval); +}; + +} + +/// send the time_point to a stream in humnan readable form +std::ostream &operator<<(std::ostream &os, + const teca_calendar_util::time_point &tpt); + +#endif diff --git a/data/teca_cartesian_mesh.cxx b/data/teca_cartesian_mesh.cxx index 441af030a..036185b0c 100644 --- a/data/teca_cartesian_mesh.cxx +++ b/data/teca_cartesian_mesh.cxx @@ -1,6 +1,8 @@ #include "teca_cartesian_mesh.h" #include "teca_dataset_util.h" #include "teca_bad_cast.h" +#include "teca_metadata.h" +#include "teca_metadata_util.h" #include @@ -98,6 +100,32 @@ void teca_cartesian_mesh::set_z_coordinates(const std::string &var, m_coordinate_arrays->set("z", array); } +// -------------------------------------------------------------------------- +int teca_cartesian_mesh::get_array_extent(const std::string &array_name, + unsigned long array_extent[6]) +{ + teca_metadata atts; + teca_metadata array_atts; + unsigned long mesh_extent[6] = {0}; + if (this->get_extent(mesh_extent) || this->get_attributes(atts) || + atts.get(array_name, array_atts)) + { + TECA_ERROR("Cartesian mesh dataset metadata issue. extent," + "attributes, and array attributes for \"" + << array_name << "\" are required") + return -1; + } + + if (teca_metadata_util::get_array_extent(array_atts, + mesh_extent, array_extent)) + { + // not necessarily an error + return 1; + } + + return 0; +} + // -------------------------------------------------------------------------- int teca_cartesian_mesh::to_stream(teca_binary_stream &s) const { diff --git a/data/teca_cartesian_mesh.h b/data/teca_cartesian_mesh.h index 3dee6ee72..587b60d77 100644 --- a/data/teca_cartesian_mesh.h +++ b/data/teca_cartesian_mesh.h @@ -3,9 +3,10 @@ #include "teca_mesh.h" #include "teca_shared_object.h" + TECA_SHARED_OBJECT_FORWARD_DECL(teca_cartesian_mesh) -/// data on a physically uniform cartesian mesh +/// An object representing data on a stretched Cartesian mesh. class teca_cartesian_mesh : public teca_mesh { public: @@ -15,7 +16,7 @@ class teca_cartesian_mesh : public teca_mesh virtual ~teca_cartesian_mesh() = default; - // set/get metadata + // Set/get metadata TECA_DATASET_METADATA(whole_extent, unsigned long, 6) TECA_DATASET_METADATA(extent, unsigned long, 6) TECA_DATASET_METADATA(bounds, double, 6) @@ -27,58 +28,70 @@ class teca_cartesian_mesh : public teca_mesh TECA_DATASET_METADATA(z_coordinate_variable, std::string, 1) TECA_DATASET_METADATA(t_coordinate_variable, std::string, 1) - // get x coordinate array + /** Get the extent of the named array, taking into account the variable's + * dimensions as opposed to the mesh's dimensions. For instance the mesh + * extent may represent a volume while a variables extent may represent a + * slice. returns 0 if successful, -1 if an error occurred, 1 if the + * have_mesh_dims flag is missing. The latter is not necessarily an error. 
+ */ + int get_array_extent(const std::string &array_name, + unsigned long array_extent[6]); + + /// Get the x coordinate array p_teca_variant_array get_x_coordinates() { return m_coordinate_arrays->get("x"); } const_p_teca_variant_array get_x_coordinates() const { return m_coordinate_arrays->get("x"); } - // get y coordinate array + /// Get the y coordinate array p_teca_variant_array get_y_coordinates() { return m_coordinate_arrays->get("y"); } const_p_teca_variant_array get_y_coordinates() const { return m_coordinate_arrays->get("y"); } - // get z coordinate array + /// Get the z coordinate array p_teca_variant_array get_z_coordinates() { return m_coordinate_arrays->get("z"); } const_p_teca_variant_array get_z_coordinates() const { return m_coordinate_arrays->get("z"); } - // set coordinate arrays + /// Set the x coordinate array void set_x_coordinates(const std::string &name, const p_teca_variant_array &array); + /// Set the y coordinate array void set_y_coordinates(const std::string &name, const p_teca_variant_array &array); + /// Set the z coordinate array void set_z_coordinates(const std::string &name, const p_teca_variant_array &array); - - // return a unique string identifier + /// Return the name of the class std::string get_class_name() const override { return "teca_cartesian_mesh"; } - // return an integer identifier uniquely naming the dataset type + /// return an integer identifier uniquely naming the dataset type int get_type_code() const override; - // copy data and metadata. shallow copy uses reference - // counting, while copy duplicates the data. + /** Copy data and metadata. Shallow copy uses reference + * counting, while copy duplicates the data. + */ void copy(const const_p_teca_dataset &) override; void shallow_copy(const p_teca_dataset &) override; - // copy metadata. always a deep copy. + /// Copy metadata. This is always a deep copy. 
void copy_metadata(const const_p_teca_dataset &other) override; - // swap internals of the two objects + /// Swap the internals of the two objects void swap(p_teca_dataset &) override; - // serialize the dataset to/from the given stream - // for I/O or communication + /** Serialize the dataset to/from the given stream + * for I/O or communication + */ int to_stream(teca_binary_stream &) const override; int from_stream(teca_binary_stream &) override; diff --git a/data/teca_coordinate_util.cxx b/data/teca_coordinate_util.cxx index 3a04d4385..e00b177d1 100644 --- a/data/teca_coordinate_util.cxx +++ b/data/teca_coordinate_util.cxx @@ -2,7 +2,7 @@ #include "teca_common.h" #if defined(TECA_HAS_UDUNITS) -#include "calcalcs.h" +#include "teca_calcalcs.h" #endif #include @@ -15,9 +15,10 @@ namespace teca_coordinate_util { // ************************************************************************** -int time_step_of(p_teca_variant_array time, bool lower, bool clamp, - const std::string &calendar, const std::string &units, - const std::string &date, unsigned long &step) +int time_step_of(const const_p_teca_variant_array &time, + bool lower, bool clamp, const std::string &calendar, + const std::string &units, const std::string &date, + unsigned long &step) { #if defined(TECA_HAS_UDUNITS) step = 0; @@ -36,7 +37,7 @@ int time_step_of(p_teca_variant_array time, bool lower, bool clamp, // apply calendaring to get a time offset double t = 0.0; - if (calcalcs::coordinate(Y, M, D, h, m, s, + if (teca_calcalcs::coordinate(Y, M, D, h, m, s, units.c_str(), calendar.c_str(), &t)) { TECA_ERROR("failed to convert date \"" << date @@ -48,9 +49,9 @@ int time_step_of(p_teca_variant_array time, bool lower, bool clamp, // locate the nearest time value in the time axis unsigned long last = time->size() - 1; - TEMPLATE_DISPATCH_FP_SI(teca_variant_array_impl, + TEMPLATE_DISPATCH_FP_SI(const teca_variant_array_impl, time.get(), - NT *p_time = std::dynamic_pointer_cast(time)->get(); + const NT *p_time = std::dynamic_pointer_cast(time)->get(); if (clamp && (t <= p_time[0])) { step = 0; @@ -91,10 +92,10 @@ int time_to_string(double val, const std::string &calendar, const std::string &units, const std::string &format, std::string &date) { #if defined(TECA_HAS_UDUNITS) - // use calcalcs to convert val to a set of year/month/day/etc. + // use teca_calcalcs to convert val to a set of year/month/day/etc. 
struct tm timedata = {}; double seconds = 0.0; - if (calcalcs::date(val, &timedata.tm_year, &timedata.tm_mon, + if (teca_calcalcs::date(val, &timedata.tm_year, &timedata.tm_mon, &timedata.tm_mday, &timedata.tm_hour, &timedata.tm_min, &seconds, units.c_str(), calendar.c_str())) { @@ -139,7 +140,7 @@ int bounds_to_extent(const double *bounds, const teca_metadata &md, teca_metadata coords; if (md.get("coordinates", coords)) { - TECA_ERROR("missing cooridnates") + TECA_ERROR("Metadata issue, missing cooridnates") return -1; } @@ -149,18 +150,26 @@ int bounds_to_extent(const double *bounds, const teca_metadata &md, if (!x || !y || !z) { - TECA_ERROR("empty coordinate axes") + TECA_ERROR("Metadata issue, empty coordinate axes") return -1; } - return bounds_to_extent(bounds, x, y, z, extent); -} + if (bounds_to_extent(bounds, x, y, z, extent) || + validate_extent(x->size(), y->size(), z->size(), extent, true)) + { + TECA_ERROR("Invalid bounds raequested [" << bounds[0] << ", " + << bounds[1] << ", " << bounds[2] << ", " << bounds[3] << ", " + << bounds[4] << ", " << bounds[5] << "]") + return -1; + } + return 0; +} // ************************************************************************** int bounds_to_extent(const double *bounds, - const_p_teca_variant_array x, const_p_teca_variant_array y, - const_p_teca_variant_array z, unsigned long *extent) + const const_p_teca_variant_array &x, const const_p_teca_variant_array &y, + const const_p_teca_variant_array &z, unsigned long *extent) { TEMPLATE_DISPATCH_FP( const teca_variant_array_impl, @@ -238,7 +247,56 @@ int bounds_to_extent(const double *bounds, return 0; ) - TECA_ERROR("invalid coordinate array type") + TECA_ERROR("invalid coordinate array type \"" << x->get_class_name() << "\"") + return -1; +} + +// ************************************************************************** +int bounds_to_extent(const double *bounds, + const const_p_teca_variant_array &x, unsigned long *extent) +{ + TEMPLATE_DISPATCH_FP( + const teca_variant_array_impl, + x.get(), + + // in the following, for each side (low, high) of the bounds in + // each cooridnate direction we are searching for the index that + // is either just below, just above, or exactly at the given value. + // special cases include: + // * x,y,z in descending order. we check for that and + // invert the compare functions that define the bracket + // * bounds describing a plane. we test for this and + // so that both high and low extent return the same value. + // * x,y,z are length 1. we can skip the search in that + // case. 
+ + const NT eps8 = NT(8)*std::numeric_limits::epsilon(); + + unsigned long nx = x->size(); + unsigned long high_i = nx - 1; + extent[0] = 0; + extent[1] = high_i; + const NT *px = std::dynamic_pointer_cast(x)->get(); + NT low_x = static_cast(bounds[0]); + NT high_x = static_cast(bounds[1]); + bool slice_x = equal(low_x, high_x, eps8); + + if (((nx > 1) && (((px[high_i] > px[0]) && + (teca_coordinate_util::index_of(px, 0, high_i, low_x, true, extent[0]) + || teca_coordinate_util::index_of(px, 0, high_i, high_x, slice_x, extent[1]))) || + ((px[high_i] < px[0]) && + (teca_coordinate_util::index_of>(px, 0, high_i, low_x, false, extent[0]) + || teca_coordinate_util::index_of>(px, 0, high_i, high_x, !slice_x, extent[1])))))) + { + TECA_ERROR(<< "requested subset [" << bounds[0] << ", " << bounds[1] << ", " + << "] is not contained in the current dataset bounds [" << px[0] << ", " + << px[high_i] << "]") + return -1; + } + return 0; + ) + + TECA_ERROR("invalid coordinate array type \"" << x->get_class_name() << "\"") return -1; } @@ -284,6 +342,25 @@ int validate_centering(int centering) return ret; } +// ************************************************************************** +int get_cartesian_mesh_bounds(const const_p_teca_variant_array x, + const const_p_teca_variant_array y, const const_p_teca_variant_array z, + double *bounds) +{ + unsigned long x1 = x->size() - 1; + unsigned long y1 = y->size() - 1; + unsigned long z1 = z->size() - 1; + + x->get(0, bounds[0]); + x->get(x1, bounds[1]); + y->get(0, bounds[2]); + y->get(y1, bounds[3]); + z->get(0, bounds[4]); + z->get(z1, bounds[5]); + + return 0; +} + // ************************************************************************** int get_cartesian_mesh_extent(const teca_metadata &md, unsigned long *whole_extent, double *bounds) @@ -327,4 +404,94 @@ int get_cartesian_mesh_extent(const teca_metadata &md, return 0; } +// ************************************************************************** +int validate_extent(unsigned long nx_max, unsigned long ny_max, + unsigned long nz_max, unsigned long *extent, bool verbose) +{ + // validate x + if ((extent[1] >= nx_max) || (extent[1] < extent[0])) + { + if (verbose) + { + TECA_ERROR("The x-axis extent [" << extent[0] << ", " + << extent[1] << "] is invalid, the x-axis coordinate" + " array has " << nx_max << " values") + } + return -1; + } + + // validate y + if ((extent[3] >= ny_max) || (extent[3] < extent[2])) + { + if (verbose) + { + TECA_ERROR("The y-axis extent [" << extent[2] << ", " + << extent[3] << "] is invalid, the y-axis coordinate" + " array has " << ny_max << " values") + } + return -1; + } + + // validate z + if ((extent[5] >= nz_max) || (extent[5] < extent[4])) + { + if (verbose) + { + TECA_ERROR("The z-axis extent [" << extent[4] << ", " + << extent[5] << "] is invalid, the z-axis coordinate" + " array has " << nz_max << " values") + } + return -1; + } + + return 0; +} + +// ************************************************************************** +int clamp_dimensions_of_one(unsigned long nx_max, unsigned long ny_max, + unsigned long nz_max, unsigned long *extent, bool verbose) +{ + int clamped = 0; + + // clamp x + if ((nx_max == 1) && (extent[1] != 0)) + { + if (verbose) + { + TECA_WARNING("The requested x-axis extent [" << extent[0] << ", " + << extent[1] << "] is invalid and was clamped to [0, 0]") + } + extent[0] = 0; + extent[1] = 0; + clamped = 1; + } + + // clamp y + if ((ny_max == 1) && (extent[3] != 0)) + { + if (verbose) + { + TECA_WARNING("The requested y-axis extent 
[" << extent[2] << ", " + << extent[3] << "] is invalid and was clamped to [0, 0]") + } + extent[2] = 0; + extent[3] = 0; + clamped = 1; + } + + // clamp z + if ((nz_max == 1) && (extent[5] != 0)) + { + if (verbose) + { + TECA_WARNING("The requested z-axis extent [" << extent[4] << ", " + << extent[5] << "] is invalid and was clamped to [0, 0]") + } + extent[4] = 0; + extent[5] = 0; + clamped = 1; + } + + return clamped; +} }; diff --git a/data/teca_coordinate_util.h b/data/teca_coordinate_util.h index d14b93c20..01fb8d0fb 100644 --- a/data/teca_coordinate_util.h +++ b/data/teca_coordinate_util.h @@ -1,6 +1,8 @@ #ifndef teca_cartesian_mesh_util_h #define teca_cartesian_mesh_util_h +/// @file + #include "teca_cartesian_mesh.h" #include "teca_variant_array.h" #include "teca_metadata.h" @@ -12,26 +14,35 @@ #include #include +/// For printing data as ASCII with the maximum supported numerical precision #define max_prec(T) \ std::setprecision(std::numeric_limits::digits10 + 1) +/// Codes dealing with operations on coordinate systems namespace teca_coordinate_util { -// traits classes used to get default tolerances for comparing numbers -// of a given precision. A relative tolerance is used for comparing large -// numbers and an absolute tolerance is used for comparing small numbers. -// these defaults are not universal and will not work well in all situations. -// see also: -// https://randomascii.wordpress.com/2012/02/25/comparing-floating-point-numbers-2012-edition/ +/** @brief + * traits classes used to get default tolerances for comparing numbers + * of a given precision. + * + * @details + * A relative tolerance is used for comparing large + * numbers and an absolute tolerance is used for comparing small numbers. + * these defaults are not universal and will not work well in all situations. + * + * see also: + * https://randomascii.wordpress.com/2012/02/25/comparing-floating-point-numbers-2012-edition/ + */ template struct equal_tt {}; -#define declare_equal_tt(cpp_t, atol, rtol) \ -template <> \ -struct equal_tt \ -{ \ - static cpp_t absTol() { return atol; } \ - static cpp_t relTol() { return rtol; } \ +#define declare_equal_tt(cpp_t, atol, rtol) \ +/** Specialization for cpp_t with default absTol and relTol */ \ +template <> \ +struct equal_tt \ +{ \ + static cpp_t absTol() { return atol; } \ + static cpp_t relTol() { return rtol; } \ }; declare_equal_tt(float, 10.0f*std::numeric_limits::epsilon(), @@ -43,9 +54,9 @@ declare_equal_tt(double, 10.0*std::numeric_limits::epsilon(), declare_equal_tt(long double, std::numeric_limits::epsilon(), std::numeric_limits::epsilon()) -// compare two floating point numbers. -// absTol handles comparing numbers very close to zero. -// relTol handles comparing larger values. +/** Compare two floating point numbers. absTol handles comparing numbers very + * close to zero. relTol handles comparing larger values. + */ template bool equal(T a, T b, T relTol = equal_tt::relTol(), T absTol = equal_tt::absTol(), @@ -65,7 +76,7 @@ bool equal(T a, T b, return false; } -// a specialization for integer types +/// Compare two integral numbers. template bool equal(T a, T b, T relTol = 0, T absTol = 0, typename std::enable_if::value>::type* = 0) @@ -75,8 +86,10 @@ bool equal(T a, T b, T relTol = 0, T absTol = 0, return a == b; } -// an overload for use in regression tests. If the numbers are not equal then a diagnostic -// message is returned. +/** Compare two floating point numbers. 
This overload may be used in regression + * tests or other contexts where a diagnostic error message should be reported + * if the numbers are not equal. + */ template bool equal(T a, T b, std::string &diagnostic, T relTol = equal_tt::relTol(), T absTol = equal_tt::absTol(), @@ -109,7 +122,10 @@ bool equal(T a, T b, std::string &diagnostic, return false; } -// a specialization for integer types +/** Compare two integral numbers. This overload may be used in regression + * tests or other contexts where a diagnostic error message should be reported + * if the numbers are not equal. + */ template bool equal(T a, T b, std::string &diagnostic, T relTol = 0, T absTol = 0, typename std::enable_if::value>::type* = 0) @@ -126,44 +142,76 @@ bool equal(T a, T b, std::string &diagnostic, T relTol = 0, T absTol = 0, } -// comparators implementing bracket for ascending and -// descending input arrays +/// Less than or equal to predicate template struct leq { static bool eval(const data_t &l, const data_t &r) { return l <= r; } }; +/// Greater than or equal to predicate template struct geq { static bool eval(const data_t &l, const data_t &r) { return l >= r; } }; +/// Less than predicate template struct lt { static bool eval(const data_t &l, const data_t &r) { return l < r; } }; +/// Greater than predicate template struct gt { static bool eval(const data_t &l, const data_t &r) { return l > r; } }; +/// comparator implementing bracket for ascending input arrays template struct ascend_bracket { + // m_0 is an index into the data, m_1 = m_0 + 1 + // comparitors defining the bracket orientation. for data in + // ascending order: val >= data[m_0] && val <= data[m_1] using comp0_t = geq; using comp1_t = leq; + + // m_0 is an index into the data, m_1 = m_0 + 1 + // get the id of the smaller value (lower == true) + // or the larger value (lower == false) + static unsigned long get_id(bool lower, + unsigned long m_0, unsigned long m_1) + { + if (lower) + return m_0; + return m_1; + } }; +/// comparator implementing bracket for descending input arrays template struct descend_bracket { + // m_0 is an index into the data, m_1 = m_0 + 1 + // comparitors defining the bracket orientation. for data in + // descending order: val <= data[m_0] && val >= data[m_1] using comp0_t = leq; using comp1_t = geq; + + // m_0 is an index into the data, m_1 = m_0 + 1 + // get the id of the smaller value (lower == true) + // or the larger value (lower == false) + static unsigned long get_id(bool lower, + unsigned long m_0, unsigned long m_1) + { + if (lower) + return m_1; + return m_0; + } }; -// binary search that will locate index bounding the value -// above or below such that data[i] <= val or val <= data[i+1] -// depending on the value of lower. return 0 if the value is -// found. the comp0 and comp1 template parameters let us -// operate on both ascending and descending input. defaults -// are set for ascending inputs. +/** binary search that will locate index bounding the value above or below + * such that data[i] <= val or val <= data[i+1] depending on the value of + * lower. return 0 if the value is found. the comp0 and comp1 template + * parameters let us operate on both ascending and descending input. defaults + * are set for ascending inputs. 
+ */ template > int index_of(const data_t *data, unsigned long l, unsigned long r, data_t val, bool lower, unsigned long &id) @@ -192,10 +240,7 @@ int index_of(const data_t *data, unsigned long l, unsigned long r, if (equal(val, data[m_1])) id = m_1; else - if (lower) - id = m_0; - else - id = m_1; + id = bracket_t::get_id(lower, m_0, m_1); return 0; } else @@ -216,8 +261,9 @@ int index_of(const data_t *data, unsigned long l, unsigned long r, return -1; } -// binary search that will locate index of the given value. -// return 0 if the value is found. +/** binary search that will locate index of the given value. return 0 if the + * value is found. + */ template int index_of(const T *data, size_t l, size_t r, T val, unsigned long &id) { @@ -263,19 +309,22 @@ int index_of(const T *data, size_t l, size_t r, T val, unsigned long &id) return -1; } -// convert bounds to extents -// return non-zero if the requested bounds are not in -// the given coordinate arrays. coordinate arrays must -// not be empty. +/** Convert bounds to extents. return non-zero if the requested bounds are + * not in the given coordinate arrays. coordinate arrays must not be empty. + */ +int bounds_to_extent(const double *bounds, + const const_p_teca_variant_array &x, const const_p_teca_variant_array &y, + const const_p_teca_variant_array &z, unsigned long *extent); + int bounds_to_extent(const double *bounds, - const_p_teca_variant_array x, const_p_teca_variant_array y, - const_p_teca_variant_array z, unsigned long *extent); + const const_p_teca_variant_array &x, unsigned long *extent); int bounds_to_extent(const double *bounds, const teca_metadata &md, unsigned long *extent); -// get the i,j,k cell index of point x,y,z in the given mesh. -// return 0 if successful. +/** Get the i,j,k cell index of point x,y,z in the given mesh. return 0 if + * successful. + */ template int index_of(const const_p_teca_cartesian_mesh &mesh, T x, T y, T z, unsigned long &i, unsigned long &j, unsigned long &k) @@ -312,29 +361,31 @@ int index_of(const const_p_teca_cartesian_mesh &mesh, T x, T y, T z, return -1; } -// given a human readable date string in YYYY-MM-DD hh:mm:ss format -// amd a list of floating point offset times inthe specified calendar -// and units find the closest time step. return 0 if successful -// see index_of for a description of lower, if clamp is true then -// when the date falls outside of the time values either the first -// or last time step is returned. -int time_step_of(p_teca_variant_array time, bool lower, bool clamp, - const std::string &calendar, const std::string &units, - const std::string &date, unsigned long &step); - -// given a time value (val), associated time units (units), and calendar -// (calendar), return a human-readable rendering of the date (date) in a -// strftime-format (format). return 0 if successful. +/** given a human readable date string in YYYY-MM-DD hh:mm:ss format and a + * list of floating point offset times in the specified calendar and units find + * the closest time step. return 0 if successful see index_of for a description + * of lower, if clamp is true then when the date falls outside of the time + * values either the first or last time step is returned. 
+ */ +int time_step_of(const const_p_teca_variant_array &time, + bool lower, bool clamp, const std::string &calendar, + const std::string &units, const std::string &date, + unsigned long &step); + +/** given a time value (val), associated time units (units), and calendar + * (calendar), return a human-readable rendering of the date (date) in a + * strftime-format (format). return 0 if successful. + */ int time_to_string(double val, const std::string &calendar, const std::string &units, const std::string &format, std::string &date); -// build random access data structures for an indexed table. -// the index column gives each entity a unique id. the index is -// used to identify rows that belong in the entity. it is assumed -// that an entity ocupies consecutive rows. the returns are: -// n_entities, the number of entities found; counts, the number of -// rows used by each entity; offsets, the starting row of each -// entity; ids, a new set of ids for the entities starting from 0 +/** build random access data structures for an indexed table. the index column + * gives each entity a unique id. the index is used to identify rows that + * belong in the entity. it is assumed that an entity occupies consecutive rows. + * the returns are: n_entities, the number of entities found; counts, the + * number of rows used by each entity; offsets, the starting row of each + * entity; ids, a new set of ids for the entities starting from 0 + */ template void get_table_offsets(const int_t *index, unsigned long n_rows, unsigned long &n_entities, std::vector &counts, @@ -374,8 +425,16 @@ void get_table_offsets(const int_t *index, unsigned long n_rows, offsets[i] = offsets[i-1] + counts[i-1]; } -// 0 order (nearest neighbor) interpolation -// for nodal data on stretched cartesian mesh. +/** 0th order (nearest neighbor) interpolation for nodal data on a stretched + * Cartesian mesh. This overload implements the general 3D case. + * cx, cy, cz is the location to interpolate to + * p_x, p_y, p_z array arrays containing the source coordinates with extents + * [0, ihi, 0, jhi, 0, khi] + * p_data is the field to interpolate from + * val is the result + * returns 0 if successful, an error occurs if cx, cy, cz is outside of the + * source coordinate system + */ template int interpolate_nearest(CT cx, CT cy, CT cz, const CT *p_x, const CT *p_y, const CT *p_z, @@ -411,8 +470,58 @@ int interpolate_nearest(CT cx, CT cy, CT cz, return 0; } -// 1 order (linear) interpolation -// for nodal data on stretched cartesian mesh. +/** 0th order (nearest neighbor) interpolation for nodal data on a stretched + * Cartesian mesh. This overload implements the special case where both source + * and target mesh data are in a 2D x-y plane using fewer operations than the + * general 3D implementation. 
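A sketch of time_to_string(), rendering an offset of 365.25 days as a human readable date; the calendar, units, and strftime format strings are illustrative CF style values:

    #include "teca_coordinate_util.h"
    #include <iostream>
    #include <string>

    int main()
    {
        std::string date;
        if (teca_coordinate_util::time_to_string(365.25, "standard",
            "days since 2000-01-01 00:00:00", "%Y-%m-%d %H:%M:%S", date))
        {
            std::cerr << "failed to convert the time value" << std::endl;
            return -1;
        }

        std::cout << date << std::endl;
        return 0;
    }
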
+ * cx, cy, cz is the location to interpolate to + * p_x, p_y, p_z array arrays containing the source coordinates with extents + * [0, ihi, 0, jhi, 0, khi] + * p_data is the field to interpolate from + * val is the result + * returns 0 if successful, an error occurs if cx, cy, cz is outside of the + * source coordinate system + */ +template +int interpolate_nearest(coord_t cx, coord_t cy, const coord_t *p_x, + const coord_t *p_y, const data_t *p_data, unsigned long ihi, + unsigned long jhi, unsigned long nx, data_t &val) +{ + // get i,j of node less than cx,cy + unsigned long i = 0; + unsigned long j = 0; + + if ((ihi && teca_coordinate_util::index_of(p_x, 0, ihi, cx, true, i)) + || (jhi && teca_coordinate_util::index_of(p_y, 0, jhi, cy, true, j))) + { + // cx,cy is outside the coordinate axes + return -1; + } + + // get i,j of node greater than cx,cy + unsigned long ii = std::min(i + 1, ihi); + unsigned long jj = std::min(j + 1, jhi); + + // get index of nearest node + unsigned long p = (cx - p_x[i]) <= (p_x[ii] - cx) ? i : ii; + unsigned long q = (cy - p_y[j]) <= (p_y[jj] - cy) ? j : jj; + + // assign value from nearest node + val = p_data[p + nx*q]; + + return 0; +} + +/** 1st order (linear) interpolation for nodal data on stretched Cartesian + * mesh. This overload implements the general 3D case. + * cx, cy, cz is the location to interpolate to + * p_x, p_y, p_z array arrays containing the source coordinates with extents + * [0, ihi, 0, jhi, 0, khi] + * p_data is the field to interpolate from + * val is the result + * returns 0 if successful, an error occurs if cx, cy, cz is outside of the + * source coordinate system + */ template int interpolate_linear(CT cx, CT cy, CT cz, const CT *p_x, const CT *p_y, const CT *p_z, @@ -433,15 +542,15 @@ int interpolate_linear(CT cx, CT cy, CT cz, return -1; } - // get i,j of node greater than cx,cy + // get i,j of node greater than cx,cy,cz unsigned long ii = std::min(i + 1, ihi); unsigned long jj = std::min(j + 1, jhi); unsigned long kk = std::min(k + 1, khi); // compute weights - CT wx = (cx - p_x[i])/(p_x[ii] - p_x[i]); - CT wy = (cy - p_y[i])/(p_y[ii] - p_y[i]); - CT wz = (cz - p_z[i])/(p_z[ii] - p_z[i]); + CT wx = ii == i ? 0 : (cx - p_x[i])/(p_x[ii] - p_x[i]); + CT wy = jj == j ? 0 : (cy - p_y[j])/(p_y[jj] - p_y[j]); + CT wz = kk == k ? 0 : (cz - p_z[k])/(p_z[kk] - p_z[k]); CT vx = CT(1) - wx; CT vy = CT(1) - wy; @@ -460,11 +569,61 @@ int interpolate_linear(CT cx, CT cy, CT cz, return 0; } -// functor templated on order of accuracy for above Cartesian mesh interpolants +/** 1st order (linear) interpolation for nodal data on stretched Cartesian mesh. + * This overload implements the special case where both source and target data + * are in a 2D x-y plane using fewer operations than the general 3D + * implementation. 
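To illustrate the new 2D overload, a sketch sampling a 3 by 3 node centered field with nearest neighbor interpolation (the grid and field values are hypothetical):

    #include "teca_coordinate_util.h"
    #include <iostream>

    int main()
    {
        double x[] = {0.0, 1.0, 2.0};
        double y[] = {0.0, 1.0, 2.0};

        // a 3 by 3 field stored row major, nx = 3
        double f[] = {0.0, 1.0, 2.0,
                      3.0, 4.0, 5.0,
                      6.0, 7.0, 8.0};

        double val = 0.0;
        if (teca_coordinate_util::interpolate_nearest(
            0.6, 1.2, x, y, f, 2, 2, 3, val))
        {
            std::cerr << "(0.6, 1.2) is outside of the source mesh" << std::endl;
            return -1;
        }

        std::cout << "nearest value = " << val << std::endl; // expect 4
        return 0;
    }
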
+ * cx, cy, cz is the location to interpolate to + * p_x, p_y, p_z array arrays containing the source coordinates with extents + * [0, ihi, 0, jhi, 0, khi] + * p_data is the field to interpolate from + * val is the result + * returns 0 if successful, an error occurs if cx, cy, cz is outside of the + * source coordinate system + */ +template +int interpolate_linear(CT cx, CT cy, const CT *p_x, const CT *p_y, + const DT *p_data, unsigned long ihi, unsigned long jhi, + unsigned long nx, DT &val) +{ + // get i,j of node less than cx,cy + unsigned long i = 0; + unsigned long j = 0; + + if ((ihi && teca_coordinate_util::index_of(p_x, 0, ihi, cx, true, i)) + || (jhi && teca_coordinate_util::index_of(p_y, 0, jhi, cy, true, j))) + { + // cx,cy is outside the coordinate axes + return -1; + } + + // get i,j of node greater than cx,cy + unsigned long ii = std::min(i + 1, ihi); + unsigned long jj = std::min(j + 1, jhi); + + // compute weights + CT wx = ii == i ? 0 : (cx - p_x[i])/(p_x[ii] - p_x[i]); + CT wy = jj == j ? 0 : (cy - p_y[j])/(p_y[jj] - p_y[j]); + + CT vx = CT(1) - wx; + CT vy = CT(1) - wy; + + // interpolate + val = vx*vy*p_data[ i + j*nx] + + wx*vy*p_data[ii + j*nx] + + wx*wy*p_data[ii + jj*nx] + + vx*wy*p_data[ i + jj*nx]; + + return 0; +} + +/// A functor templated on order of accuracy for above Cartesian mesh interpolants template struct interpolate_t; +/// Zero'th order interpolant specialization template<> struct interpolate_t<0> { + // 3D template int operator()(CT tx, CT ty, CT tz, const CT *sx, const CT *sy, const CT *sz, const DT *sa, unsigned long ihi, unsigned long jhi, @@ -473,10 +632,22 @@ template<> struct interpolate_t<0> return teca_coordinate_util::interpolate_nearest(tx,ty,tz, sx,sy,sz,sa, ihi,jhi,khi, nx,nxy, ta); } + + // 2D x-y plane + template + int operator()(CT tx, CT ty, const CT *sx, const CT *sy, + const DT *sa, unsigned long ihi, unsigned long jhi, + unsigned long nx, DT &ta) + { + return teca_coordinate_util::interpolate_nearest(tx,ty, + sx,sy,sa, ihi,jhi, nx, ta); + } }; +/// First order interpolant specialization template<> struct interpolate_t<1> { + // 3D template int operator()(CT tx, CT ty, CT tz, const CT *sx, const CT *sy, const CT *sz, const DT *sa, unsigned long ihi, unsigned long jhi, @@ -485,14 +656,22 @@ template<> struct interpolate_t<1> return teca_coordinate_util::interpolate_linear(tx,ty,tz, sx,sy,sz,sa, ihi,jhi,khi, nx,nxy, ta); } + + // 2D x-y plane + template + int operator()(CT tx, CT ty, const CT *sx, const CT *sy, + const DT *sa, unsigned long ihi, unsigned long jhi, + unsigned long nx, DT &ta) + { + return teca_coordinate_util::interpolate_linear(tx,ty, + sx,sy,sa, ihi,jhi, nx, ta); + } }; -// return 0 if the centering is one of the values defined -// in teca_array_attributes +/// return 0 if the centering is one of the values defined in teca_array_attributes int validate_centering(int centering); -// convert from a cell extent to a face, edge or point centered -// extent +/// convert from a cell extent to a face, edge or point centered extent template int convert_cell_extent(num_t *extent, int centering) { @@ -539,12 +718,98 @@ int convert_cell_extent(num_t *extent, int centering) return 0; } -// given carteisan mesh metadata extract whole_extent and bounds -// if bounds metadata is not already present then it is initialized -// from coordinate arrays. It's an error if whole_extent or coordinate -// arrays are not present. return zero if successful. 
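A sketch of dispatching through the order-of-accuracy functor described above, here selecting the linear (order 1) 2D interpolant; the grid and field values are hypothetical and the functor is assumed to live in the teca_coordinate_util namespace with the rest of this header:

    #include "teca_coordinate_util.h"
    #include <iostream>

    int main()
    {
        double x[] = {0.0, 1.0, 2.0};
        double y[] = {0.0, 1.0, 2.0};

        // a 3 by 3 field stored row major, nx = 3
        double f[] = {0.0, 1.0, 2.0,
                      3.0, 4.0, 5.0,
                      6.0, 7.0, 8.0};

        double val = 0.0;
        teca_coordinate_util::interpolate_t<1> interp;
        if (interp(0.5, 0.5, x, y, f, 2ul, 2ul, 3ul, val))
        {
            std::cerr << "the target point is outside of the source mesh" << std::endl;
            return -1;
        }

        std::cout << "interpolated value = " << val << std::endl; // expect 2
        return 0;
    }
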
+/** Given Cartesian mesh metadata extract whole_extent and bounds + * if bounds metadata is not already present then it is initialized + * from coordinate arrays. It's an error if whole_extent or coordinate + * arrays are not present. return zero if successful. + */ int get_cartesian_mesh_extent(const teca_metadata &md, unsigned long *whole_extent, double *bounds); +/// get the mesh's bounds from the coordinate axis arrays +int get_cartesian_mesh_bounds(const const_p_teca_variant_array x, + const const_p_teca_variant_array y, const const_p_teca_variant_array z, + double *bounds); + +/** Check that one Cartesian region covers the other coordinates must be in + * ascending order. assumes that both regions are specified in ascending order. + */ +template +int covers_ascending(const num_t *whole, const num_t *part) +{ + if ((part[0] >= whole[0]) && (part[0] <= whole[1]) && + (part[1] >= whole[0]) && (part[1] <= whole[1]) && + (part[2] >= whole[2]) && (part[2] <= whole[3]) && + (part[3] >= whole[2]) && (part[3] <= whole[3]) && + (part[4] >= whole[4]) && (part[4] <= whole[5]) && + (part[5] >= whole[4]) && (part[5] <= whole[5])) + return 1; + return 0; +} + +/** Check that one Cartesian region covers the other, taking into account the + * order of the coordinates. assumes that the regions are specified in the same + * orientation. + */ +template +int covers(const num_t *whole, const num_t *part) +{ + bool x_ascend = whole[0] <= whole[1]; + bool y_ascend = whole[2] <= whole[3]; + bool z_ascend = whole[4] <= whole[5]; + if (((x_ascend && + (part[0] >= whole[0]) && (part[0] <= whole[1]) && + (part[1] >= whole[0]) && (part[1] <= whole[1])) || + (!x_ascend && + (part[0] <= whole[0]) && (part[0] >= whole[1]) && + (part[1] <= whole[0]) && (part[1] >= whole[1]))) && + ((y_ascend && + (part[2] >= whole[2]) && (part[2] <= whole[3]) && + (part[3] >= whole[2]) && (part[3] <= whole[3])) || + (!y_ascend && + (part[2] <= whole[2]) && (part[2] >= whole[3]) && + (part[3] <= whole[2]) && (part[3] >= whole[3]))) && + ((z_ascend && + (part[4] >= whole[4]) && (part[4] <= whole[5]) && + (part[5] >= whole[4]) && (part[5] <= whole[5])) || + (!z_ascend && + (part[4] <= whole[4]) && (part[4] >= whole[5]) && + (part[5] <= whole[4]) && (part[5] >= whole[5])))) + return 1; + return 0; +} + +/** check that two Cartesian regions have the same orientation ie they are + * either both specified in ascending or descending order. + */ +template +int same_orientation(const num_t *whole, const num_t *part) +{ + if ((((whole[0] <= whole[1]) && (part[0] <= part[1])) || + ((whole[0] >= whole[1]) && (part[0] >= part[1]))) && + (((whole[2] <= whole[3]) && (part[2] <= part[3])) || + ((whole[2] >= whole[3]) && (part[2] >= part[3]))) && + (((whole[4] <= whole[5]) && (part[4] <= part[5])) || + ((whole[4] >= whole[5]) && (part[4] >= part[5])))) + return 1; + return 0; +} + +/** where array dimensions specified by nx_max, ny_max, and nz_max are 1, and + * the extent would be out of bounds, set the extent to [0, 0]. If verbose is + * set, a warning is reported when the extent was clamped in one or more + * directions. The return is non zero if any direction was clamped and 0 + * otherwise. + */ +int clamp_dimensions_of_one(unsigned long nx_max, unsigned long ny_max, + unsigned long nz_max, unsigned long *extent, bool verbose); + +/** Return 0 if the passed extent does not exceed array dimensions specified in + * nx_max, ny_max, and nz_max. If verbose is set, an error is reported via + * TECA_ERROR when the extent would be out of bounds. 
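A sketch of the region containment check, testing whether a requested lat-lon subset lies inside the whole mesh bounds; the bounds values are illustrative and ordered [x0, x1, y0, y1, z0, z1]:

    #include "teca_coordinate_util.h"
    #include <iostream>

    int main()
    {
        double whole[] = {0.0, 360.0, -90.0, 90.0, 0.0, 0.0};
        double part[]  = {0.0,  90.0, -30.0, 30.0, 0.0, 0.0};

        // covers() handles ascending or descending axes, provided both
        // regions are specified in the same orientation
        if (!teca_coordinate_util::covers(whole, part))
        {
            std::cerr << "the requested bounds are not covered" << std::endl;
            return -1;
        }

        std::cout << "the requested bounds are covered" << std::endl;
        return 0;
    }
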
+ */ +int validate_extent(unsigned long nx_max, unsigned long ny_max, + unsigned long nz_max, unsigned long *extent, bool verbose); + }; #endif diff --git a/data/teca_curvilinear_mesh.h b/data/teca_curvilinear_mesh.h index dff79b9b4..5690c429b 100644 --- a/data/teca_curvilinear_mesh.h +++ b/data/teca_curvilinear_mesh.h @@ -5,7 +5,7 @@ #include "teca_shared_object.h" TECA_SHARED_OBJECT_FORWARD_DECL(teca_curvilinear_mesh) -/// data on a physically uniform curvilinear mesh +/// Data on a physically uniform curvilinear mesh. class teca_curvilinear_mesh : public teca_mesh { public: diff --git a/data/teca_database.h b/data/teca_database.h index 87b1f37fd..11df3a08c 100644 --- a/data/teca_database.h +++ b/data/teca_database.h @@ -3,17 +3,19 @@ #include "teca_dataset.h" #include "teca_table.h" -#include "teca_database_fwd.h" +#include "teca_shared_object.h" #include "teca_table_collection.h" #include class teca_binary_stream; -/// teca_database - A collection of named tables +TECA_SHARED_OBJECT_FORWARD_DECL(teca_database) + +/// A collection of named tables. /** -A dataset consisting of a collection of named tables. This -is a thin wrapper around the teca_table_collection implementing -the teca_dataset API. -*/ + * A dataset consisting of a collection of named tables. This + * is a thin wrapper around the teca_table_collection implementing + * the teca_dataset API. + */ class teca_database : public teca_dataset { public: diff --git a/data/teca_database_fwd.h b/data/teca_database_fwd.h deleted file mode 100644 index e8f784964..000000000 --- a/data/teca_database_fwd.h +++ /dev/null @@ -1,7 +0,0 @@ -#ifndef teca_database_fwd_h -#define teca_database_fwd_h - -#include "teca_shared_object.h" -TECA_SHARED_OBJECT_FORWARD_DECL(teca_database) - -#endif diff --git a/data/teca_dataset_util.h b/data/teca_dataset_util.h index e2e90b515..07f4ccc0d 100644 --- a/data/teca_dataset_util.h +++ b/data/teca_dataset_util.h @@ -10,6 +10,7 @@ #include "teca_table.h" #include "teca_database.h" +/// @cond template struct teca_dataset_tt {}; @@ -41,7 +42,22 @@ DECLARE_DATASET_TT(teca_curvilinear_mesh, 6) case _code: \ return teca_dataset_new<_code>::New(); \ break; +/// @endcond + +/// Constructs a new instance of teca_dataset from the provided type code. +/** The type codes are: + * + * | code | teca_dataset | + * | ---- | ------------ | + * | 1 | teca_table | + * | 2 | teca_database | + * | 3 | teca_cartesian_mesh | + * | 4 | teca_uniform_cartesian_mesh | + * | 5 | teca_arakawa_c_grid | + * | 6 | teca_curvilinear_mesh | + * + */ struct teca_dataset_factory { static p_teca_dataset New(int code) diff --git a/data/teca_mesh.h b/data/teca_mesh.h index 51e01ec7f..8196fcf29 100644 --- a/data/teca_mesh.h +++ b/data/teca_mesh.h @@ -1,18 +1,20 @@ #ifndef teca_mesh_h #define teca_mesh_h -#include "teca_mesh_fwd.h" #include "teca_dataset.h" #include "teca_metadata.h" #include "teca_array_collection.h" +#include "teca_shared_object.h" -/// a base class for geometric data +TECA_SHARED_OBJECT_FORWARD_DECL(teca_mesh) + +/// A base class for geometric data. /** -The mesh declares containers for typical geometricly associated data -such as point, cell, face and edge centered data arrays and defines -the API's for accessing them. API's for accessing common metadata such -as time related metadata are declared here. -*/ + * The mesh declares containers for typical geometrically associated data + * such as point, cell, face and edge centered data arrays and defines + * the APIs for accessing them. 
APIs for accessing common metadata such + * as time related metadata are declared here. + */ class teca_mesh : public teca_dataset { public: @@ -24,8 +26,8 @@ class teca_mesh : public teca_dataset TECA_DATASET_METADATA(time_units, std::string, 1) TECA_DATASET_METADATA(time_step, unsigned long, 1) - // set/get array attribute metadata - TECA_DATASET_METADATA(array_attributes, teca_metadata, 1) + // set/get attribute metadata + TECA_DATASET_METADATA(attributes, teca_metadata, 1) // get the array collection for the given centering // the centering enumeration is defined in teca_array_attributes diff --git a/data/teca_mesh_fwd.h b/data/teca_mesh_fwd.h deleted file mode 100644 index 92b2b3aa0..000000000 --- a/data/teca_mesh_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_mesh_fwd_h -#define teca_mesh_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_mesh) - -#endif diff --git a/data/teca_priority_queue.h b/data/teca_priority_queue.h new file mode 100644 index 000000000..4a5debb9f --- /dev/null +++ b/data/teca_priority_queue.h @@ -0,0 +1,460 @@ +#ifndef teca_priority_queue_h +#define teca_priority_queue_h + +#include +#include +#include +#include +#include +#include + + +/// @cond + +// use one of the following aliases for key_map_t. key_map_t +// is the type of container used to hold the locations of user provided +// keys in the heap. +// for keys that are not ordinals 0 to N, use the mapped_key_t alias +// for contiguous keys 0 to N (faster), use the contiguous_key_t alias +template +using mapped_key_t = std::map; + +using contiguous_key_t = std::vector; + +// use one of the following objects to provide the priority for the +// given key. these objects internally point to the container index by +// key value holding the associated priority. +// for keys that are not ordinals 0 to N, use the mapped_key_priority_t alias +// for contiguous keys 0 to N (faster), use the contiguous_key_priority_t alias +template +struct mapped_key_priority +{ + using key_map_t = mapped_key_t; + + mapped_key_priority(std::map &mp) : m_map(&mp) + {} + + priority_t operator()(key_t i) + { return (*m_map)[i]; } + + std::map *m_map; +}; + +template +struct contiguous_key_priority +{ + using key_map_t = contiguous_key_t; + + contiguous_key_priority(const std::vector &vec) : + m_vec(vec.data()) + {} + + priority_t operator()(key_t i) + { return m_vec[i]; } + + const priority_t *m_vec; +}; + +// forward declare the queue +template , + typename key_map_t=contiguous_key_t> +class teca_priority_queue; + +// pointer type +template +using p_teca_priority_queue = std::shared_ptr< + teca_priority_queue>; + +/// @endcond + +/** @brief + * An indirect priority queue that supports random access modification of + * priority. + * + * @details + * an indirect priority queue that supports random access modification of + * priority the queue works with user provided keys and lookup functor that + * converts keys to priorities. + * + * ### template parameters: + * + * | name | description | + * | ---- | ----------- | + * | key_t | type of the user provided keys | + * | lookup_t | callable that implements: priority_t operator()(key_t key) | + * | comp_t | callable that implements the predicate: bool(key_t, key_t), | + * | | used to enforce heap order. (std::less) | + * | key_map_t | type of container used to track the position in the heap | + * | | of the keys. The default, a vector, is only valid for | + * | | interger ordinals from 0 to N. Use mapped_key_t | + * | | for all other cases. 
(contiguous_key_t) | + * + * ### typical usage: + * + * construct a container of objects to prioritize, and initialize a lookup + * object that given a key returns the priority of the coresponding object. + * create an instance of the priority_queue and push the key values. as keys + * are pushed heap ording is imposed, this is why objects need to be in place + * before pushing keys. when an object's priority has been changed one must + * call modified passing the key of the object. the location of each object is + * tracked and the queue will reprioritize itself after modification. + * + * ### recomendation: + * + * to obtain high performance, it's best to avoid using std::function for + * lookup operations. Instead, write a small functor so that the compiler + * can inline lookup calls. + * + * don't forget to change key_map_t to mapped_key_t if + * keys are not integer ordinals 0 to N. + */ +template +class teca_priority_queue +{ +public: + + ~teca_priority_queue() = default; + + // return a new instance, must pass the lookup operator that + // translates keys into priority values + static p_teca_priority_queue + New(lookup_t &lookup, unsigned long init_size=256, + unsigned long block_size=256) + { + p_teca_priority_queue ptr( + new teca_priority_queue< + key_t, lookup_t, comp_t, key_map_t>( + lookup, init_size, block_size)); + return ptr; + } + + // return true if the queue has no keys + bool empty() { return m_end == 0; } + + + /// add a value into the queue + void push(const key_t &key); + + /// free all resources and reset the queue to an empty state + void clear(); + + // restore heap condition after an id is modified + void modified(const key_t &key); + + // return the id at the top of the queue, and remove it. + // internal memory is not deallocated. + key_t pop(); + + // return the id in the top of queue + key_t peak(); + + // print the state of the queue + void to_stream(std::ostream &os, bool priorities = true); + +protected: + teca_priority_queue() = default; + + teca_priority_queue(const teca_priority_queue &) = delete; + void operator=(const teca_priority_queue &) = delete; + + // initialize the queue with an comperator, the initial size, and declare + // the amount to grow the queue by during dynamic resizing. 
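A sketch of the typical usage described above, assuming the lookup functor takes the key type then the priority type as template arguments and that the queue's comparator defaults to std::less:

    #include "teca_priority_queue.h"
    #include <iostream>
    #include <vector>

    int main()
    {
        // priorities indexed by integer keys 0 to N, so the contiguous
        // key map and lookup can be used
        std::vector<double> priority = {5.0, 1.0, 3.0, 4.0, 2.0};

        contiguous_key_priority<unsigned long, double> lookup(priority);

        auto q = teca_priority_queue<unsigned long,
            contiguous_key_priority<unsigned long, double>>::New(lookup);

        for (unsigned long i = 0; i < priority.size(); ++i)
            q->push(i);

        // after changing a priority in place, notify the queue so that
        // it can restore heap order
        priority[0] = 0.5;
        q->modified(0);

        // keys come off in order of increasing priority
        while (!q->empty())
            std::cout << q->pop() << " ";
        std::cout << std::endl;

        return 0;
    }
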
+ template + teca_priority_queue(lookup_t lookup, unsigned long init_size, + unsigned long block_size, + typename std::enable_if, u>::value>::type * = 0); + + template + teca_priority_queue(lookup_t lookup, unsigned long init_size, + unsigned long block_size, + typename std::enable_if, u>::value>::type * = 0); + + // grow the queue to the new size + template + void grow(unsigned long n, + typename std::enable_if, u>::value>::type * = 0); + + // grow the queue to the new size + template + void grow(unsigned long n, + typename std::enable_if, u>::value>::type * = 0); + + // restore the heap condition starting from here + // and working up + void up_heapify(unsigned long id); + + // restore the heap condition starting from here + // and working down + void down_heapify(unsigned long id); + + // exchange two items + void swap(unsigned long i, unsigned long j); + + // helpers for walking tree + unsigned long left_child(unsigned long a_id) + { return a_id*2; } + + unsigned long right_child(unsigned long a_id) + { return a_id*2 + 1; } + + unsigned long parent(unsigned long a_id) + { return a_id/2; } + + +private: + lookup_t m_lookup; // callable to turn keys into priority values + std::vector m_ids; // array of keys + key_map_t m_locs; // map indexed by key to find the current position in the queue + unsigned long m_size; // size of the key buffer + unsigned long m_end; // index of the last key in the queue + unsigned long m_block_size; // amount to grow the dynamically alloacted buffers by +}; + + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::push(const key_t &key) +{ + // extend the queue + ++m_end; + + // verify that there is space, if not allocate it + if (m_end >= m_size) + this->grow(m_size + m_block_size); + + // add key and it's location + m_ids[m_end] = key; + m_locs[key] = m_end; + + // restore heap condition + this->up_heapify(m_end); +} + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::clear() +{ + m_ids.clear(); + m_locs.clear(); + m_size = 0; + m_end = 0; +} + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::modified(const key_t &key) +{ + // find the loc of the modified key + unsigned long id = m_locs[key]; + // fix up then down + this->up_heapify(id); + this->down_heapify(id); +} + +// -------------------------------------------------------------------------- +template +key_t teca_priority_queue::pop() +{ + key_t id_1 = m_ids[1]; + if (m_end > 0) + { + this->swap(1, m_end); + --m_end; + this->down_heapify(1); + } + return id_1; +} + +// -------------------------------------------------------------------------- +template +key_t teca_priority_queue::peak() +{ + return m_ids[1]; +} + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::to_stream(std::ostream &os, bool priorities) +{ + long log_end = std::log2(m_end); + long n_rows = log_end + 1; + unsigned long q = 0; + for (long i = 0; i < n_rows; ++i) + { + if (q > m_end) + break; + + long n_elem = 1 << i; + long isp = (1 << (n_rows - 1 - i)) - 1; + long bsp = 2*isp + 1; + + for (long j = 0; j < isp; ++j) + os << " "; + + for (long j = 0; (j < n_elem) && (q < m_end); ++j) + { + if (priorities) + os << m_lookup(m_ids[++q]); + else + os << m_ids[++q]; + for (long k = 0; k < bsp; ++k) + os << " "; + } + + os << std::endl; + } +} + +// 
-------------------------------------------------------------------------- +template +template +teca_priority_queue::teca_priority_queue(lookup_t lookup, + unsigned long init_size, unsigned long block_size, + typename std::enable_if, u>::value>::type *) : + m_lookup(lookup), m_size(init_size), m_end(0), + m_block_size(block_size) +{ + m_ids.resize(init_size); + m_locs.resize(init_size); +} + +// -------------------------------------------------------------------------- +template +template +teca_priority_queue::teca_priority_queue(lookup_t lookup, + unsigned long init_size, unsigned long block_size, + typename std::enable_if, u>::value>::type *) : + m_lookup(lookup), m_size(init_size), m_end(0), + m_block_size(block_size) +{ + m_ids.resize(init_size); +} + +// -------------------------------------------------------------------------- +template +template +void teca_priority_queue::grow(unsigned long n, + typename std::enable_if, u>::value>::type *) +{ + m_ids.resize(n); + m_locs.resize(n); + m_size = n; +} + +// -------------------------------------------------------------------------- +template +template +void teca_priority_queue::grow(unsigned long n, + typename std::enable_if, u>::value>::type *) +{ + m_ids.resize(n); + m_size = n; +} + + + // -------------------------------------------------------------------------- +template +void teca_priority_queue::up_heapify(unsigned long id) +{ + // if at tree root then stop + if (id < 2) + return; + + // else find parent and enforce heap order + comp_t comp; + unsigned long id_p = parent(id); + if (comp(m_lookup(m_ids[id]), m_lookup(m_ids[id_p]))) + this->swap(id, id_p); + + // continue up toward the root + this->up_heapify(id_p); +} + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::down_heapify(unsigned long id) +{ + // if no current node then stop + if (id > m_end) + return; + + // if no left child then stop + unsigned long lc = left_child(id); + if (lc > m_end) + return; + + // find the smaller child + comp_t comp; + unsigned long smallc = lc; + unsigned long rc = right_child(id); + if (rc <= m_end) + smallc = comp(m_lookup(m_ids[lc]), + m_lookup(m_ids[rc])) ? lc : rc; + + // if in heap order then stop + if (comp(m_lookup(m_ids[id]), m_lookup(m_ids[smallc]))) + return; + + // else swap and continue + this->swap(id, smallc); + this->down_heapify(smallc); +} + +// -------------------------------------------------------------------------- +template +void teca_priority_queue::swap(unsigned long i, unsigned long j) +{ + key_t key_i = m_ids[i]; + key_t key_j = m_ids[j]; + // exchange keys + m_ids[i] = key_j; + m_ids[j] = key_i; + // update locs + m_locs[key_j] = i; + m_locs[key_i] = j; +} + +template +std::ostream & operator<<(std::ostream &os, p_teca_priority_queue &q) +{ + q->to_stream(os); + return os; +} + +#endif diff --git a/data/teca_table.h b/data/teca_table.h index a3b372eff..241f42d37 100644 --- a/data/teca_table.h +++ b/data/teca_table.h @@ -12,10 +12,10 @@ TECA_SHARED_OBJECT_FORWARD_DECL(teca_table) -/** -A collection of collumnar data with row based -accessors and communication and I/O support. -*/ +/** @brief + * A collection of columnar data with row based + * accessors and communication and I/O support. + */ class teca_table : public teca_dataset { public: @@ -34,8 +34,8 @@ class teca_table : public teca_dataset // define the table columns. requires name,type pairs // for ex. 
define("c1",int(),"c2",float()) creates a - // table with 2 columns the first storing int's the - // second storing float's. + // table with 2 columns the first storing int the + // second storing float. template void declare_columns(nT &&col_name, cT col_type, oT &&...args); @@ -55,7 +55,7 @@ class teca_table : public teca_dataset const_p_teca_variant_array get_column(unsigned int i) const; const_p_teca_variant_array get_column(const std::string &col_name) const; - // test for the existance of a specific column + // test for the existence of a specific column bool has_column(const std::string &col_name) const { return m_impl->columns->has(col_name); } @@ -103,7 +103,7 @@ class teca_table : public teca_dataset // return an integer identifier uniquely naming the dataset type int get_type_code() const override; - // covert to bool. true if the dataset is not empty. + // covert to boolean. true if the dataset is not empty. // otherwise false. explicit operator bool() const noexcept { return !this->empty(); } diff --git a/data/teca_table_collection.h b/data/teca_table_collection.h index c2eb9bc95..1bc2a4a68 100644 --- a/data/teca_table_collection.h +++ b/data/teca_table_collection.h @@ -1,16 +1,16 @@ #ifndef teca_table_collection_h #define teca_table_collection_h -#include "teca_table_collection_fwd.h" #include "teca_table.h" +#include "teca_shared_object.h" + #include #include #include -// a collection of named tables -/** -A collection of named tables -*/ +TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_collection) + +/// A collection of named tables. class teca_table_collection { public: diff --git a/data/teca_table_collection_fwd.h b/data/teca_table_collection_fwd.h deleted file mode 100644 index 732902648..000000000 --- a/data/teca_table_collection_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_table_collection_fwd_h -#define teca_table_collection_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_table_collection) - -#endif diff --git a/data/teca_uniform_cartesian_mesh.h b/data/teca_uniform_cartesian_mesh.h index bd7ef44d1..f6e31c66c 100644 --- a/data/teca_uniform_cartesian_mesh.h +++ b/data/teca_uniform_cartesian_mesh.h @@ -1,10 +1,12 @@ #ifndef teca_uniform_cartesian_mesh_h #define teca_uniform_cartesian_mesh_h -#include "teca_uniform_cartesian_mesh_fwd.h" #include "teca_mesh.h" +#include "teca_shared_object.h" -/// data on a uniform cartesian mesh +TECA_SHARED_OBJECT_FORWARD_DECL(teca_uniform_cartesian_mesh) + +/// Data on a uniform cartesian mesh. class teca_uniform_cartesian_mesh : public teca_mesh { public: @@ -22,19 +24,19 @@ class teca_uniform_cartesian_mesh : public teca_mesh TECA_DATASET_METADATA(extent, unsigned long, 6) TECA_DATASET_METADATA(local_extent, unsigned long, 6) - // return a unique string identifier + /// return a unique string identifier std::string get_class_name() const override { return "teca_uniform_cartesian_mesh"; } - // return a unique integer identifier + /// return a unique integer identifier int get_type_code() const override; - // copy data and metadata. shallow copy uses reference - // counting, while copy duplicates the data. + /// copy data and metadata. shallow copy uses reference + /// counting, while copy duplicates the data. 
void copy(const const_p_teca_dataset &) override; void shallow_copy(const p_teca_dataset &) override; - // swap internals of the two objects + /// swap internals of the two objects void swap(p_teca_dataset &) override; protected: diff --git a/data/teca_uniform_cartesian_mesh_fwd.h b/data/teca_uniform_cartesian_mesh_fwd.h deleted file mode 100644 index 79a66e960..000000000 --- a/data/teca_uniform_cartesian_mesh_fwd.h +++ /dev/null @@ -1,8 +0,0 @@ -#ifndef teca_uniform_cartesian_mesh_fwd_h -#define teca_uniform_cartesian_mesh_fwd_h - -#include "teca_shared_object.h" - -TECA_SHARED_OBJECT_FORWARD_DECL(teca_uniform_cartesian_mesh) - -#endif diff --git a/doc/release/4.1.0.md b/doc/release/4.1.0.md new file mode 100644 index 000000000..ce91a2e50 --- /dev/null +++ b/doc/release/4.1.0.md @@ -0,0 +1,26 @@ +## Release Notes for TECA 4.1.0 +Thu May 6 12:10:26 PM PDT 2021 + +* new mask below surface algorithm, inetgrated into all the apps +* new unpack NetCDF packed data stage +* add coordinate normalization stage transform for longitude from -180 to 180 + to 0 to 360 +* new IWV algorithm +* new time based file layouts (daily, monthly, yearly, seasonal) +* BARD app can now generate output fields weighted by AR probabilities +* new rename variables stage +* improvements to cartesian_mesh_source for remeshing +* cf_reader correctly detects centering and per field dimensionality +* multi_cf_reader MCF file format improvements. Add support for reader + properties, globablly and per reader. +* cf_reader option to produce 2D field when the 3'rd dimension is length 1 +* Cartesian meshes can now contain both 2D and 3D arrays, metadata annotations + are used to differentiate at run time +* metadata probe improvements to report per-field centering +* new remeshing capability deployed in cf_restripe and apps that utilize + elevation mask +* improvements to the user guide +* refactored source code documentation to be compatible with Doxygen, +* published Doxygen on the rtd site : https://teca.readthedocs.io/en/integrating_breathe/doxygen/index.html +* new capabilities in the cf_restripe command line application for remeshing +* 25+ bug fixes diff --git a/doc/rtd/Doxyfile b/doc/rtd/Doxyfile new file mode 100644 index 000000000..aa8d9ea3f --- /dev/null +++ b/doc/rtd/Doxyfile @@ -0,0 +1,2547 @@ +# Doxyfile 1.8.20 + + +# This file describes the settings to be used by the documentation system +# doxygen (www.doxygen.org) for a project. +# +# All text after a double hash (##) is considered a comment and is placed in +# front of the TAG it is preceding. +# +# All text after a single hash (#) is considered a comment and will be ignored. +# The format is: +# TAG = value [value, ...] +# For lists, items can also be appended using: +# TAG += value [value, ...] +# Values that contain spaces should be placed between quotes (\" \"). + +#--------------------------------------------------------------------------- +# Project related configuration options +#--------------------------------------------------------------------------- + +# This tag specifies the encoding used for all characters in the configuration +# file that follow. The default is UTF-8 which is also the encoding used for all +# text before the first occurrence of this tag. Doxygen uses libiconv (or the +# iconv built into libc) for the transcoding. See +# https://www.gnu.org/software/libiconv/ for the list of possible encodings. +# The default value is: UTF-8. 
+ +DOXYFILE_ENCODING = UTF-8 + +# The PROJECT_NAME tag is a single word (or a sequence of words surrounded by +# double-quotes, unless you are using Doxywizard) that should identify the +# project for which the documentation is generated. This name is used in the +# title of most generated pages and in a few other places. +# The default value is: My Project. + +PROJECT_NAME = "TECA" + +# The PROJECT_NUMBER tag can be used to enter a project or revision number. This +# could be handy for archiving the generated documentation or if some version +# control system is used. + +PROJECT_NUMBER = + +# Using the PROJECT_BRIEF tag one can provide an optional one line description +# for a project that appears at the top of each page and should give viewer a +# quick idea about the purpose of the project. Keep the description short. + +PROJECT_BRIEF = "The Toolkit for Extreme Climate Analysis" + +# With the PROJECT_LOGO tag one can specify a logo or an icon that is included +# in the documentation. The maximum height of the logo should not exceed 55 +# pixels and the maximum width should not exceed 200 pixels. Doxygen will copy +# the logo to the output directory. + +PROJECT_LOGO = + +# The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path +# into which the generated documentation will be written. If a relative path is +# entered, it will be relative to the location where doxygen was started. If +# left blank the current directory will be used. + +OUTPUT_DIRECTORY = _build + +# If the CREATE_SUBDIRS tag is set to YES then doxygen will create 4096 sub- +# directories (in 2 levels) under the output directory of each output format and +# will distribute the generated files over these directories. Enabling this +# option can be useful when feeding doxygen a huge amount of source files, where +# putting all generated files in the same directory would otherwise causes +# performance problems for the file system. +# The default value is: NO. + +CREATE_SUBDIRS = NO + +# If the ALLOW_UNICODE_NAMES tag is set to YES, doxygen will allow non-ASCII +# characters to appear in the names of generated files. If set to NO, non-ASCII +# characters will be escaped, for example _xE3_x81_x84 will be used for Unicode +# U+3044. +# The default value is: NO. + +ALLOW_UNICODE_NAMES = NO + +# The OUTPUT_LANGUAGE tag is used to specify the language in which all +# documentation generated by doxygen is written. Doxygen will use this +# information to generate all constant output in the proper language. +# Possible values are: Afrikaans, Arabic, Armenian, Brazilian, Catalan, Chinese, +# Chinese-Traditional, Croatian, Czech, Danish, Dutch, English (United States), +# Esperanto, Farsi (Persian), Finnish, French, German, Greek, Hungarian, +# Indonesian, Italian, Japanese, Japanese-en (Japanese with English messages), +# Korean, Korean-en (Korean with English messages), Latvian, Lithuanian, +# Macedonian, Norwegian, Persian (Farsi), Polish, Portuguese, Romanian, Russian, +# Serbian, Serbian-Cyrillic, Slovak, Slovene, Spanish, Swedish, Turkish, +# Ukrainian and Vietnamese. +# The default value is: English. + +OUTPUT_LANGUAGE = English + +# The OUTPUT_TEXT_DIRECTION tag is used to specify the direction in which all +# documentation generated by doxygen is written. Doxygen will use this +# information to generate all generated output in the proper direction. +# Possible values are: None, LTR, RTL and Context. +# The default value is: None. 
+ +OUTPUT_TEXT_DIRECTION = None + +# If the BRIEF_MEMBER_DESC tag is set to YES, doxygen will include brief member +# descriptions after the members that are listed in the file and class +# documentation (similar to Javadoc). Set to NO to disable this. +# The default value is: YES. + +BRIEF_MEMBER_DESC = YES + +# If the REPEAT_BRIEF tag is set to YES, doxygen will prepend the brief +# description of a member or function before the detailed description +# +# Note: If both HIDE_UNDOC_MEMBERS and BRIEF_MEMBER_DESC are set to NO, the +# brief descriptions will be completely suppressed. +# The default value is: YES. + +REPEAT_BRIEF = YES + +# This tag implements a quasi-intelligent brief description abbreviator that is +# used to form the text in various listings. Each string in this list, if found +# as the leading text of the brief description, will be stripped from the text +# and the result, after processing the whole list, is used as the annotated +# text. Otherwise, the brief description is used as-is. If left blank, the +# following values are used ($name is automatically replaced with the name of +# the entity):The $name class, The $name widget, The $name file, is, provides, +# specifies, contains, represents, a, an and the. + +ABBREVIATE_BRIEF = "The $name class" \ + "The $name widget" \ + "The $name file" \ + is \ + provides \ + specifies \ + contains \ + represents \ + a \ + an \ + the + +# If the ALWAYS_DETAILED_SEC and REPEAT_BRIEF tags are both set to YES then +# doxygen will generate a detailed section even if there is only a brief +# description. +# The default value is: NO. + +ALWAYS_DETAILED_SEC = YES + +# If the INLINE_INHERITED_MEMB tag is set to YES, doxygen will show all +# inherited members of a class in the documentation of that class as if those +# members were ordinary class members. Constructors, destructors and assignment +# operators of the base classes will not be shown. +# The default value is: NO. + +INLINE_INHERITED_MEMB = NO + +# If the FULL_PATH_NAMES tag is set to YES, doxygen will prepend the full path +# before files name in the file list and in the header files. If set to NO the +# shortest path that makes the file name unique will be used +# The default value is: YES. + +FULL_PATH_NAMES = YES + +# The STRIP_FROM_PATH tag can be used to strip a user-defined part of the path. +# Stripping is only done if one of the specified strings matches the left-hand +# part of the path. The tag can be used to show relative paths in the file list. +# If left blank the directory from which doxygen is run is used as the path to +# strip. +# +# Note that you can specify absolute paths here, but also relative paths, which +# will be relative from the directory where doxygen is started. +# This tag requires that the tag FULL_PATH_NAMES is set to YES. + +STRIP_FROM_PATH = ../../.. + +# The STRIP_FROM_INC_PATH tag can be used to strip a user-defined part of the +# path mentioned in the documentation of a class, which tells the reader which +# header file to include in order to use a class. If left blank only the name of +# the header file containing the class definition is used. Otherwise one should +# specify the list of include paths that are normally passed to the compiler +# using the -I flag. + +STRIP_FROM_INC_PATH = + +# If the SHORT_NAMES tag is set to YES, doxygen will generate much shorter (but +# less readable) file names. This can be useful is your file systems doesn't +# support long names like on DOS, Mac, or CD-ROM. +# The default value is: NO. 
+ +SHORT_NAMES = NO + +# If the JAVADOC_AUTOBRIEF tag is set to YES then doxygen will interpret the +# first line (until the first dot) of a Javadoc-style comment as the brief +# description. If set to NO, the Javadoc-style will behave just like regular Qt- +# style comments (thus requiring an explicit @brief command for a brief +# description.) +# The default value is: NO. + +JAVADOC_AUTOBRIEF = NO + +# If the JAVADOC_BANNER tag is set to YES then doxygen will interpret a line +# such as +# /*************** +# as being the beginning of a Javadoc-style comment "banner". If set to NO, the +# Javadoc-style will behave just like regular comments and it will not be +# interpreted by doxygen. +# The default value is: NO. + +JAVADOC_BANNER = NO + +# If the QT_AUTOBRIEF tag is set to YES then doxygen will interpret the first +# line (until the first dot) of a Qt-style comment as the brief description. If +# set to NO, the Qt-style will behave just like regular Qt-style comments (thus +# requiring an explicit \brief command for a brief description.) +# The default value is: NO. + +QT_AUTOBRIEF = NO + +# The MULTILINE_CPP_IS_BRIEF tag can be set to YES to make doxygen treat a +# multi-line C++ special comment block (i.e. a block of //! or /// comments) as +# a brief description. This used to be the default behavior. The new default is +# to treat a multi-line C++ comment block as a detailed description. Set this +# tag to YES if you prefer the old behavior instead. +# +# Note that setting this tag to YES also means that rational rose comments are +# not recognized any more. +# The default value is: NO. + +MULTILINE_CPP_IS_BRIEF = NO + +# By default Python docstrings are displayed as preformatted text and doxygen's +# special commands cannot be used. By setting PYTHON_DOCSTRING to NO the +# doxygen's special commands can be used and the contents of the docstring +# documentation blocks is shown as doxygen documentation. +# The default value is: YES. + +PYTHON_DOCSTRING = NO + +# If the INHERIT_DOCS tag is set to YES then an undocumented member inherits the +# documentation from any documented member that it re-implements. +# The default value is: YES. + +INHERIT_DOCS = YES + +# If the SEPARATE_MEMBER_PAGES tag is set to YES then doxygen will produce a new +# page for each member. If set to NO, the documentation of a member will be part +# of the file/class/namespace that contains it. +# The default value is: NO. + +SEPARATE_MEMBER_PAGES = NO + +# The TAB_SIZE tag can be used to set the number of spaces in a tab. Doxygen +# uses this value to replace tabs by spaces in code fragments. +# Minimum value: 1, maximum value: 16, default value: 4. + +TAB_SIZE = 4 + +# This tag can be used to specify a number of aliases that act as commands in +# the documentation. An alias has the form: +# name=value +# For example adding +# "sideeffect=@par Side Effects:\n" +# will allow you to put the command \sideeffect (or @sideeffect) in the +# documentation, which will result in a user-defined paragraph with heading +# "Side Effects:". You can put \n's in the value part of an alias to insert +# newlines (in the resulting output). You can put ^^ in the value part of an +# alias to insert a newline as if a physical newline was in the original file. 
+# When you need a literal { or } or , in the value part of an alias you have to +# escape them by means of a backslash (\), this can lead to conflicts with the +# commands \{ and \} for these it is advised to use the version @{ and @} or use +# a double escape (\\{ and \\}) + +ALIASES = + +#ALIASES = "rst=\verbatim embed:rst" +#ALIASES += "endrst=\endverbatim" +#ALIASES += "rststar=\verbatim embed:rst:leading-asterisk" +#ALIASES += "endrststar=\endverbatim" + +# Set the OPTIMIZE_OUTPUT_FOR_C tag to YES if your project consists of C sources +# only. Doxygen will then generate output that is more tailored for C. For +# instance, some of the names that are used will be different. The list of all +# members will be omitted, etc. +# The default value is: NO. + +OPTIMIZE_OUTPUT_FOR_C = NO + +# Set the OPTIMIZE_OUTPUT_JAVA tag to YES if your project consists of Java or +# Python sources only. Doxygen will then generate output that is more tailored +# for that language. For instance, namespaces will be presented as packages, +# qualified scopes will look different, etc. +# The default value is: NO. + +OPTIMIZE_OUTPUT_JAVA = NO + +# Set the OPTIMIZE_FOR_FORTRAN tag to YES if your project consists of Fortran +# sources. Doxygen will then generate output that is tailored for Fortran. +# The default value is: NO. + +OPTIMIZE_FOR_FORTRAN = NO + +# Set the OPTIMIZE_OUTPUT_VHDL tag to YES if your project consists of VHDL +# sources. Doxygen will then generate output that is tailored for VHDL. +# The default value is: NO. + +OPTIMIZE_OUTPUT_VHDL = NO + +# Set the OPTIMIZE_OUTPUT_SLICE tag to YES if your project consists of Slice +# sources only. Doxygen will then generate output that is more tailored for that +# language. For instance, namespaces will be presented as modules, types will be +# separated into more groups, etc. +# The default value is: NO. + +OPTIMIZE_OUTPUT_SLICE = NO + +# Doxygen selects the parser to use depending on the extension of the files it +# parses. With this tag you can assign which parser to use for a given +# extension. Doxygen has a built-in mapping, but you can override or extend it +# using this tag. The format is ext=language, where ext is a file extension, and +# language is one of the parsers supported by doxygen: IDL, Java, JavaScript, +# Csharp (C#), C, C++, D, PHP, md (Markdown), Objective-C, Python, Slice, VHDL, +# Fortran (fixed format Fortran: FortranFixed, free formatted Fortran: +# FortranFree, unknown formatted Fortran: Fortran. In the later case the parser +# tries to guess whether the code is fixed or free formatted code, this is the +# default for Fortran type files). For instance to make doxygen treat .inc files +# as Fortran files (default is PHP), and .f files as C (default is Fortran), +# use: inc=Fortran f=C. +# +# Note: For files without extension you can use no_extension as a placeholder. +# +# Note that for custom extensions you also need to set FILE_PATTERNS otherwise +# the files are not read by doxygen. + +EXTENSION_MAPPING = + +# If the MARKDOWN_SUPPORT tag is enabled then doxygen pre-processes all comments +# according to the Markdown format, which allows for more readable +# documentation. See https://daringfireball.net/projects/markdown/ for details. +# The output of markdown processing is further processed by doxygen, so you can +# mix doxygen, HTML, and XML commands with Markdown formatting. Disable only in +# case of backward compatibilities issues. +# The default value is: YES. 
+ +MARKDOWN_SUPPORT = YES + +# When the TOC_INCLUDE_HEADINGS tag is set to a non-zero value, all headings up +# to that level are automatically included in the table of contents, even if +# they do not have an id attribute. +# Note: This feature currently applies only to Markdown headings. +# Minimum value: 0, maximum value: 99, default value: 5. +# This tag requires that the tag MARKDOWN_SUPPORT is set to YES. + +TOC_INCLUDE_HEADINGS = 5 + +# When enabled doxygen tries to link words that correspond to documented +# classes, or namespaces to their corresponding documentation. Such a link can +# be prevented in individual cases by putting a % sign in front of the word or +# globally by setting AUTOLINK_SUPPORT to NO. +# The default value is: YES. + +AUTOLINK_SUPPORT = YES + +# If you use STL classes (i.e. std::string, std::vector, etc.) but do not want +# to include (a tag file for) the STL sources as input, then you should set this +# tag to YES in order to let doxygen match functions declarations and +# definitions whose arguments contain STL classes (e.g. func(std::string); +# versus func(std::string) {}). This also make the inheritance and collaboration +# diagrams that involve STL classes more complete and accurate. +# The default value is: NO. + +BUILTIN_STL_SUPPORT = YES + +# If you use Microsoft's C++/CLI language, you should set this option to YES to +# enable parsing support. +# The default value is: NO. + +CPP_CLI_SUPPORT = NO + +# Set the SIP_SUPPORT tag to YES if your project consists of sip (see: +# https://www.riverbankcomputing.com/software/sip/intro) sources only. Doxygen +# will parse them like normal C++ but will assume all classes use public instead +# of private inheritance when no explicit protection keyword is present. +# The default value is: NO. + +SIP_SUPPORT = NO + +# For Microsoft's IDL there are propget and propput attributes to indicate +# getter and setter methods for a property. Setting this option to YES will make +# doxygen to replace the get and set methods by a property in the documentation. +# This will only work if the methods are indeed getting or setting a simple +# type. If this is not the case, or you want to show the methods anyway, you +# should set this option to NO. +# The default value is: YES. + +IDL_PROPERTY_SUPPORT = NO + +# If member grouping is used in the documentation and the DISTRIBUTE_GROUP_DOC +# tag is set to YES then doxygen will reuse the documentation of the first +# member in the group (if any) for the other members of the group. By default +# all members of a group must be documented explicitly. +# The default value is: NO. + +DISTRIBUTE_GROUP_DOC = NO + +# If one adds a struct or class to a group and this option is enabled, then also +# any nested class or struct is added to the same group. By default this option +# is disabled and one has to add nested compounds explicitly via \ingroup. +# The default value is: NO. + +GROUP_NESTED_COMPOUNDS = NO + +# Set the SUBGROUPING tag to YES to allow class member groups of the same type +# (for instance a group of public functions) to be put as a subgroup of that +# type (e.g. under the Public Functions section). Set it to NO to prevent +# subgrouping. Alternatively, this can be done per class using the +# \nosubgrouping command. +# The default value is: YES. + +SUBGROUPING = YES + +# When the INLINE_GROUPED_CLASSES tag is set to YES, classes, structs and unions +# are shown inside the group in which they are included (e.g. 
using \ingroup) +# instead of on a separate page (for HTML and Man pages) or section (for LaTeX +# and RTF). +# +# Note that this feature does not work in combination with +# SEPARATE_MEMBER_PAGES. +# The default value is: NO. + +INLINE_GROUPED_CLASSES = NO + +# When the INLINE_SIMPLE_STRUCTS tag is set to YES, structs, classes, and unions +# with only public data fields or simple typedef fields will be shown inline in +# the documentation of the scope in which they are defined (i.e. file, +# namespace, or group documentation), provided this scope is documented. If set +# to NO, structs, classes, and unions are shown on a separate page (for HTML and +# Man pages) or section (for LaTeX and RTF). +# The default value is: NO. + +INLINE_SIMPLE_STRUCTS = NO + +# When TYPEDEF_HIDES_STRUCT tag is enabled, a typedef of a struct, union, or +# enum is documented as struct, union, or enum with the name of the typedef. So +# typedef struct TypeS {} TypeT, will appear in the documentation as a struct +# with name TypeT. When disabled the typedef will appear as a member of a file, +# namespace, or class. And the struct will be named TypeS. This can typically be +# useful for C code in case the coding convention dictates that all compound +# types are typedef'ed and only the typedef is referenced, never the tag name. +# The default value is: NO. + +TYPEDEF_HIDES_STRUCT = NO + +# The size of the symbol lookup cache can be set using LOOKUP_CACHE_SIZE. This +# cache is used to resolve symbols given their name and scope. Since this can be +# an expensive process and often the same symbol appears multiple times in the +# code, doxygen keeps a cache of pre-resolved symbols. If the cache is too small +# doxygen will become slower. If the cache is too large, memory is wasted. The +# cache size is given by this formula: 2^(16+LOOKUP_CACHE_SIZE). The valid range +# is 0..9, the default is 0, corresponding to a cache size of 2^16=65536 +# symbols. At the end of a run doxygen will report the cache usage and suggest +# the optimal cache size from a speed point of view. +# Minimum value: 0, maximum value: 9, default value: 0. + +LOOKUP_CACHE_SIZE = 0 + +# The NUM_PROC_THREADS specifies the number threads doxygen is allowed to use +# during processing. When set to 0 doxygen will based this on the number of +# cores available in the system. You can set it explicitly to a value larger +# than 0 to get more control over the balance between CPU load and processing +# speed. At this moment only the input processing can be done using multiple +# threads. Since this is still an experimental feature the default is set to 1, +# which efficively disables parallel processing. Please report any issues you +# encounter. Generating dot graphs in parallel is controlled by the +# DOT_NUM_THREADS setting. +# Minimum value: 0, maximum value: 32, default value: 1. + +NUM_PROC_THREADS = 1 + +#--------------------------------------------------------------------------- +# Build related configuration options +#--------------------------------------------------------------------------- + +# If the EXTRACT_ALL tag is set to YES, doxygen will assume all entities in +# documentation are documented, even if no documentation was available. Private +# class members and static file members will be hidden unless the +# EXTRACT_PRIVATE respectively EXTRACT_STATIC tags are set to YES. +# Note: This will also disable the warnings about undocumented members that are +# normally produced when WARNINGS is set to YES. +# The default value is: NO. 
+ +EXTRACT_ALL = NO + +# If the EXTRACT_PRIVATE tag is set to YES, all private members of a class will +# be included in the documentation. +# The default value is: NO. + +EXTRACT_PRIVATE = NO + +# If the EXTRACT_PRIV_VIRTUAL tag is set to YES, documented private virtual +# methods of a class will be included in the documentation. +# The default value is: NO. + +EXTRACT_PRIV_VIRTUAL = NO + +# If the EXTRACT_PACKAGE tag is set to YES, all members with package or internal +# scope will be included in the documentation. +# The default value is: NO. + +EXTRACT_PACKAGE = NO + +# If the EXTRACT_STATIC tag is set to YES, all static members of a file will be +# included in the documentation. +# The default value is: NO. + +EXTRACT_STATIC = NO + +# If the EXTRACT_LOCAL_CLASSES tag is set to YES, classes (and structs) defined +# locally in source files will be included in the documentation. If set to NO, +# only classes defined in header files are included. Does not have any effect +# for Java sources. +# The default value is: YES. + +EXTRACT_LOCAL_CLASSES = NO + +# This flag is only useful for Objective-C code. If set to YES, local methods, +# which are defined in the implementation section but not in the interface are +# included in the documentation. If set to NO, only methods in the interface are +# included. +# The default value is: NO. + +EXTRACT_LOCAL_METHODS = NO + +# If this flag is set to YES, the members of anonymous namespaces will be +# extracted and appear in the documentation as a namespace called +# 'anonymous_namespace{file}', where file will be replaced with the base name of +# the file that contains the anonymous namespace. By default anonymous namespace +# are hidden. +# The default value is: NO. + +EXTRACT_ANON_NSPACES = NO + +# If the HIDE_UNDOC_MEMBERS tag is set to YES, doxygen will hide all +# undocumented members inside documented classes or files. If set to NO these +# members will be included in the various overviews, but no documentation +# section is generated. This option has no effect if EXTRACT_ALL is enabled. +# The default value is: NO. + +HIDE_UNDOC_MEMBERS = NO + +# If the HIDE_UNDOC_CLASSES tag is set to YES, doxygen will hide all +# undocumented classes that are normally visible in the class hierarchy. If set +# to NO, these classes will be included in the various overviews. This option +# has no effect if EXTRACT_ALL is enabled. +# The default value is: NO. + +HIDE_UNDOC_CLASSES = NO + +# If the HIDE_FRIEND_COMPOUNDS tag is set to YES, doxygen will hide all friend +# declarations. If set to NO, these declarations will be included in the +# documentation. +# The default value is: NO. + +HIDE_FRIEND_COMPOUNDS = NO + +# If the HIDE_IN_BODY_DOCS tag is set to YES, doxygen will hide any +# documentation blocks found inside the body of a function. If set to NO, these +# blocks will be appended to the function's detailed documentation block. +# The default value is: NO. + +HIDE_IN_BODY_DOCS = NO + +# The INTERNAL_DOCS tag determines if documentation that is typed after a +# \internal command is included. If the tag is set to NO then the documentation +# will be excluded. Set it to YES to include the internal documentation. +# The default value is: NO. + +INTERNAL_DOCS = NO + +# If the CASE_SENSE_NAMES tag is set to NO then doxygen will only generate file +# names in lower-case letters. If set to YES, upper-case letters are also +# allowed. 
This is useful if you have classes or files whose names only differ +# in case and if your file system supports case sensitive file names. Windows +# (including Cygwin) and Mac users are advised to set this option to NO. +# The default value is: system dependent. + +CASE_SENSE_NAMES = NO + +# If the HIDE_SCOPE_NAMES tag is set to NO then doxygen will show members with +# their full class and namespace scopes in the documentation. If set to YES, the +# scope will be hidden. +# The default value is: NO. + +HIDE_SCOPE_NAMES = NO + +# If the HIDE_COMPOUND_REFERENCE tag is set to NO (default) then doxygen will +# append additional text to a page's title, such as Class Reference. If set to +# YES the compound reference will be hidden. +# The default value is: NO. + +HIDE_COMPOUND_REFERENCE= NO + +# If the SHOW_INCLUDE_FILES tag is set to YES then doxygen will put a list of +# the files that are included by a file in the documentation of that file. +# The default value is: YES. + +SHOW_INCLUDE_FILES = YES + +# If the SHOW_GROUPED_MEMB_INC tag is set to YES then Doxygen will add for each +# grouped member an include statement to the documentation, telling the reader +# which file to include in order to use the member. +# The default value is: NO. + +SHOW_GROUPED_MEMB_INC = NO + +# If the FORCE_LOCAL_INCLUDES tag is set to YES then doxygen will list include +# files with double quotes in the documentation rather than with sharp brackets. +# The default value is: NO. + +FORCE_LOCAL_INCLUDES = NO + +# If the INLINE_INFO tag is set to YES then a tag [inline] is inserted in the +# documentation for inline members. +# The default value is: YES. + +INLINE_INFO = YES + +# If the SORT_MEMBER_DOCS tag is set to YES then doxygen will sort the +# (detailed) documentation of file and class members alphabetically by member +# name. If set to NO, the members will appear in declaration order. +# The default value is: YES. + +SORT_MEMBER_DOCS = YES + +# If the SORT_BRIEF_DOCS tag is set to YES then doxygen will sort the brief +# descriptions of file, namespace and class members alphabetically by member +# name. If set to NO, the members will appear in declaration order. Note that +# this will also influence the order of the classes in the class list. +# The default value is: NO. + +SORT_BRIEF_DOCS = NO + +# If the SORT_MEMBERS_CTORS_1ST tag is set to YES then doxygen will sort the +# (brief and detailed) documentation of class members so that constructors and +# destructors are listed first. If set to NO the constructors will appear in the +# respective orders defined by SORT_BRIEF_DOCS and SORT_MEMBER_DOCS. +# Note: If SORT_BRIEF_DOCS is set to NO this option is ignored for sorting brief +# member documentation. +# Note: If SORT_MEMBER_DOCS is set to NO this option is ignored for sorting +# detailed member documentation. +# The default value is: NO. + +SORT_MEMBERS_CTORS_1ST = NO + +# If the SORT_GROUP_NAMES tag is set to YES then doxygen will sort the hierarchy +# of group names into alphabetical order. If set to NO the group names will +# appear in their defined order. +# The default value is: NO. + +SORT_GROUP_NAMES = YES + +# If the SORT_BY_SCOPE_NAME tag is set to YES, the class list will be sorted by +# fully-qualified names, including namespaces. If set to NO, the class list will +# be sorted only by class name, not including the namespace part. +# Note: This option is not very useful if HIDE_SCOPE_NAMES is set to YES. +# Note: This option applies only to the class list, not to the alphabetical +# list. 
+# The default value is: NO. + +SORT_BY_SCOPE_NAME = NO + +# If the STRICT_PROTO_MATCHING option is enabled and doxygen fails to do proper +# type resolution of all parameters of a function it will reject a match between +# the prototype and the implementation of a member function even if there is +# only one candidate or it is obvious which candidate to choose by doing a +# simple string match. By disabling STRICT_PROTO_MATCHING doxygen will still +# accept a match between prototype and implementation in such cases. +# The default value is: NO. + +STRICT_PROTO_MATCHING = NO + +# The GENERATE_TODOLIST tag can be used to enable (YES) or disable (NO) the todo +# list. This list is created by putting \todo commands in the documentation. +# The default value is: YES. + +GENERATE_TODOLIST = YES + +# The GENERATE_TESTLIST tag can be used to enable (YES) or disable (NO) the test +# list. This list is created by putting \test commands in the documentation. +# The default value is: YES. + +GENERATE_TESTLIST = YES + +# The GENERATE_BUGLIST tag can be used to enable (YES) or disable (NO) the bug +# list. This list is created by putting \bug commands in the documentation. +# The default value is: YES. + +GENERATE_BUGLIST = YES + +# The GENERATE_DEPRECATEDLIST tag can be used to enable (YES) or disable (NO) +# the deprecated list. This list is created by putting \deprecated commands in +# the documentation. +# The default value is: YES. + +GENERATE_DEPRECATEDLIST= YES + +# The ENABLED_SECTIONS tag can be used to enable conditional documentation +# sections, marked by \if ... \endif and \cond +# ... \endcond blocks. + +ENABLED_SECTIONS = + +# The MAX_INITIALIZER_LINES tag determines the maximum number of lines that the +# initial value of a variable or macro / define can have for it to appear in the +# documentation. If the initializer consists of more lines than specified here +# it will be hidden. Use a value of 0 to hide initializers completely. The +# appearance of the value of individual variables and macros / defines can be +# controlled using \showinitializer or \hideinitializer command in the +# documentation regardless of this setting. +# Minimum value: 0, maximum value: 10000, default value: 30. + +MAX_INITIALIZER_LINES = 10000 + +# Set the SHOW_USED_FILES tag to NO to disable the list of files generated at +# the bottom of the documentation of classes and structs. If set to YES, the +# list will mention the files that were used to generate the documentation. +# The default value is: YES. + +SHOW_USED_FILES = YES + +# Set the SHOW_FILES tag to NO to disable the generation of the Files page. This +# will remove the Files entry from the Quick Index and from the Folder Tree View +# (if specified). +# The default value is: YES. + +SHOW_FILES = YES + +# Set the SHOW_NAMESPACES tag to NO to disable the generation of the Namespaces +# page. This will remove the Namespaces entry from the Quick Index and from the +# Folder Tree View (if specified). +# The default value is: YES. + +SHOW_NAMESPACES = YES + +# The FILE_VERSION_FILTER tag can be used to specify a program or script that +# doxygen should invoke to get the current version for each file (typically from +# the version control system). Doxygen will invoke the program by executing (via +# popen()) the command command input-file, where command is the value of the +# FILE_VERSION_FILTER tag, and input-file is the name of an input file provided +# by doxygen. Whatever the program writes to standard output is used as the file +# version. 
For an example see the documentation. + +FILE_VERSION_FILTER = + +# The LAYOUT_FILE tag can be used to specify a layout file which will be parsed +# by doxygen. The layout file controls the global structure of the generated +# output files in an output format independent way. To create the layout file +# that represents doxygen's defaults, run doxygen with the -l option. You can +# optionally specify a file name after the option, if omitted DoxygenLayout.xml +# will be used as the name of the layout file. +# +# Note that if you run doxygen from a directory containing a file called +# DoxygenLayout.xml, doxygen will parse it automatically even if the LAYOUT_FILE +# tag is left empty. + +LAYOUT_FILE = DoxygenLayout.xml + +# The CITE_BIB_FILES tag can be used to specify one or more bib files containing +# the reference definitions. This must be a list of .bib files. The .bib +# extension is automatically appended if omitted. This requires the bibtex tool +# to be installed. See also https://en.wikipedia.org/wiki/BibTeX for more info. +# For LaTeX the style of the bibliography can be controlled using +# LATEX_BIB_STYLE. To use this feature you need bibtex and perl available in the +# search path. See also \cite for info how to create references. + +CITE_BIB_FILES = + +#--------------------------------------------------------------------------- +# Configuration options related to warning and progress messages +#--------------------------------------------------------------------------- + +# The QUIET tag can be used to turn on/off the messages that are generated to +# standard output by doxygen. If QUIET is set to YES this implies that the +# messages are off. +# The default value is: NO. + +QUIET = NO + +# The WARNINGS tag can be used to turn on/off the warning messages that are +# generated to standard error (stderr) by doxygen. If WARNINGS is set to YES +# this implies that the warnings are on. +# +# Tip: Turn warnings on while writing the documentation. +# The default value is: YES. + +WARNINGS = YES + +# If the WARN_IF_UNDOCUMENTED tag is set to YES then doxygen will generate +# warnings for undocumented members. If EXTRACT_ALL is set to YES then this flag +# will automatically be disabled. +# The default value is: YES. + +WARN_IF_UNDOCUMENTED = YES + +# If the WARN_IF_DOC_ERROR tag is set to YES, doxygen will generate warnings for +# potential errors in the documentation, such as not documenting some parameters +# in a documented function, or documenting parameters that don't exist or using +# markup commands wrongly. +# The default value is: YES. + +WARN_IF_DOC_ERROR = YES + +# This WARN_NO_PARAMDOC option can be enabled to get warnings for functions that +# are documented, but have no documentation for their parameters or return +# value. If set to NO, doxygen will only warn about wrong or incomplete +# parameter documentation, but not about the absence of documentation. If +# EXTRACT_ALL is set to YES then this flag will automatically be disabled. +# The default value is: NO. + +WARN_NO_PARAMDOC = NO + +# If the WARN_AS_ERROR tag is set to YES then doxygen will immediately stop when +# a warning is encountered. +# The default value is: NO. + +WARN_AS_ERROR = NO + +# The WARN_FORMAT tag determines the format of the warning messages that doxygen +# can produce. The string should contain the $file, $line, and $text tags, which +# will be replaced by the file and line number from which the warning originated +# and the warning text. 
Optionally the format may contain $version, which will +# be replaced by the version of the file (if it could be obtained via +# FILE_VERSION_FILTER) +# The default value is: $file:$line: $text. + +WARN_FORMAT = "$file:$line: $text" + +# The WARN_LOGFILE tag can be used to specify a file to which warning and error +# messages should be written. If left blank the output is written to standard +# error (stderr). + +WARN_LOGFILE = + +#--------------------------------------------------------------------------- +# Configuration options related to the input files +#--------------------------------------------------------------------------- + +# The INPUT tag is used to specify the files and/or directories that contain +# documented source files. You may enter file names like myfile.cpp or +# directories like /usr/src/myproject. Separate the files or directories with +# spaces. See also FILE_PATTERNS and EXTENSION_MAPPING +# Note: If this tag is empty the current directory is searched. + +INPUT = ../../README.md \ + ../../alg \ + ../../core \ + ../../data \ + ../../io \ + ../../python + +# This tag can be used to specify the character encoding of the source files +# that doxygen parses. Internally doxygen uses the UTF-8 encoding. Doxygen uses +# libiconv (or the iconv built into libc) for the transcoding. See the libiconv +# documentation (see: https://www.gnu.org/software/libiconv/) for the list of +# possible encodings. +# The default value is: UTF-8. + +INPUT_ENCODING = UTF-8 + +# If the value of the INPUT tag contains directories, you can use the +# FILE_PATTERNS tag to specify one or more wildcard patterns (like *.cpp and +# *.h) to filter out the source-files in the directories. +# +# Note that for custom extensions or not directly supported extensions you also +# need to set EXTENSION_MAPPING for the extension otherwise the files are not +# read by doxygen. +# +# If left blank the following patterns are tested:*.c, *.cc, *.cxx, *.cpp, +# *.c++, *.java, *.ii, *.ixx, *.ipp, *.i++, *.inl, *.idl, *.ddl, *.odl, *.h, +# *.hh, *.hxx, *.hpp, *.h++, *.cs, *.d, *.php, *.php4, *.php5, *.phtml, *.inc, +# *.m, *.markdown, *.md, *.mm, *.dox (to be provided as doxygen C comment), +# *.doc (to be provided as doxygen C comment), *.txt (to be provided as doxygen +# C comment), *.py, *.pyw, *.f90, *.f95, *.f03, *.f08, *.f18, *.f, *.for, *.vhd, +# *.vhdl, *.ucf, *.qsf and *.ice. + +FILE_PATTERNS = *.h \ + *.py + +# The RECURSIVE tag can be used to specify whether or not subdirectories should +# be searched for input files as well. +# The default value is: NO. + +RECURSIVE = YES + +# The EXCLUDE tag can be used to specify files and/or directories that should be +# excluded from the INPUT source files. This way you can easily exclude a +# subdirectory from a directory tree whose root is specified with the INPUT tag. +# +# Note that relative paths are relative to the directory from which doxygen is +# run. + +EXCLUDE = ../../alg/teca_deeplab_ar_detect_internals.py \ + parse_xml.py + +# The EXCLUDE_SYMLINKS tag can be used to select whether or not files or +# directories that are symbolic links (a Unix file system feature) are excluded +# from the input. +# The default value is: NO. + +EXCLUDE_SYMLINKS = NO + +# If the value of the INPUT tag contains directories, you can use the +# EXCLUDE_PATTERNS tag to specify one or more wildcard patterns to exclude +# certain files from those directories. 
+# +# Note that the wildcards are matched against the file with absolute path, so to +# exclude all test directories for example use the pattern */test/* + +EXCLUDE_PATTERNS = + +# The EXCLUDE_SYMBOLS tag can be used to specify one or more symbol names +# (namespaces, classes, functions, etc.) that should be excluded from the +# output. The symbol name can be a fully qualified name, a word, or if the +# wildcard * is used, a substring. Examples: ANamespace, AClass, +# AClass::ANamespace, ANamespace::*Test +# +# Note that the wildcards are matched against the file with absolute path, so to +# exclude all test directories use the pattern */test/* + +EXCLUDE_SYMBOLS = + +# The EXAMPLE_PATH tag can be used to specify one or more files or directories +# that contain example code fragments that are included (see the \include +# command). + +EXAMPLE_PATH = + +# If the value of the EXAMPLE_PATH tag contains directories, you can use the +# EXAMPLE_PATTERNS tag to specify one or more wildcard pattern (like *.cpp and +# *.h) to filter out the source-files in the directories. If left blank all +# files are included. + +EXAMPLE_PATTERNS = * + +# If the EXAMPLE_RECURSIVE tag is set to YES then subdirectories will be +# searched for input files to be used with the \include or \dontinclude commands +# irrespective of the value of the RECURSIVE tag. +# The default value is: NO. + +EXAMPLE_RECURSIVE = NO + +# The IMAGE_PATH tag can be used to specify one or more files or directories +# that contain images that are to be included in the documentation (see the +# \image command). + +IMAGE_PATH = ../../doc/rtd/images + +# The INPUT_FILTER tag can be used to specify a program that doxygen should +# invoke to filter for each input file. Doxygen will invoke the filter program +# by executing (via popen()) the command: +# +# +# +# where is the value of the INPUT_FILTER tag, and is the +# name of an input file. Doxygen will then use the output that the filter +# program writes to standard output. If FILTER_PATTERNS is specified, this tag +# will be ignored. +# +# Note that the filter must not add or remove lines; it is applied before the +# code is scanned, but not when the output code is generated. If lines are added +# or removed, the anchors will not be placed correctly. +# +# Note that for custom extensions or not directly supported extensions you also +# need to set EXTENSION_MAPPING for the extension otherwise the files are not +# properly processed by doxygen. + +INPUT_FILTER = + +# The FILTER_PATTERNS tag can be used to specify filters on a per file pattern +# basis. Doxygen will compare the file name with each pattern and apply the +# filter if there is a match. The filters are a list of the form: pattern=filter +# (like *.cpp=my_cpp_filter). See INPUT_FILTER for further information on how +# filters are used. If the FILTER_PATTERNS tag is empty or if none of the +# patterns match the file name, INPUT_FILTER is applied. +# +# Note that for custom extensions or not directly supported extensions you also +# need to set EXTENSION_MAPPING for the extension otherwise the files are not +# properly processed by doxygen. + +FILTER_PATTERNS = + +# If the FILTER_SOURCE_FILES tag is set to YES, the input filter (if set using +# INPUT_FILTER) will also be used to filter the input files that are used for +# producing the source files to browse (i.e. when SOURCE_BROWSER is set to YES). +# The default value is: NO. 
+ +FILTER_SOURCE_FILES = NO + +# The FILTER_SOURCE_PATTERNS tag can be used to specify source filters per file +# pattern. A pattern will override the setting for FILTER_PATTERN (if any) and +# it is also possible to disable source filtering for a specific pattern using +# *.ext= (so without naming a filter). +# This tag requires that the tag FILTER_SOURCE_FILES is set to YES. + +FILTER_SOURCE_PATTERNS = + +# If the USE_MDFILE_AS_MAINPAGE tag refers to the name of a markdown file that +# is part of the input, its contents will be placed on the main page +# (index.html). This can be useful if you have a project on for instance GitHub +# and want to reuse the introduction page also for the doxygen output. + +USE_MDFILE_AS_MAINPAGE = README.md + +#--------------------------------------------------------------------------- +# Configuration options related to source browsing +#--------------------------------------------------------------------------- + +# If the SOURCE_BROWSER tag is set to YES then a list of source files will be +# generated. Documented entities will be cross-referenced with these sources. +# +# Note: To get rid of all source code in the generated output, make sure that +# also VERBATIM_HEADERS is set to NO. +# The default value is: NO. + +SOURCE_BROWSER = NO + +# Setting the INLINE_SOURCES tag to YES will include the body of functions, +# classes and enums directly into the documentation. +# The default value is: NO. + +INLINE_SOURCES = NO + +# Setting the STRIP_CODE_COMMENTS tag to YES will instruct doxygen to hide any +# special comment blocks from generated source code fragments. Normal C, C++ and +# Fortran comments will always remain visible. +# The default value is: YES. + +STRIP_CODE_COMMENTS = NO + +# If the REFERENCED_BY_RELATION tag is set to YES then for each documented +# entity all documented functions referencing it will be listed. +# The default value is: NO. + +REFERENCED_BY_RELATION = NO + +# If the REFERENCES_RELATION tag is set to YES then for each documented function +# all documented entities called/used by that function will be listed. +# The default value is: NO. + +REFERENCES_RELATION = NO + +# If the REFERENCES_LINK_SOURCE tag is set to YES and SOURCE_BROWSER tag is set +# to YES then the hyperlinks from functions in REFERENCES_RELATION and +# REFERENCED_BY_RELATION lists will link to the source code. Otherwise they will +# link to the documentation. +# The default value is: YES. + +REFERENCES_LINK_SOURCE = YES + +# If SOURCE_TOOLTIPS is enabled (the default) then hovering a hyperlink in the +# source code will show a tooltip with additional information such as prototype, +# brief description and links to the definition and documentation. Since this +# will make the HTML file larger and loading of large files a bit slower, you +# can opt to disable this feature. +# The default value is: YES. +# This tag requires that the tag SOURCE_BROWSER is set to YES. + +SOURCE_TOOLTIPS = YES + +# If the USE_HTAGS tag is set to YES then the references to source code will +# point to the HTML generated by the htags(1) tool instead of doxygen built-in +# source browser. The htags tool is part of GNU's global source tagging system +# (see https://www.gnu.org/software/global/global.html). You will need version +# 4.8.6 or higher. 
+# +# To use it do the following: +# - Install the latest version of global +# - Enable SOURCE_BROWSER and USE_HTAGS in the configuration file +# - Make sure the INPUT points to the root of the source tree +# - Run doxygen as normal +# +# Doxygen will invoke htags (and that will in turn invoke gtags), so these +# tools must be available from the command line (i.e. in the search path). +# +# The result: instead of the source browser generated by doxygen, the links to +# source code will now point to the output of htags. +# The default value is: NO. +# This tag requires that the tag SOURCE_BROWSER is set to YES. + +USE_HTAGS = NO + +# If the VERBATIM_HEADERS tag is set the YES then doxygen will generate a +# verbatim copy of the header file for each class for which an include is +# specified. Set to NO to disable this. +# See also: Section \class. +# The default value is: YES. + +VERBATIM_HEADERS = YES + +#--------------------------------------------------------------------------- +# Configuration options related to the alphabetical class index +#--------------------------------------------------------------------------- + +# If the ALPHABETICAL_INDEX tag is set to YES, an alphabetical index of all +# compounds will be generated. Enable this if the project contains a lot of +# classes, structs, unions or interfaces. +# The default value is: YES. + +ALPHABETICAL_INDEX = YES + +# The COLS_IN_ALPHA_INDEX tag can be used to specify the number of columns in +# which the alphabetical index list will be split. +# Minimum value: 1, maximum value: 20, default value: 5. +# This tag requires that the tag ALPHABETICAL_INDEX is set to YES. + +COLS_IN_ALPHA_INDEX = 5 + +# In case all classes in a project start with a common prefix, all classes will +# be put under the same header in the alphabetical index. The IGNORE_PREFIX tag +# can be used to specify a prefix (or a list of prefixes) that should be ignored +# while generating the index headers. +# This tag requires that the tag ALPHABETICAL_INDEX is set to YES. + +IGNORE_PREFIX = + +#--------------------------------------------------------------------------- +# Configuration options related to the HTML output +#--------------------------------------------------------------------------- + +# If the GENERATE_HTML tag is set to YES, doxygen will generate HTML output +# The default value is: YES. + +GENERATE_HTML = YES + +# The HTML_OUTPUT tag is used to specify where the HTML docs will be put. If a +# relative path is entered the value of OUTPUT_DIRECTORY will be put in front of +# it. +# The default directory is: html. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_OUTPUT = html/doxygen + +# The HTML_FILE_EXTENSION tag can be used to specify the file extension for each +# generated HTML page (for example: .htm, .php, .asp). +# The default value is: .html. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_FILE_EXTENSION = .html + +# The HTML_HEADER tag can be used to specify a user-defined HTML header file for +# each generated HTML page. If the tag is left blank doxygen will generate a +# standard header. +# +# To get valid HTML the header file that includes any scripts and style sheets +# that doxygen needs, which is dependent on the configuration options used (e.g. +# the setting GENERATE_TREEVIEW). It is highly recommended to start with a +# default header using +# doxygen -w html new_header.html new_footer.html new_stylesheet.css +# YourConfigFile +# and then modify the file new_header.html. 
See also section "Doxygen usage" +# for information on how to generate the default header that doxygen normally +# uses. +# Note: The header is subject to change so you typically have to regenerate the +# default header when upgrading to a newer version of doxygen. For a description +# of the possible markers and block names see the documentation. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_HEADER = + +# The HTML_FOOTER tag can be used to specify a user-defined HTML footer for each +# generated HTML page. If the tag is left blank doxygen will generate a standard +# footer. See HTML_HEADER for more information on how to generate a default +# footer and what special commands can be used inside the footer. See also +# section "Doxygen usage" for information on how to generate the default footer +# that doxygen normally uses. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_FOOTER = + +# The HTML_STYLESHEET tag can be used to specify a user-defined cascading style +# sheet that is used by each HTML page. It can be used to fine-tune the look of +# the HTML output. If left blank doxygen will generate a default style sheet. +# See also section "Doxygen usage" for information on how to generate the style +# sheet that doxygen normally uses. +# Note: It is recommended to use HTML_EXTRA_STYLESHEET instead of this tag, as +# it is more robust and this tag (HTML_STYLESHEET) will in the future become +# obsolete. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_STYLESHEET = + +# The HTML_EXTRA_STYLESHEET tag can be used to specify additional user-defined +# cascading style sheets that are included after the standard style sheets +# created by doxygen. Using this option one can overrule certain style aspects. +# This is preferred over using HTML_STYLESHEET since it does not replace the +# standard style sheet and is therefore more robust against future updates. +# Doxygen will copy the style sheet files to the output directory. +# Note: The order of the extra style sheet files is of importance (e.g. the last +# style sheet in the list overrules the setting of the previous ones in the +# list). For an example see the documentation. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_EXTRA_STYLESHEET = + +# The HTML_EXTRA_FILES tag can be used to specify one or more extra images or +# other source files which should be copied to the HTML output directory. Note +# that these files will be copied to the base HTML output directory. Use the +# $relpath^ marker in the HTML_HEADER and/or HTML_FOOTER files to load these +# files. In the HTML_STYLESHEET file, use the file name only. Also note that the +# files will be copied as-is; there are no commands or markers available. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_EXTRA_FILES = + +# The HTML_COLORSTYLE_HUE tag controls the color of the HTML output. Doxygen +# will adjust the colors in the style sheet and background images according to +# this color. Hue is specified as an angle on a colorwheel, see +# https://en.wikipedia.org/wiki/Hue for more information. For instance the value +# 0 represents red, 60 is yellow, 120 is green, 180 is cyan, 240 is blue, 300 +# purple, and 360 is red again. +# Minimum value: 0, maximum value: 359, default value: 220. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_COLORSTYLE_HUE = 220 + +# The HTML_COLORSTYLE_SAT tag controls the purity (or saturation) of the colors +# in the HTML output. 
For a value of 0 the output will use grayscales only. A +# value of 255 will produce the most vivid colors. +# Minimum value: 0, maximum value: 255, default value: 100. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_COLORSTYLE_SAT = 100 + +# The HTML_COLORSTYLE_GAMMA tag controls the gamma correction applied to the +# luminance component of the colors in the HTML output. Values below 100 +# gradually make the output lighter, whereas values above 100 make the output +# darker. The value divided by 100 is the actual gamma applied, so 80 represents +# a gamma of 0.8, The value 220 represents a gamma of 2.2, and 100 does not +# change the gamma. +# Minimum value: 40, maximum value: 240, default value: 80. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_COLORSTYLE_GAMMA = 80 + +# If the HTML_TIMESTAMP tag is set to YES then the footer of each generated HTML +# page will contain the date and time when the page was generated. Setting this +# to YES can help to show when doxygen was last run and thus if the +# documentation is up to date. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_TIMESTAMP = YES + +# If the HTML_DYNAMIC_MENUS tag is set to YES then the generated HTML +# documentation will contain a main index with vertical navigation menus that +# are dynamically created via JavaScript. If disabled, the navigation index will +# consists of multiple levels of tabs that are statically embedded in every HTML +# page. Disable this option to support browsers that do not have JavaScript, +# like the Qt help browser. +# The default value is: YES. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_DYNAMIC_MENUS = YES + +# If the HTML_DYNAMIC_SECTIONS tag is set to YES then the generated HTML +# documentation will contain sections that can be hidden and shown after the +# page has loaded. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_DYNAMIC_SECTIONS = NO + +# With HTML_INDEX_NUM_ENTRIES one can control the preferred number of entries +# shown in the various tree structured indices initially; the user can expand +# and collapse entries dynamically later on. Doxygen will expand the tree to +# such a level that at most the specified number of entries are visible (unless +# a fully collapsed tree already exceeds this amount). So setting the number of +# entries 1 will produce a full collapsed tree by default. 0 is a special value +# representing an infinite number of entries and will result in a full expanded +# tree by default. +# Minimum value: 0, maximum value: 9999, default value: 100. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_INDEX_NUM_ENTRIES = 100 + +# If the GENERATE_DOCSET tag is set to YES, additional index files will be +# generated that can be used as input for Apple's Xcode 3 integrated development +# environment (see: https://developer.apple.com/xcode/), introduced with OSX +# 10.5 (Leopard). To create a documentation set, doxygen will generate a +# Makefile in the HTML output directory. Running make will produce the docset in +# that directory and running make install will install the docset in +# ~/Library/Developer/Shared/Documentation/DocSets so that Xcode will find it at +# startup. See https://developer.apple.com/library/archive/featuredarticles/Doxy +# genXcode/_index.html for more information. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. 
+ +GENERATE_DOCSET = NO + +# This tag determines the name of the docset feed. A documentation feed provides +# an umbrella under which multiple documentation sets from a single provider +# (such as a company or product suite) can be grouped. +# The default value is: Doxygen generated docs. +# This tag requires that the tag GENERATE_DOCSET is set to YES. + +DOCSET_FEEDNAME = "Doxygen generated docs" + +# This tag specifies a string that should uniquely identify the documentation +# set bundle. This should be a reverse domain-name style string, e.g. +# com.mycompany.MyDocSet. Doxygen will append .docset to the name. +# The default value is: org.doxygen.Project. +# This tag requires that the tag GENERATE_DOCSET is set to YES. + +DOCSET_BUNDLE_ID = org.doxygen.Project + +# The DOCSET_PUBLISHER_ID tag specifies a string that should uniquely identify +# the documentation publisher. This should be a reverse domain-name style +# string, e.g. com.mycompany.MyDocSet.documentation. +# The default value is: org.doxygen.Publisher. +# This tag requires that the tag GENERATE_DOCSET is set to YES. + +DOCSET_PUBLISHER_ID = org.doxygen.Publisher + +# The DOCSET_PUBLISHER_NAME tag identifies the documentation publisher. +# The default value is: Publisher. +# This tag requires that the tag GENERATE_DOCSET is set to YES. + +DOCSET_PUBLISHER_NAME = Publisher + +# If the GENERATE_HTMLHELP tag is set to YES then doxygen generates three +# additional HTML index files: index.hhp, index.hhc, and index.hhk. The +# index.hhp is a project file that can be read by Microsoft's HTML Help Workshop +# (see: https://www.microsoft.com/en-us/download/details.aspx?id=21138) on +# Windows. +# +# The HTML Help Workshop contains a compiler that can convert all HTML output +# generated by doxygen into a single compiled HTML file (.chm). Compiled HTML +# files are now used as the Windows 98 help format, and will replace the old +# Windows help format (.hlp) on all Windows platforms in the future. Compressed +# HTML files also contain an index, a table of contents, and you can search for +# words in the documentation. The HTML workshop also contains a viewer for +# compressed HTML files. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +GENERATE_HTMLHELP = NO + +# The CHM_FILE tag can be used to specify the file name of the resulting .chm +# file. You can add a path in front of the file if the result should not be +# written to the html output directory. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +CHM_FILE = + +# The HHC_LOCATION tag can be used to specify the location (absolute path +# including file name) of the HTML help compiler (hhc.exe). If non-empty, +# doxygen will try to run the HTML help compiler on the generated index.hhp. +# The file has to be specified with full path. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +HHC_LOCATION = + +# The GENERATE_CHI flag controls if a separate .chi index file is generated +# (YES) or that it should be included in the main .chm file (NO). +# The default value is: NO. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +GENERATE_CHI = NO + +# The CHM_INDEX_ENCODING is used to encode HtmlHelp index (hhk), content (hhc) +# and project file content. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +CHM_INDEX_ENCODING = + +# The BINARY_TOC flag controls whether a binary table of contents is generated +# (YES) or a normal table of contents (NO) in the .chm file. 
Furthermore it +# enables the Previous and Next buttons. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +BINARY_TOC = NO + +# The TOC_EXPAND flag can be set to YES to add extra items for group members to +# the table of contents of the HTML help documentation and to the tree view. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTMLHELP is set to YES. + +TOC_EXPAND = NO + +# If the GENERATE_QHP tag is set to YES and both QHP_NAMESPACE and +# QHP_VIRTUAL_FOLDER are set, an additional index file will be generated that +# can be used as input for Qt's qhelpgenerator to generate a Qt Compressed Help +# (.qch) of the generated HTML documentation. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +GENERATE_QHP = NO + +# If the QHG_LOCATION tag is specified, the QCH_FILE tag can be used to specify +# the file name of the resulting .qch file. The path specified is relative to +# the HTML output folder. +# This tag requires that the tag GENERATE_QHP is set to YES. + +QCH_FILE = + +# The QHP_NAMESPACE tag specifies the namespace to use when generating Qt Help +# Project output. For more information please see Qt Help Project / Namespace +# (see: https://doc.qt.io/archives/qt-4.8/qthelpproject.html#namespace). +# The default value is: org.doxygen.Project. +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHP_NAMESPACE = org.doxygen.Project + +# The QHP_VIRTUAL_FOLDER tag specifies the namespace to use when generating Qt +# Help Project output. For more information please see Qt Help Project / Virtual +# Folders (see: https://doc.qt.io/archives/qt-4.8/qthelpproject.html#virtual- +# folders). +# The default value is: doc. +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHP_VIRTUAL_FOLDER = doc + +# If the QHP_CUST_FILTER_NAME tag is set, it specifies the name of a custom +# filter to add. For more information please see Qt Help Project / Custom +# Filters (see: https://doc.qt.io/archives/qt-4.8/qthelpproject.html#custom- +# filters). +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHP_CUST_FILTER_NAME = + +# The QHP_CUST_FILTER_ATTRS tag specifies the list of the attributes of the +# custom filter to add. For more information please see Qt Help Project / Custom +# Filters (see: https://doc.qt.io/archives/qt-4.8/qthelpproject.html#custom- +# filters). +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHP_CUST_FILTER_ATTRS = + +# The QHP_SECT_FILTER_ATTRS tag specifies the list of the attributes this +# project's filter section matches. Qt Help Project / Filter Attributes (see: +# https://doc.qt.io/archives/qt-4.8/qthelpproject.html#filter-attributes). +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHP_SECT_FILTER_ATTRS = + +# The QHG_LOCATION tag can be used to specify the location of Qt's +# qhelpgenerator. If non-empty doxygen will try to run qhelpgenerator on the +# generated .qhp file. +# This tag requires that the tag GENERATE_QHP is set to YES. + +QHG_LOCATION = + +# If the GENERATE_ECLIPSEHELP tag is set to YES, additional index files will be +# generated, together with the HTML files, they form an Eclipse help plugin. To +# install this plugin and make it available under the help contents menu in +# Eclipse, the contents of the directory containing the HTML and XML files needs +# to be copied into the plugins directory of eclipse. 
The name of the directory +# within the plugins directory should be the same as the ECLIPSE_DOC_ID value. +# After copying Eclipse needs to be restarted before the help appears. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +GENERATE_ECLIPSEHELP = NO + +# A unique identifier for the Eclipse help plugin. When installing the plugin +# the directory name containing the HTML and XML files should also have this +# name. Each documentation set should have its own identifier. +# The default value is: org.doxygen.Project. +# This tag requires that the tag GENERATE_ECLIPSEHELP is set to YES. + +ECLIPSE_DOC_ID = org.doxygen.Project + +# If you want full control over the layout of the generated HTML pages it might +# be necessary to disable the index and replace it with your own. The +# DISABLE_INDEX tag can be used to turn on/off the condensed index (tabs) at top +# of each HTML page. A value of NO enables the index and the value YES disables +# it. Since the tabs in the index contain the same information as the navigation +# tree, you can set this option to YES if you also set GENERATE_TREEVIEW to YES. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +DISABLE_INDEX = NO + +# The GENERATE_TREEVIEW tag is used to specify whether a tree-like index +# structure should be generated to display hierarchical information. If the tag +# value is set to YES, a side panel will be generated containing a tree-like +# index structure (just like the one that is generated for HTML Help). For this +# to work a browser that supports JavaScript, DHTML, CSS and frames is required +# (i.e. any modern browser). Windows users are probably better off using the +# HTML help feature. Via custom style sheets (see HTML_EXTRA_STYLESHEET) one can +# further fine-tune the look of the index. As an example, the default style +# sheet generated by doxygen has an example that shows how to put an image at +# the root of the tree instead of the PROJECT_NAME. Since the tree basically has +# the same information as the tab index, you could consider setting +# DISABLE_INDEX to YES when enabling this option. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +GENERATE_TREEVIEW = YES + +# The ENUM_VALUES_PER_LINE tag can be used to set the number of enum values that +# doxygen will group on one line in the generated HTML documentation. +# +# Note that a value of 0 will completely suppress the enum values from appearing +# in the overview section. +# Minimum value: 0, maximum value: 20, default value: 4. +# This tag requires that the tag GENERATE_HTML is set to YES. + +ENUM_VALUES_PER_LINE = 4 + +# If the treeview is enabled (see GENERATE_TREEVIEW) then this tag can be used +# to set the initial width (in pixels) of the frame in which the tree is shown. +# Minimum value: 0, maximum value: 1500, default value: 250. +# This tag requires that the tag GENERATE_HTML is set to YES. + +TREEVIEW_WIDTH = 200 + +# If the EXT_LINKS_IN_WINDOW option is set to YES, doxygen will open links to +# external symbols imported via tag files in a separate window. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +EXT_LINKS_IN_WINDOW = NO + +# If the HTML_FORMULA_FORMAT option is set to svg, doxygen will use the pdf2svg +# tool (see https://github.com/dawbarton/pdf2svg) or inkscape (see +# https://inkscape.org) to generate formulas as SVG images instead of PNGs for +# the HTML output. 
These images will generally look nicer at scaled resolutions. +# Possible values are: png (the default) and svg (looks nicer but requires the +# pdf2svg or inkscape tool). +# The default value is: png. +# This tag requires that the tag GENERATE_HTML is set to YES. + +HTML_FORMULA_FORMAT = png + +# Use this tag to change the font size of LaTeX formulas included as images in +# the HTML documentation. When you change the font size after a successful +# doxygen run you need to manually remove any form_*.png images from the HTML +# output directory to force them to be regenerated. +# Minimum value: 8, maximum value: 50, default value: 10. +# This tag requires that the tag GENERATE_HTML is set to YES. + +FORMULA_FONTSIZE = 10 + +# Use the FORMULA_TRANSPARENT tag to determine whether or not the images +# generated for formulas are transparent PNGs. Transparent PNGs are not +# supported properly for IE 6.0, but are supported on all modern browsers. +# +# Note that when changing this option you need to delete any form_*.png files in +# the HTML output directory before the changes have effect. +# The default value is: YES. +# This tag requires that the tag GENERATE_HTML is set to YES. + +FORMULA_TRANSPARENT = YES + +# The FORMULA_MACROFILE can contain LaTeX \newcommand and \renewcommand commands +# to create new LaTeX commands to be used in formulas as building blocks. See +# the section "Including formulas" for details. + +FORMULA_MACROFILE = + +# Enable the USE_MATHJAX option to render LaTeX formulas using MathJax (see +# https://www.mathjax.org) which uses client side JavaScript for the rendering +# instead of using pre-rendered bitmaps. Use this if you do not have LaTeX +# installed or if you want to formulas look prettier in the HTML output. When +# enabled you may also need to install MathJax separately and configure the path +# to it using the MATHJAX_RELPATH option. +# The default value is: NO. +# This tag requires that the tag GENERATE_HTML is set to YES. + +USE_MATHJAX = YES + +# When MathJax is enabled you can set the default output format to be used for +# the MathJax output. See the MathJax site (see: +# http://docs.mathjax.org/en/latest/output.html) for more details. +# Possible values are: HTML-CSS (which is slower, but has the best +# compatibility), NativeMML (i.e. MathML) and SVG. +# The default value is: HTML-CSS. +# This tag requires that the tag USE_MATHJAX is set to YES. + +MATHJAX_FORMAT = HTML-CSS + +# When MathJax is enabled you need to specify the location relative to the HTML +# output directory using the MATHJAX_RELPATH option. The destination directory +# should contain the MathJax.js script. For instance, if the mathjax directory +# is located at the same level as the HTML output directory, then +# MATHJAX_RELPATH should be ../mathjax. The default value points to the MathJax +# Content Delivery Network so you can quickly see the result without installing +# MathJax. However, it is strongly recommended to install a local copy of +# MathJax from https://www.mathjax.org before deployment. +# The default value is: https://cdn.jsdelivr.net/npm/mathjax@2. +# This tag requires that the tag USE_MATHJAX is set to YES. + +MATHJAX_RELPATH = https://cdn.jsdelivr.net/npm/mathjax@2 + +# The MATHJAX_EXTENSIONS tag can be used to specify one or more MathJax +# extension names that should be enabled during MathJax rendering. For example +# MATHJAX_EXTENSIONS = TeX/AMSmath TeX/AMSsymbols +# This tag requires that the tag USE_MATHJAX is set to YES. 
+ +MATHJAX_EXTENSIONS = + +# The MATHJAX_CODEFILE tag can be used to specify a file with javascript pieces +# of code that will be used on startup of the MathJax code. See the MathJax site +# (see: http://docs.mathjax.org/en/latest/output.html) for more details. For an +# example see the documentation. +# This tag requires that the tag USE_MATHJAX is set to YES. + +MATHJAX_CODEFILE = + +# When the SEARCHENGINE tag is enabled doxygen will generate a search box for +# the HTML output. The underlying search engine uses javascript and DHTML and +# should work on any modern browser. Note that when using HTML help +# (GENERATE_HTMLHELP), Qt help (GENERATE_QHP), or docsets (GENERATE_DOCSET) +# there is already a search function so this one should typically be disabled. +# For large projects the javascript based search engine can be slow, then +# enabling SERVER_BASED_SEARCH may provide a better solution. It is possible to +# search using the keyboard; to jump to the search box use <access key> + S +# (what the <access key> is depends on the OS and browser, but it is typically +# <CTRL>, <ALT>/