develop/doxygen/teca__index__reduce_8h_source.html

 #ifndef teca_index_reduce_h

 #define teca_index_reduce_h


 #include "teca_config.h"

 #include "teca_dataset.h"

 #include "teca_metadata.h"

 #include "teca_shared_object.h"

 #include "teca_threaded_algorithm.h"


 #include <vector>


 TECA_SHARED_OBJECT_FORWARD_DECL(teca_index_reduce)


 /// Base class for MPI+threads+GPUs map reduce reduction over a set of indices.

 /**

  * The available indices are partitioned across MPI ranks and threads. Threads

  * are assigned to service GPUs or CPU cores. One can restrict operation to a

  * range of time steps by setting first and last indices to process.

  *

  * ### metadata keys:

  * #### Requires:

  *

  *  | key                   | description |

  *  | ----                  | ----------- |

  *  | index_initializer_key | Holds the name of the key that tells how many |

  *  |                       | indices are available. The named key must also |

  *  |                       | be present and should contain the number of |

  *  |                       | indices available. |

  *  | index_request_key     | Holds the name of the key used to request a |

  *  |                       | specific index. Requests are generated with this |

  *  |                       | name set to a specific index to be processed |

  *  |                       | some upstream algorithm is expected to produce |

  *  |                       | the data associated with the given index. |

  *

  * #### Exports:

  *

  * | Key                    | Description |

  * | ---------------------- | ----------- |

  * | index_request_key      | The name of the key holding the requested index |

  * | <index_request_key>    | the requested index |

  * | device_id              | the CPU (-1) or CUDA device (0 - n-1 devices) to |

  * |                        | use for calculations |

  * | bounds                 | the [x0 x1 y0 y1 z0 z1] spatial bounds requested |

  * |                        | (optional) |

  * | extent                 | the [i0 i1 j0 j1 k0 k1] index space grid extent |

  * |                        | requested (optional) |

  * | arrays                 | a list of arrays requested (optional) |

  *

  */

 class TECA_EXPORT teca_index_reduce : public teca_threaded_algorithm

 {

 public:

     using extent_type = std::vector<long>;

     using bounds_type = std::vector<double>;


     TECA_ALGORITHM_DELETE_COPY_ASSIGN(teca_index_reduce)

     virtual ~teca_index_reduce(){}


     // report/initialize to/from Boost program options

     // objects.

     TECA_GET_ALGORITHM_PROPERTIES_DESCRIPTION()

     TECA_SET_ALGORITHM_PROPERTIES()


     /** @name extent

      * If provided the extent defines the index space region

      * [i0, i1, j0, j1, k0, k1] of data to request. If not provided the

      * whole_extent is requested when the whole_extent key is present.

      * Otherwise the request is not modified.

      */

     ///@{

     TECA_ALGORITHM_PROPERTY(extent_type, extent)

     ///@}


     /** @name bounds

      * If provided the bounds defines the world coordinate space region

      * [x0, x1, y0, y1, z0, z1] of data to request. bounds take precedence over

      * extents.  If bounds are not provided any provided extents will be used

      * (see ::set_extents) otherwise the request is not modified.

      */

     ///@{

     TECA_ALGORITHM_PROPERTY(bounds_type, bounds)

     ///@}


     /** @name arrays

      * set the list of arrays to request. If not provided then the request is

      * not modified.

      */

     ///@{

     TECA_ALGORITHM_VECTOR_PROPERTY(std::string, array)

     ///@}


     /** @name start_index

      * set the first index to process. Indices go from 0 to n-1. The default

      * start_index is 0.

      */

     ///@{

     TECA_ALGORITHM_PROPERTY(long, start_index)

     ///@}


     /** @name end_index

      * set the last index to process. Indices go from 0 to n-1. The default

      * end_index is -1, which is used to indicate all indices should be

      * processed.

      */

     ///@{

     TECA_ALGORITHM_PROPERTY(long, end_index)

     ///@}


 protected:

     teca_index_reduce();


 protected:


     /** An override that implements the reduction. given two datasets a left

      * and right, reduce into a single dataset and return.

      *

      * @param[in] device_id The device that should be used for the reduction.

      *                      A value of -1 indicates the CPU should be used.

      * @param[in] left a dataset to reduce

      * @param[in] right a dataset to reduce

      *

      * @returns the reduced dataset

      */

     virtual p_teca_dataset reduce(int device_id,

         const const_p_teca_dataset &left,

         const const_p_teca_dataset &right) = 0;


     /** An override that is called when the reduction is complete.  The default

      * implementation passes data through. This might be used for instance to

      * complete an averaging operation where the ::reduce override sums the

      * data and the ::finalize override scales by 1/N, where N is the number of

      * datasets summed.

      *

      * @param[in] device_id The device that should be used for the reduction.

      *                      A value of -1 indicates the CPU should be used.

      * @param[in] ds the reduced dataset

      *

      * @returns a dataset that has been finalized.

      */

     virtual p_teca_dataset finalize(int device_id,

         const const_p_teca_dataset &ds)

     {

         (void) device_id;

         return std::const_pointer_cast<teca_dataset>(ds);

     }


     /** An override that allows derived classes to generate upstream requests

      * that will be applied over all time steps. derived classes implement this

      * method instead of ::get_upstream_request, which here is already

      * implemented to handle the application of requests over the index set.

      * The default implementation creates an empty request that is then

      * populated with extent, bounds, and arrays if these have been provided.

      */

     virtual std::vector<teca_metadata> initialize_upstream_request(

         unsigned int port, const std::vector<teca_metadata> &input_md,

         const teca_metadata &request);


     /** An override that allows derived classes to report what they can

      * produce. this will be called from ::get_output_metadata which will strip

      * out time and partition time across MPI ranks. The default implementation

      * passes the incoming metadata through.

      */

     virtual teca_metadata initialize_output_metadata(unsigned int port,

         const std::vector<teca_metadata> &input_md);


 protected:

 // customized pipeline behavior and parallel code.

 // most derived classes won't need to override these.


     using teca_threaded_algorithm::get_output_metadata;

     using teca_threaded_algorithm::execute;


     /** Generates an upstream request for each index. will call

      * initialize_upstream_request and apply the results to all time steps.

      */

     std::vector<teca_metadata> get_upstream_request(

         unsigned int port, const std::vector<teca_metadata> &input_md,

         const teca_metadata &request) override;


     /** Uses MPI communication to collect remote data for required for the

      * reduction. Calls ::reduce with each pair of datasets until the datasets

      * across all threads and ranks are reduced into a single dataset, which is

      * returned.

      */

     const_p_teca_dataset execute(unsigned int port,

         const std::vector<const_p_teca_dataset> &input_data,

         const teca_metadata &request, int streaming) override;


     /// consumes index metadata, and partitions indices across MPI ranks.

     teca_metadata get_output_metadata(unsigned int port,

         const std::vector<teca_metadata> &input_md) override;


 private:

     /** The driver for reducing the local datasets. Calls the ::reduce override as

      * needed.

      */

     const_p_teca_dataset reduce_local(int device_id,

         std::vector<const_p_teca_dataset> local_data);


     /** The driver for reducing the remote datasets. Calls the ::reduce override

      * as needed.

      */

     const_p_teca_dataset reduce_remote(int device_id,

         const_p_teca_dataset local_data);


 private:

     extent_type extent;

     bounds_type bounds;

     std::vector<std::string> arrays;

     long start_index;

     long end_index;

 };


 #endif

teca_algorithm::get_output_metadata
virtual teca_metadata get_output_metadata(unsigned int port, const std::vector< teca_metadata > &input_md)

teca_index_reduce
Base class for MPI+threads+GPUs map reduce reduction over a set of indices.
Definition: teca_index_reduce.h:51

teca_index_reduce::get_upstream_request
std::vector< teca_metadata > get_upstream_request(unsigned int port, const std::vector< teca_metadata > &input_md, const teca_metadata &request) override

teca_index_reduce::execute
const_p_teca_dataset execute(unsigned int port, const std::vector< const_p_teca_dataset > &input_data, const teca_metadata &request, int streaming) override

teca_index_reduce::initialize_output_metadata
virtual teca_metadata initialize_output_metadata(unsigned int port, const std::vector< teca_metadata > &input_md)

teca_index_reduce::get_output_metadata
teca_metadata get_output_metadata(unsigned int port, const std::vector< teca_metadata > &input_md) override
consumes index metadata, and partitions indices across MPI ranks.

teca_index_reduce::initialize_upstream_request
virtual std::vector< teca_metadata > initialize_upstream_request(unsigned int port, const std::vector< teca_metadata > &input_md, const teca_metadata &request)

teca_metadata
A generic container for meta data in the form of name=value pairs.
Definition: teca_metadata.h:22

teca_threaded_algorithm
This is the base class defining a threaded algorithm.
Definition: teca_threaded_algorithm.h:71

teca_error::TECA_EXPORT
p_teca_error_handler error_handler TECA_EXPORT
The global error handler instance.

teca_geometry::left
TECA_EXPORT bool left(n_t e0x, n_t e0y, n_t e1x, n_t e1y, n_t px, n_t py)
tests if a point is Left|On|Right of an infinite line.
Definition: teca_geometry.h:29

teca_shared_object.h