TPIE

sort_manager.h
1 // -*- mode: c++; tab-width: 4; indent-tabs-mode: t; eval: (progn (c-set-style "stroustrup") (c-set-offset 'innamespace 0)); -*-
2 // vi:set ts=4 sts=4 sw=4 noet :
3 // Copyright 2008, The TPIE development team
4 //
5 // This file is part of TPIE.
6 //
7 // TPIE is free software: you can redistribute it and/or modify it under
8 // the terms of the GNU Lesser General Public License as published by the
9 // Free Software Foundation, either version 3 of the License, or (at your
10 // option) any later version.
11 //
12 // TPIE is distributed in the hope that it will be useful, but WITHOUT ANY
13 // WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 // FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
15 // License for more details.
16 //
17 // You should have received a copy of the GNU Lesser General Public License
18 // along with TPIE. If not, see <http://www.gnu.org/licenses/>
19 
27 
28 #ifndef _TPIE_AMI_SORT_MANAGER_H
29 #define _TPIE_AMI_SORT_MANAGER_H
30 
31 // Get definitions for working with Unix and Windows
32 #include <tpie/portability.h>
33 #include <tpie/stream.h>
34 #include <tpie/tempname.h>
35 #include <tpie/array.h>
36 #include <tpie/merge_sorted_runs.h>
37 #include <tpie/mergeheap.h> //For templated heaps
38 #include <tpie/internal_sort.h> // Contains classes for sorting internal runs
39 // using different comparison types
40 #include <cmath> //for log, ceil, etc.
41 #include <string>
42 #include <boost/filesystem.hpp>
43 
45 
46 #include <tpie/tpie_assert.h>
47 
48 namespace tpie {
49 
51 typedef TPIE_OS_SIZE_T arity_t;
52 
58 
59 template <class T, class I, class M>
60 class sort_manager {
61 
62 public:
63  sort_manager(I* isort, M* mheap);
64 
65  ~sort_manager() {
66  // No code in this destructor.
67  };
68 
72  void sort(file_stream<T>* in, file_stream<T>* out,
73  progress_indicator_base* indicator = NULL);
74 
79  void sort(file_stream<T>* in, progress_indicator_base* indicator = NULL);
80 
81 private:
82  // *************
83  // * Functions *
84  // *************
85 
86  void start_sort(); // high level wrapper to full sort
87  void compute_sort_params(); // compute nInputItems, mrgArity, nRuns
88  void partition_and_sort_runs(progress_indicator_base* indicator, tpie::array<temp_file> & temporaries); // make initial sorted runs
89  void merge_to_output(progress_indicator_base* indicator, tpie::array<temp_file> & temporaries); // loop over merge tree, create output stream
90  // Merge a single group mrgArity streams to an output stream
91  void single_merge(
92  typename tpie::array<tpie::unique_ptr<file_stream<T> > >::iterator,
93  typename tpie::array<tpie::unique_ptr<file_stream<T> > >::iterator,
94  file_stream<T>*, TPIE_OS_OFFSET = -1, progress_indicator_base* indicator=0);
95 
96  // **************
97  // * Attributes *
98  // **************
99 
100  I* m_internalSorter; // Method for sorting runs in memory
101  M* m_mergeHeap; // Merge heap implementation
102  file_stream<T>* inStream;
103  file_stream<T>* outStream;
104  TPIE_OS_OFFSET nInputItems; // Number of items in inStream;
105  TPIE_OS_SIZE_T mmBytesAvail; // Amount of spare memory we can use
106  TPIE_OS_SIZE_T mmBytesPerStream; // Memory consumed by each Stream obj
107 
108  progress_indicator_base* m_indicator; // pointer to progress indicator
109 
110  TPIE_OS_OFFSET progCount; //counter for showing progress
111 
112  bool use2xSpace; //flag to indicate if we are doing a 2x sort
113 
114  // The maximum number of stream items of type T that we can
115  // sort in internal memory
116  TPIE_OS_SIZE_T nItemsPerRun;
117 
118  TPIE_OS_OFFSET nRuns; //The number of sorted runs left to merge
119  arity_t mrgArity; //Max runs we can merge at one time
120 
121  // The output stream to which we are currently writing runs
122  file_stream<T>* curOutputRunStream;
123 
124  // The minimum number of runs in each output stream
125  // some streams can have one additional run
126  TPIE_OS_OFFSET minRunsPerStream;
127  // The number of extra runs or the number of streams that
128  // get one additional run.
129  arity_t nXtraRuns;
130 
131  // The last run can have fewer than nItemsPerRun;
132  TPIE_OS_SIZE_T nItemsInLastRun;
133  // How many items we will sort in a given run
134  TPIE_OS_SIZE_T nItemsInThisRun;
135  // For each output stream, how many runs it should get
136  TPIE_OS_OFFSET runsInStream;
137 
138  // A buffer for building the output file names
139  std::string newName;
140 
141  //prefix of temp files created during sort
142  std::string working_disk;
143 
144 private:
145  sort_manager(const sort_manager<T,I,M>& other);
146  sort_manager<T,I,M>& operator=(const sort_manager<T,I,M>& other);
147 };
148 
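// Illustrative usage sketch: the template parameters I and M are an internal
// run sorter and a merge heap; the concrete type names below are hypothetical
// placeholders (the real ones are provided by internal_sort.h and mergeheap.h
// via sort.h), so this only shows the intended call order.
//
//   Internal_Sorter_Op<T, Compare> isort;                // hypothetical name
//   merge_heap_op<Compare> mheap;                        // hypothetical name
//   sort_manager<T, Internal_Sorter_Op<T, Compare>,
//                   merge_heap_op<Compare> > sm(&isort, &mheap);
//   sm.sort(&in, &out, indicator);  // 3x-space sort, in != out
//   sm.sort(&in, indicator);        // 2x-space sort, result replaces input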
149 template <class T, class I, class M>
150 sort_manager<T, I, M>::sort_manager(I* isort, M* mheap):
151  m_internalSorter(isort),
152  m_mergeHeap(mheap),
153  inStream(0),
154  outStream(0),
155  nInputItems(0),
156  mmBytesAvail(0),
157  mmBytesPerStream(0),
158  m_indicator(NULL),
159  progCount(0),
160  use2xSpace(false),
161  nItemsPerRun(0),
162  nRuns(0),
163  mrgArity(0),
164  curOutputRunStream(NULL),
165  minRunsPerStream(0),
166  nXtraRuns(0),
167  nItemsInLastRun(0),
168  nItemsInThisRun(0),
169  runsInStream(0) {
170 
171  // Prefix of temp files created during sort
172  working_disk = std::string(tempname::tpie_name("sort"));
173 };
174 
175 template<class T, class I, class M>
176 void sort_manager<T,I,M>::sort(file_stream<T>* in, file_stream<T>* out,
177  progress_indicator_base* indicator){
178  m_indicator = indicator;
179 
180  // if the input and output stream are the same, we only use 2x space.
181  // otherwise, we need 3x space. (input, current temp runs, output runs)
182  use2xSpace = (in == out);
183 
184  inStream = in;
185  outStream = out;
186 
187  // Basic checks that input is ok
188  if (in==NULL || out==NULL) {
189  if (m_indicator) {m_indicator->init(1); m_indicator->step(); m_indicator->done();}
190  throw exception("NULL_POINTER");
191  }
192 
193  if (inStream->size() < 2) {
194  if (m_indicator) {m_indicator->init(1); m_indicator->step(); m_indicator->done();}
195  in->seek(0);
196  if (in != out) {
197  out->seek(0);
198  if (in->size() == 1)
199  out->write(in->read());
200  }
201  return;
202  }
203 
204  // Else, there is something to sort, do it
205  start_sort();
206 }
207 
208 template<class T, class I, class M>
209 void sort_manager<T,I,M>::sort(file_stream<T>* in, progress_indicator_base* indicator){
210  sort(in, in, indicator);
211 }
212 
213 template<class T, class I, class M>
214 void sort_manager<T,I,M>::start_sort(){
215 
216  // ********************************************************************
217  // * PHASE 1: See if we can sort the entire stream in internal memory *
218  // * without the need to use general merge sort *
219  // ********************************************************************
220 
221  // Figure out how much memory we've got to work with.
222  mmBytesAvail = consecutive_memory_available();
223 
224  // Space for internal buffers for the input and output stream may not
225  // have been allocated yet. Query the space usage and subtract.
226  mmBytesPerStream = file_stream<T>::memory_usage(1);
227 
228  // This is how much we can use for internal sort if
229  // we are not doing general merge sort
230  mmBytesAvail -= 2 * mmBytesPerStream;
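// Example with assumed figures: with 128 MiB of consecutive memory available
// and roughly 1 MiB of buffer space per stream, about 126 MiB remain for the
// internal-memory sort check below.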
231 
232  // Check if all input items can be sorted internally using less than
233  // mmBytesAvail
234  nInputItems = inStream->size();
235 
236  inStream->seek (0);
237 
238  if (nInputItems < TPIE_OS_OFFSET(m_internalSorter->MaxItemCount(mmBytesAvail))) {
239 
240  fractional_progress fp(m_indicator);
241  fp.id() << __FILE__ << __FUNCTION__ << "internal_sort" << typeid(T) << typeid(I) << typeid(M);
242  fractional_subindicator allocate_progress(fp, "allocate", TPIE_FSI, nInputItems, "Allocating");
243  fractional_subindicator sort_progress(fp, "sort", TPIE_FSI, nInputItems);
244  fp.init();
245  allocate_progress.init(nInputItems);
246  m_internalSorter->allocate(static_cast<TPIE_OS_SIZE_T>(nInputItems));
247  allocate_progress.done();
248 
249  // load the items into main memory, sort, and write to output.
250  // m_internalSorter also checks if inStream/outStream are the same and
251  // truncates/rewrites inStream if they are. This probably should not
252  // be the job of m_internalSorter. TODO: build a cleaner interface
253  m_internalSorter->sort(inStream,
254  outStream,
255  static_cast<TPIE_OS_SIZE_T>(nInputItems),
256  &sort_progress);
257  // de-allocate the internal array of items
258  m_internalSorter->deallocate();
259  fp.done();
260  return;
261  }
262 
263  // ******************************************************************
264  // * Input stream too large for main memory, use general merge sort *
265  // ******************************************************************
266 
267  // PHASE 2: compute nItemsPerRun, mrgArity, nRuns
268  compute_sort_params();
269 
270  // ********************************************************************
271  // * By this point we have checked that we have valid input, checked *
272  // * that we indeed need an external memory sort, verified that we *
273  // * have enough memory to partition and at least do a binary merge. *
274  // * Also checked that we have enough file descriptors to merge, *
275  // * and calculated the mrgArity and nItemsPerRun given memory *
276  // * constraints. We have also calculated nRuns for the initial *
277  // * number of runs we will partition into. Let's sort! *
278  // ********************************************************************
279 
280  // ********************************************************************
281  // * WARNING: Since we accounted for all known memory usage in PHASE 2*
282  // * be very wary of memory allocation via "new" or constructors from *
283  // * this point on and make sure it was accounted for in PHASE 2 *
284  // ********************************************************************
285  fractional_progress fp(m_indicator);
286  fp.id() << __FILE__ << __FUNCTION__ << "external_sort" << typeid(T) << typeid(I) << typeid(M);
287  fractional_subindicator run_progress(fp, "run", TPIE_FSI, nInputItems,"",tpie::IMPORTANCE_LOG);
288  fractional_subindicator merge_progress(fp, "merge", TPIE_FSI, nInputItems,"",tpie::IMPORTANCE_LOG);
289  fp.init();
290 
291  tpie::array<temp_file> temporaries(mrgArity*2);
292 
293  // PHASE 3: partition and form sorted runs
294  TP_LOG_DEBUG_ID ("Beginning general merge sort.");
295  partition_and_sort_runs(&run_progress, temporaries);
296  // PHASE 4: merge sorted runs to a single output stream
297  merge_to_output(&merge_progress, temporaries);
298 
299  fp.done();
300 }
301 
302 template<class T, class I, class M>
303 void sort_manager<T,I,M>::compute_sort_params(void){
304  // ********************************************************************
305  // * PHASE 2: Compute/check limits *
306  // * Compute the maximum number of items we can sort in main memory *
307  // * and the maximum number of sorted runs we can merge at one time *
308  // * Before doing any sorting, check that we can fit at least one item*
309  // * in internal memory for sorting and that we can merge at least two*
310  // * runs at a time *
311  // * *
312  // * Memory needed for the run formation phase: *
313  // * 2*mmBytesPerStream + {for input/output streams} *
314  // * nItemsPerRun*space_per_sort_item() + {for each item sorted } *
315  // * space_overhead_sort() {constant overhead in *
316  // * sort management object *
317  // * during sorting } *
318  // * *
319  // * Memory needed for a D-way merge: *
320  // * Cost per merge stream: *
321  // * mmBytesPerStream+ {an open stream to read from} *
322  // * space_per_merge_item()+ {used in internal merge heap} *
323  // * sizeof(T*)+sizeof(off_t) {arrays in single_merge()} *
324  // * sizeof(stream<T>*) {array element that points to *
325  // * merge stream} *
326  // * Fixed costs: *
327  // * 2*mmBytesPerStream+ {original input stream + output *
328  // * of current merge} *
329  // * space_overhead_merge()+ {fixed dynamic memory costs of *
330  // * merge heap} *
331  // * 3*space_overhead() {overhead per "new" memory request *
332  // * for allocating array of streams *
333  // * in merge_to_output and two arrays *
334  // * in single_merge} *
335  // * *
336  // * Total cost for D-way Merge: *
337  // * D*(Cost per merge stream)+(Fixed costs) *
338  // * *
339  // * Any additional memory requests that call "new" directly or *
340  // * indirectly should be documented and accounted for in this phase *
341  // ********************************************************************
342 
343  TP_LOG_DEBUG_ID ("Computing merge sort parameters.");
344 
345  TPIE_OS_SIZE_T mmBytesAvailSort; // Bytes available for sorting
346 
347  TP_LOG_DEBUG ("Each object of size " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(sizeof(T)) << " uses "
348  << static_cast<TPIE_OS_OUTPUT_SIZE_T>(m_internalSorter->space_per_item ()) << " bytes "
349  << "for sorting in memory\n");
350 
351  // Subtract off size of temp output stream
352  // The size of the input stream was already subtracted from
353  // mmBytesAvail
354  mmBytesAvailSort=mmBytesAvail - mmBytesPerStream;
355 
356  nItemsPerRun=m_internalSorter->MaxItemCount(mmBytesAvailSort);
357 
358  if(nItemsPerRun<1){
359  throw stream_exception("Insufficient Memory for forming sorted runs");
360  }
361 
362  // Now we know the max number of Items we can sort in a single
363  // internal memory run. Next, compute the number of runs we can
364  // merge together at one time
365 
366  TPIE_OS_SIZE_T mmBytesPerMergeItem = mmBytesPerStream +
367  m_mergeHeap->space_per_item() + sizeof(T*) +
368  sizeof(TPIE_OS_OFFSET)+sizeof(ami::stream<T>*);
369 
370  // Fixed cost of merge heap impl. + MM_manager overhead of allocating
371  // an array of stream<T> ptrs (pending)
372  // cost of Input stream already accounted for in mmBytesAvail..
373  TPIE_OS_SIZE_T mmBytesFixedForMerge = m_mergeHeap->space_overhead() +
374  mmBytesPerStream;
375 
376  if (mmBytesFixedForMerge > mmBytesAvail) {
377  throw stream_exception("Insufficient memory for merge heap and output stream");
378  }
379 
380  // Cast down from TPIE_OS_OFFSET (type of mmBytesAvail).
381  // mmBytesPerMergeItem is at least 1KB, so we are OK unless we
382  // have more than 2 terabytes of memory, assuming 64 bit
383  // (or smaller) TPIE_OS_OFFSETS. I look forward to the day
384  // this comment seems silly and wrong
385  mrgArity = static_cast<arity_t>(mmBytesAvail-mmBytesFixedForMerge) /
386  mmBytesPerMergeItem;
387  TP_LOG_DEBUG("mem avail=" << static_cast<TPIE_OS_OUTPUT_SIZE_T>(mmBytesAvail-mmBytesFixedForMerge)
388  << " bytes per merge item=" << static_cast<TPIE_OS_OUTPUT_SIZE_T>(mmBytesPerMergeItem)
389  << " initial mrgArity=" << static_cast<TPIE_OS_OUTPUT_SIZE_T>(mrgArity) << "\n");
390 
391  // Need to support at least binary merge
392  if(mrgArity < 2) {
393  throw stream_exception("Merge arity < 2 -- Insufficient memory for a merge.");
394  }
395 
396  // Make sure that the AMI is willing to provide us with the
397  // number of substreams we want. It may not be able to due to
398  // operating system restrictions, such as on the number of regions
399  // that can be mmap()ed in, max number of file descriptors, etc.
400  int availableStreams = static_cast<int>(get_file_manager().available());
401 
402  // Merging requires an available stream/file descriptor for
403  // each of the mrgArity input streams. We need one additional file descriptor
404  // for the output of the current merge, so binary merge requires
405  // three available streams.
406  if (availableStreams < 3) {
407  throw stream_exception("Not enough stream descriptors available to perform merge.");
408  }
409 
410  // Can at least do binary merge. See if availableStreams limits
411  // maximum mrgArity
412  // Due to the previous test, we know that available_streams >= 3.
413  if (mrgArity > static_cast<arity_t>(availableStreams - 1)) {
414 
415  mrgArity = static_cast<arity_t>(availableStreams - 1);
416 
417  TP_LOG_DEBUG_ID ("Reduced merge arity due to AMI restrictions.");
418  }
419 
420  // The number of memory-sized runs that the original input stream
421  // will be partitioned into.
422  nRuns = ((nInputItems + nItemsPerRun - 1) / nItemsPerRun);
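// Example with assumed figures: nInputItems = 1,000,000 and
// nItemsPerRun = 300,000 give nRuns = ceil(1,000,000 / 300,000) = 4.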
423 
424 #ifdef TPIE_SORT_SMALL_MRGARITY
425  // KEEP OUT!!!
426  // This should not be done by the typical user and is only for
427  // testing/debugging purposes. ONLY define this flag and set a value
428  // if you know what you are doing.
429  TP_LOG_WARNING_ID("TPIE_SORT_SMALL_MRGARITY flag is set."
430  " Did you mean to do this?");
431  if(mrgArity > TPIE_SORT_SMALL_MRGARITY) {
432  TP_LOG_WARNING_ID("Reducing merge arity due to compiler specified flag");
433  mrgArity=TPIE_SORT_SMALL_MRGARITY;
434  }
435 #endif // TPIE_SORT_SMALL_MRGARITY
436 
437 #ifdef TPIE_SORT_SMALL_RUNSIZE
438  // KEEP OUT!!!
439  // This should not be done by the typical user and is only for
440  // testing/debugging purposes ONLY define this flag and set a value
441  // if you know what you are doing.
442  TP_LOG_WARNING_ID("TPIE_SORT_SMALL_RUNSIZE flag is set."
443  " Did you mean to do this?");
444  if(nItemsPerRun > TPIE_SORT_SMALL_RUNSIZE) {
445  TP_LOG_WARNING_ID("Reducing run size due to compiler specified flag");
446  nItemsPerRun=TPIE_SORT_SMALL_RUNSIZE;
447  }
448 
449  // need to adjust nRuns
450  nRuns = ((nInputItems + nItemsPerRun - 1) / nItemsPerRun);
451 #endif // TPIE_SORT_SMALL_RUNSIZE
452 
453  //#define MINIMIZE_INITIAL_RUN_LENGTH
454 #ifdef MINIMIZE_INITIAL_RUN_LENGTH
455  // If compiled with the above flag, try to reduce the length of
456  // the initial sorted runs without increasing the merge tree height
457  // This could be a speed-up if it is faster to quicksort many small
458  // runs and merge them than it is to quicksort fewer long
459  // runs and merge them.
460  TP_LOG_DEBUG_ID ("Minimizing initial run lengths without increasing" <<
461  " the height of the merge tree.");
462 
463  // The tree height is the ceiling of the log base mrgArity of the
464  // number of original runs.
465  double tree_height = log((double)nRuns) / log((double)mrgArity);
466  tp_assert (tree_height > 0, "Negative or zero tree height!");
467  tree_height = ceil (tree_height);
468 
469  // See how many runs we could possibly fit in the tree without
470  // increasing the height.
471  double maxOrigRuns = pow ((double) mrgArity, tree_height);
472  tp_assert (maxOrigRuns >= nRuns, "Number of permitted runs was reduced!");
473 
474  // How big will such runs be?
475  double new_nItemsPerRun = ceil (nInputItems/ maxOrigRuns);
476  tp_assert (new_nItemsPerRun <= nItemsPerRun,
477  "Size of original runs increased!");
478 
479  // Update the number of items per run and the number of original runs
480  nItemsPerRun = (TPIE_OS_SIZE_T) new_nItemsPerRun;
481 
482  TP_LOG_DEBUG_ID ("With long internal memory runs, nRuns = "
483  << nRuns);
484 
485  nRuns = (nInputItems + nItemsPerRun - 1) / nItemsPerRun;
486 
487  TP_LOG_DEBUG_ID ("With shorter internal memory runs "
488  << "and the same merge tree height, nRuns = "
489  << nRuns );
490 
491  tp_assert (maxOrigRuns >= nRuns,
492  "We increased the merge height when we weren't supposed to do so!");
493 #endif // MINIMIZE_INITIAL_RUN_LENGTH
494 
495 
496  // If we have just a few runs, we don't need the
497  // full mrgArity. This is the last change to mrgArity
498  // N.B. We need to "up"-cast mrgArity here!
499  if(static_cast<TPIE_OS_OFFSET>(mrgArity)>nRuns){
500  // N.B. We know that nRuns is small, so
501  // it is safe to downcast.
502  mrgArity=static_cast<TPIE_OS_SIZE_T>(nRuns);
503  }
504 
505  // We should always end up with at least two runs
506  // otherwise why are we doing it externally?
507  tp_assert (nRuns > 1, "Less than two runs to merge!");
508  // Check that numbers are consistent with input size
509  tp_assert (nRuns * nItemsPerRun - nInputItems < nItemsPerRun,
510  "Total expected output size is too large.");
511  tp_assert (nInputItems - (nRuns - 1) * nItemsPerRun <= nItemsPerRun,
512  "Total expected output size is too small.");
513 
514  TP_LOG_DEBUG_ID ("Input stream has " << nInputItems << " items");
515  TP_LOG_DEBUG ("Max number of items per runs " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(nItemsPerRun) );
516  TP_LOG_DEBUG ("\nInitial number of runs " << nRuns );
517  TP_LOG_DEBUG ("\nMerge arity is " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(mrgArity) << "\n" );
518 }
519 
520 template<class T, class I, class M>
521 void sort_manager<T,I,M>::partition_and_sort_runs(progress_indicator_base* indicator, tpie::array<temp_file> & temporaries){
522  // ********************************************************************
523  // * PHASE 3: Partition *
524  // * Partition the input stream into nRuns of at most nItemsPerRun *
525  // * and sort them, and write them to temporary output files. *
526  // * The last run may have fewer than nItemsPerRun. To keep the number*
527  // * of files down and to support sequential I/O, we distribute the *
528  // * nRuns evenly across mrgArity files, thus each file on disk holds *
529  // * multiple sorted runs. *
530  // ********************************************************************
531 
532  // The minimum number of runs in each output stream
533  // some streams can have one additional run
534  minRunsPerStream = nRuns/mrgArity;
535  // The number of extra runs or the number of streams that
536  // get one additional run. This is less than mrgArity and
537  // it is OK to downcast to an arity_t.
538  nXtraRuns = static_cast<arity_t>(nRuns - minRunsPerStream*mrgArity);
539  tp_assert(nXtraRuns<mrgArity, "Too many extra runs");
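// Example with assumed figures: nRuns = 10 and mrgArity = 4 give
// minRunsPerStream = 2 and nXtraRuns = 2, so the first two run files get
// 2 runs each and the last two get 3 runs each (2 + 2 + 3 + 3 = 10).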
540 
541  // The last run can have fewer than nItemsPerRun;
542  // general case
543  nItemsInLastRun = static_cast<TPIE_OS_SIZE_T>(nInputItems % nItemsPerRun);
544  if(nItemsInLastRun==0){
545  // Input size is an exact multiple of nItemsPerRun
546  nItemsInLastRun=nItemsPerRun;
547  }
548 
549  // Initialize memory for the internal memory runs
550  // accounted for in phase 2: (nItemsPerRun*size_of_sort_item) +
551  // space_overhead_sort
552  m_internalSorter->allocate(nItemsPerRun);
553 
554  TP_LOG_DEBUG_ID ("Partitioning and forming sorted runs.");
555 
556  // nItemsPerRun except for last run.
557  nItemsInThisRun=nItemsPerRun;
558 
559  // Rewind the input stream, we are about to begin
560  inStream->seek(0);
561 
562  // ********************************************************************
563  // * Partition and make initial sorted runs *
564  // ********************************************************************
565  TPIE_OS_OFFSET check_size = 0; //for debugging
566 
567  if (indicator)
568  indicator->init(nRuns*1000);
569 
570  for(arity_t ii=0; ii<mrgArity; ii++){ //For each output stream
571  // Dynamically allocate the stream
572  // We account for these mmBytesPerStream in phase 2 (output stream)
573  curOutputRunStream = tpie_new<file_stream<T> >();
574  curOutputRunStream->open(temporaries[ii], access_write);
575 
576  // How many runs should this stream get?
577  // extra runs go in the LAST nXtraRuns streams so that
578  // the one short run is always in the LAST output stream
579  runsInStream = minRunsPerStream + ((ii >= mrgArity-nXtraRuns)?1:0);
580 
581  for(TPIE_OS_OFFSET jj=0; jj < runsInStream; jj++ ) { // For each run in this stream
582  // See if this is the last run
583  if( (ii==mrgArity-1) && (jj==runsInStream-1)) {
584  nItemsInThisRun=nItemsInLastRun;
585  }
586 
587  progress_indicator_subindicator sort_indicator(indicator, 1000);
588  m_internalSorter->sort(inStream, curOutputRunStream,
589  nItemsInThisRun, &sort_indicator);
590  } // For each run in this stream
591 
592  // All runs created for this stream, clean up
593  TP_LOG_DEBUG_ID ("Wrote " << runsInStream << " runs and "
594  << curOutputRunStream->size() << " items to file "
595  << static_cast<TPIE_OS_OUTPUT_SIZE_T>(ii));
596  check_size+=curOutputRunStream->size();
597  tpie_delete(curOutputRunStream);
598 
599  }//For each output stream
600  tp_assert(check_size == nInputItems, "item count mismatch");
601 
602  // Done with partitioning and initial run formation
603  // free space associated with internal memory sorting
604  m_internalSorter->deallocate();
605  if(use2xSpace){
606  //recall outStream/inStream point to same file in this case
607  inStream->truncate(0); //free up disk space
608  inStream->seek(0);
609  }
610  if (indicator) indicator->done();
611 }
612 
613 template<class T, class I, class M>
614 void sort_manager<T,I,M>::merge_to_output(progress_indicator_base* indicator, tpie::array<temp_file> & temporaries){
615  // ********************************************************************
616  // * PHASE 4: Merge *
617  // * Loop over all levels of the merge tree, reading mrgArity runs *
618  // * at a time from the streams at the current level and distributing *
619  // * merged runs over mrgArity output streams one level up, until *
620  // * a single output stream exists *
621  // ********************************************************************
622 
623  // The input streams from which we will read sorted runs
624  // This Memory allocation accounted for in phase 2:
625  // mrgArity*sizeof(stream<T>*) + space_overhead()[fixed cost]
626  tpie::array<tpie::unique_ptr<file_stream<T> > > mergeInputStreams(mrgArity);
627 
628  TP_LOG_DEBUG_ID("Allocated " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(sizeof(ami::stream<T>*)*mrgArity)
629  << " bytes for " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(mrgArity) << " merge input stream pointers.\n"
630  << "Mem. avail. is " << consecutive_memory_available ());
631 
632  // the number of iterations the main loop has gone through,
633  // at most the height of the merge tree log_{M/B}(N/B),
634  // typically 1 or 2
635  int mrgHeight = 0;
636  int treeHeight = 0; //for progress
637  TPIE_OS_SIZE_T ii; //index vars
638  TPIE_OS_OFFSET jj; //index vars
639 
640  // This Memory allocation accounted for in phase 2:
641  // mrgArity*space_per_merge_item
642  m_mergeHeap->allocate( mrgArity ); //Allocate mem for mergeheap
643 
644  // *****************************************************************
645  // * *
646  // * The main loop. At the outermost level we are looping over *
647  // * levels of the merge tree. Typically this will be very small, *
648  // * e.g. 1-3. The final merge pass is handled outside the loop. *
649  // * Future extension may want to do something special in the last *
650  // * merge *
651  // * *
652  // *****************************************************************
653 
654  if (indicator) {
655  //compute merge depth, number of passes over data
656  treeHeight= static_cast<int>(ceil(log(static_cast<float>(nRuns)) /
657  log(static_cast<float>(mrgArity))));
658 
659  indicator->set_range( nInputItems * treeHeight);
660  indicator->init();
661  }
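// Example with assumed figures: nRuns = 100 initial runs and mrgArity = 10
// give treeHeight = ceil(log(100)/log(10)) = 2, i.e. two passes over the
// data: one intermediate pass in the loop below plus the final merge.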
662 
663  //nRuns is initially the number of runs we formed in partition_and_sort
664  //phase. nXtraRuns is initially the number of output streams that
665  //contain one extra run. nRuns and nXtraRuns are updated as we
666  //complete a merge level.
667  while (nRuns > TPIE_OS_OFFSET(mrgArity)) {
668  // if (m_indicator) {
669  // std::string description;
670  // std::stringstream buf;
671  // buf << "Merge pass " << mrgHeight+1 << " of " << treeHeight << " ";
672  // buf >> description;
673  // m_indicator->set_percentage_range(0, nInputItems);
674  // m_indicator->init(description);
675  // }
676 
677  // We are not yet at the top of the merge tree
678  // Write merged runs to temporary output streams
679  TP_LOG_DEBUG ("Intermediate merge. level="<<mrgHeight << "\n");
680 
681  // The number of output runs we will form after a mrgArity merge
682  nRuns = (nRuns + mrgArity - 1)/mrgArity;
683 
684  // Distribute the new nRuns evenly across mrgArity (or fewer)
685  // output streams
686  minRunsPerStream = nRuns/mrgArity;
687 
688  // We may have fewer than mrgArity input runs for the last
689  // merged output run if the current set of merge streams has
690  // xtra runs
691  arity_t mergeRunsInLastOutputRun=(nXtraRuns>0) ? nXtraRuns : mrgArity;
692 
693  // The number of extra runs or the number of output streams that
694  // get one additional run. This is less than mrgArity and
695  // it is OK to downcast to an arity_t.
696  nXtraRuns = static_cast<arity_t>(nRuns - minRunsPerStream*mrgArity);
697  tp_assert(nXtraRuns<mrgArity, "Too many extra runs");
698 
699  // How many Streams we will create at the next level
700  arity_t nOutputStreams = (minRunsPerStream > 0) ? mrgArity : nXtraRuns;
701 
702  arity_t nRunsToMerge = mrgArity; // may change for last output run
703 
704  // open the mrgArity Input streams from which to read runs
705  for(ii = 0; ii < mrgArity; ii++){
706  // Dynamically allocate the stream
707  // We account for these mmBytesPerStream in phase 2
708  // (input stream to read from)
709  file_stream<T> * stream = tpie_new<file_stream<T> >();
710  mergeInputStreams[ii].reset(stream);
711  stream->open(temporaries[mrgArity*(mrgHeight%2)+ii], access_read);
712  stream->seek(0);
713  }
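// Note on the indexing above: the 2*mrgArity temp files are used in a
// ping-pong fashion. Level mrgHeight reads its runs from
// temporaries[mrgArity*(mrgHeight%2) + 0 .. mrgArity-1] and writes the
// merged output to the other half, indexed with (mrgHeight+1)%2 below.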
714 
715  TPIE_OS_OFFSET check_size=0;
716  // For each new output stream, fill with merged runs.
717  // strange indexing is for the case that there are fewer than mrgArity
718  // output streams needed, and we use the LAST nOutputStreams. This
719  // always keeps the one possible short run in the LAST of the
720  // mrgArity output streams.
721  TP_LOG_DEBUG("Writing " << nRuns << " runs to " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(nOutputStreams)
722  << " output files.\nEach output file has at least "
723  << minRunsPerStream << " runs.\n");
724 
725  for(ii = mrgArity-nOutputStreams; ii < mrgArity; ii++){
726  // Dynamically allocate the stream
727  // We account for these mmBytesPerStream in phase 2
728  // (temp merge output stream)
729  file_stream<T> curOutputRunStream;
730  curOutputRunStream.open(temporaries[mrgArity*((mrgHeight+1)%2)+ii], access_write);
731 
732  // How many runs should this stream get?
733  // extra runs go in the LAST nXtraRuns streams so that
734  // the one short run is always in the LAST output stream
735  runsInStream = minRunsPerStream + ((ii >= mrgArity-nXtraRuns)?1:0);
736  TP_LOG_DEBUG("Writing " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(runsInStream) << " runs to output "
737  << " file " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(ii) << "\n");
738  for( jj=0; jj < runsInStream; jj++ ) { // For each run in this stream
739  // See if this is the last run.
740  if( (ii==mrgArity-1) && (jj==runsInStream-1)) {
741  nRunsToMerge=mergeRunsInLastOutputRun;
742  }
743  // Merge runs to curOutputRunStream
744  single_merge(mergeInputStreams.find(mrgArity-nRunsToMerge),
745  mergeInputStreams.find(mrgArity),
746  &curOutputRunStream,
747  nItemsPerRun, indicator);
748  } // For each output run in this stream
749 
750  // Commit new output stream to disk
751  TP_LOG_DEBUG("Wrote " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(runsInStream) << " runs and "
752  << curOutputRunStream.size() << " items "
753  << "to file " << static_cast<TPIE_OS_OUTPUT_SIZE_T>(ii) << "\n");
754  check_size+=curOutputRunStream.size();
755  } // For each new output stream
756 
757  tp_assert(check_size==nInputItems, "item count mismatch in merge");
758  // All output streams created/filled.
759  // Clean up, go up to next level
760 
761  // Delete temp input merge streams
762  for(ii = 0; ii < mrgArity; ii++) {
763  mergeInputStreams[ii].reset();
764  temporaries[mrgArity*(mrgHeight%2)+ii].free();
765  }
766  // Update run lengths
767  nItemsPerRun=mrgArity*nItemsPerRun; //except for maybe last run
768  mrgHeight++; // moving up a level
769  } // while (nRuns > mrgArity)
770 
771  tp_assert( nRuns > 1, "Not enough runs to merge to final output");
772  tp_assert( nRuns <= TPIE_OS_OFFSET(mrgArity), "Too many runs to merge to final output");
773 
774  // We are at the last merge phase, write to specified output stream
775  // Open up the nRuns final merge streams to merge
776  // These runs are packed in the LAST nRuns elements of the array
777  // nRuns is small, so it is safe to downcast.
778  TP_LOG_DEBUG_ID ("Final merge. level="<<mrgHeight);
779  TP_LOG_DEBUG("Merge runs left="<<nRuns<<"\n");
780  for(ii = mrgArity-static_cast<TPIE_OS_SIZE_T>(nRuns); ii < mrgArity; ii++){
781  /* Dynamically allocate the stream
782  We account for these mmBytesPerStream in phase 2
783  (input stream to read from)
784  Put LAST nRuns files in FIRST nRuns spots here
785  either one of mergeInputStreams loading or the call to
786  single_merge is a little messy. I put the mess here. (abd) */
787  TP_LOG_DEBUG ("Putting merge stream "<< static_cast<TPIE_OS_OUTPUT_SIZE_T>(ii) << " in slot "
788  << static_cast<TPIE_OS_OUTPUT_SIZE_T>(ii-(mrgArity-static_cast<TPIE_OS_SIZE_T>(nRuns))) << "\n");
789  file_stream<T> * stream = tpie_new<file_stream<T> >();
790  mergeInputStreams[ii-(mrgArity-static_cast<TPIE_OS_SIZE_T>(nRuns))].reset(stream);
791  stream->open(temporaries[mrgArity*(mrgHeight%2)+ii], access_read);
792  stream->seek(0);
793  }
794 
795  // Merge last remaining runs to the output stream.
796  // mergeInputStreams is address( address (the first input stream) )
797  // N.B. nRuns is small, so it is safe to downcast.
798  single_merge(mergeInputStreams.begin(),
799  mergeInputStreams.find((size_t)nRuns),
800  outStream, -1, indicator);
801 
802  if (indicator) indicator->done();
803  tp_assert((TPIE_OS_OFFSET)outStream->size() == nInputItems, "item count mismatch");
804 
805  TP_LOG_DEBUG("merge cleanup\n");
806 
807  // Delete stream ptr arrays
808  mergeInputStreams.resize(0);
809 
810  // Deallocate the merge heap, free up memory
811  m_mergeHeap->deallocate();
812  TP_LOG_DEBUG_ID ("Number of passes incl run formation is " <<
813  mrgHeight+2 );
814  TP_LOG_DEBUG("AMI_partition_and_merge END\n");
815 }
816 
817 template<class T, class I, class M>
818 void sort_manager<T,I,M>::single_merge(
819  typename tpie::array<tpie::unique_ptr<file_stream<T> > >::iterator start,
820  typename tpie::array<tpie::unique_ptr<file_stream<T> > >::iterator end,
821  file_stream < T >*outStream, TPIE_OS_OFFSET cutoff, progress_indicator_base* indicator)
822 {
823 
824  merge_sorted_runs(start, end, outStream, m_mergeHeap,
825  cutoff, indicator);
826 }
827 
828 
829 } // tpie namespace
830 
831 #endif // _TPIE_AMI_SORT_MANAGER_H