Stxxl
1.4.0
|
This is an example of how to use some basic algorithms from the stream package. The example sorts characters of a string producing an array of sorted tuples (character, index position).
/*************************************************************************** * stream/test_stream.cpp * * Part of the STXXL. See http://stxxl.sourceforge.net * * Copyright (C) 2003 Roman Dementiev <dementiev@mpi-sb.mpg.de> * Copyright (C) 2007 Andreas Beckmann <beckmann@mpi-inf.mpg.de> * Copyright (C) 2009, 2010 Johannes Singler <singler@kit.edu> * * Distributed under the Boost Software License, Version 1.0. * (See accompanying file LICENSE_1_0.txt or copy at * http://www.boost.org/LICENSE_1_0.txt) **************************************************************************/ //! \example stream/test_stream.cpp //! This is an example of how to use some basic algorithms from the //! stream package. The example sorts characters of a string producing an //! array of sorted tuples (character, index position). #include <limits> #include <vector> #include <stxxl/stream> #include <stxxl/vector> #define USE_FORMRUNS_N_MERGE // comment if you want to use one 'sort' algorithm // without producing intermediate sorted runs. #define USE_EXTERNAL_ARRAY // comment if you want to use internal vectors as // input/output of the algorithm #define block_size (8 * 1024) typedef stxxl::tuple<char, int> tuple_type; namespace std { std::ostream & operator << (std::ostream & os, const tuple_type & t) { os << "<" << t.first << "," << t.second << ">"; return os; } } #ifdef USE_EXTERNAL_ARRAY typedef stxxl::VECTOR_GENERATOR<char>::result input_array_type; typedef stxxl::VECTOR_GENERATOR<tuple_type>::result output_array_type; #else typedef std::vector<char> input_array_type; typedef std::vector<tuple_type> output_array_type; #endif using stxxl::stream::streamify; using stxxl::stream::streamify_traits; using stxxl::stream::make_tuple; using stxxl::tuple; const char * phrase = "Hasta la vista, baby"; template <class Container_, class It_> void fill_input_array(Container_ & container, It_ p) { while (*p) { container.push_back(*p); ++p; } } template <class ValTp> struct counter { typedef ValTp value_type; value_type cnt; counter() : cnt(0) { } value_type operator () () { value_type ret = cnt; ++cnt; return ret; } }; typedef counter<int> counter_type; struct cmp_type : std::binary_function<tuple_type, tuple_type, bool> { typedef tuple_type value_type; bool operator () (const value_type & a, const value_type & b) const { return a.first < b.first; } value_type min_value() const { return value_type((std::numeric_limits<char>::min)(), 0); } value_type max_value() const { return value_type((std::numeric_limits<char>::max)(), 0); } }; struct cmp_int : std::binary_function<int, int, bool> { typedef int value_type; bool operator () (const value_type & a, const value_type & b) const { return a > b; } value_type max_value() const { return (((std::numeric_limits<value_type>::min))()); } value_type min_value() const { return (((std::numeric_limits<value_type>::max))()); } }; template <typename T> struct identity : std::unary_function<T, T> { typedef T value_type; const T & operator () (const T & t) { return t; } }; int main() { input_array_type input; output_array_type output; stxxl::stats * s = stxxl::stats::get_instance(); std::cout << *s; fill_input_array(input, phrase); output.resize(input.size()); // HERE streaming part begins (streamifying) // create input stream #ifdef BOOST_MSVC typedef streamify_traits<input_array_type::iterator>::stream_type input_stream_type; #else typedef __typeof__(streamify(input.begin(), input.end())) input_stream_type; #endif input_stream_type input_stream = streamify(input.begin(), input.end()); // create counter stream #ifdef BOOST_MSVC typedef stxxl::stream::generator2stream<counter_type> counter_stream_type; #else typedef __typeof__(streamify(counter_type())) counter_stream_type; #endif counter_stream_type counter_stream = streamify(counter_type()); // create tuple stream typedef make_tuple<input_stream_type, counter_stream_type> tuple_stream_type; tuple_stream_type tuple_stream(input_stream, counter_stream); const stxxl::unsigned_type sorter_memory = 128 * 1024; #ifdef USE_FORMRUNS_N_MERGE // sort tuples by character // 1. form runs typedef stxxl::stream::runs_creator<tuple_stream_type, cmp_type, block_size> runs_creator_stream_type; runs_creator_stream_type runs_creator_stream(tuple_stream, cmp_type(), sorter_memory); // 2. merge runs typedef stxxl::stream::runs_merger<runs_creator_stream_type::sorted_runs_type, cmp_type> sorted_stream_type; sorted_stream_type sorted_stream(runs_creator_stream.result(), cmp_type(), sorter_memory); #else // sort tuples by character // (combination of the previous two steps in one algorithm: form runs and merge) typedef stxxl::stream::sort<tuple_stream_type, cmp_type, block_size> sorted_stream_type; sorted_stream_type sorted_stream(tuple_stream, cmp_type(), sorter_memory); #endif typedef stxxl::stream::transform<identity<stxxl::tuple<char, int> >, sorted_stream_type> transformed_stream_type; identity<stxxl::tuple<char, int> > id; transformed_stream_type transformed_stream(id, sorted_stream); // HERE streaming part ends (materializing) output_array_type::iterator o = stxxl::stream::materialize(transformed_stream, output.begin(), output.end()); // or materialize(sorted_stream,output.begin()); assert(o == output.end()); STXXL_MSG("input string (character,position) :"); for (unsigned i = 0; i < input.size(); ++i) { STXXL_MSG("('" << input[i] << "'," << i << ")"); } STXXL_MSG("sorted tuples (character,position):"); for (unsigned i = 0; i < input.size(); ++i) { STXXL_MSG("('" << output[i].first << "'," << output[i].second << ")"); } std::cout << *s; std::vector<int> InternalArray(1024 * 1024); std::sort(InternalArray.begin(), InternalArray.end(), cmp_int()); //convenience function based on streaming stxxl::sort<1024 * 1024>(InternalArray.begin(), InternalArray.end(), cmp_int(), 1024 * 1024 * 31, stxxl::RC()); return 0; }