blob: 36442f1570178315e9274d44a633de3d546eb5d8 [file] [log] [blame]
/*
Copyright 2005-2010 Intel Corporation. All Rights Reserved.
This file is part of Threading Building Blocks.
Threading Building Blocks is free software; you can redistribute it
and/or modify it under the terms of the GNU General Public License
version 2 as published by the Free Software Foundation.
Threading Building Blocks is distributed in the hope that it will be
useful, but WITHOUT ANY WARRANTY; without even the implied warranty
of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with Threading Building Blocks; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
As a special exception, you may use this file as part of a free software
library without restriction. Specifically, if other files instantiate
templates or use macros or inline functions from this file, or you compile
this file and link it with other files to produce an executable, this
file does not by itself cause the resulting executable to be covered by
the GNU General Public License. This exception does not however
invalidate any other reasons why the executable file might be covered by
the GNU General Public License.
*/
//#define DO_SCALABLEALLOC
#include <cstdlib>
#include <cmath>
#include <vector>
#include <algorithm>
#include <functional>
#include <numeric>
#include "tbb/tbb_stddef.h"
#include "tbb/spin_mutex.h"
#ifdef DO_SCALABLEALLOC
#include "tbb/scalable_allocator.h"
#endif
#include "tbb/concurrent_vector.h"
#include "tbb/tbb_allocator.h"
#include "tbb/cache_aligned_allocator.h"
#include "tbb/task_scheduler_init.h"
#include "tbb/parallel_for.h"
#include "tbb/tick_count.h"
#include "tbb/blocked_range.h"
#define HARNESS_CUSTOM_MAIN 1
#include "../test/harness.h"
//#include "harness_barrier.h"
#include "../test/harness_allocator.h"
#define STATISTICS_INLINE
#include "statistics.h"
using namespace tbb;
bool ExtraVerbose = false;
class Timer {
tbb::tick_count tick;
public:
Timer() { tick = tbb::tick_count::now(); }
double get_time() { return (tbb::tick_count::now() - tick).seconds(); }
double diff_time(const Timer &newer) { return (newer.tick - tick).seconds(); }
double mark_time() { tick_count t1(tbb::tick_count::now()), t2(tick); tick = t1; return (t1 - t2).seconds(); }
double mark_time(const Timer &newer) { tick_count t(tick); tick = newer.tick; return (tick - t).seconds(); }
};
/************************************************************************/
/* TEST1 */
/************************************************************************/
#define mk_vector_test1(v, a) vector_test1<v<Timer, static_counting_allocator<a<Timer> > >, v<double, static_counting_allocator<a<double> > > >
template<class timers_vector_t, class values_vector_t>
class vector_test1 {
const char *mode;
StatisticsCollector &stat;
StatisticsCollector::TestCase key[16];
public:
vector_test1(const char *m, StatisticsCollector &s) : mode(m), stat(s) {}
vector_test1 &operator()(size_t len) {
if(Verbose) printf("test1<%s>(%u): collecting timing statistics\n", mode, unsigned(len));
__TBB_ASSERT(sizeof(Timer) == sizeof(double), NULL);
static const char *test_names[] = {
"b)creation wholly",
"a)creation by push",
"c)operation time per item",
0 };
for(int i = 0; test_names[i]; ++i) key[i] = stat.SetTestCase(test_names[i], mode, len);
Timer timer0; timers_vector_t::allocator_type::init_counters();
timers_vector_t tv(len);
Timer timer1; values_vector_t::allocator_type::init_counters();
values_vector_t dv;
for (size_t i = 0; i < len; ++i)
dv.push_back( i );
Timer timer2;
for (size_t i = 0; i < len; ++i)
{
dv[len-i-1] = timer0.diff_time(tv[i]);
tv[i].mark_time();
}
stat.AddStatisticValue( key[2], "1total, ms", "%.3f", timer2.get_time()*1000.0 );
stat.AddStatisticValue( key[1], "1total, ms", "%.3f", timer1.diff_time(timer2)*1000.0 );
stat.AddStatisticValue( key[0], "1total, ms", "%.3f", timer0.diff_time(timer1)*1000.0 );
//allocator statistics
stat.AddStatisticValue( key[0], "2total allocations", "%d", int(timers_vector_t::allocator_type::allocations) );
stat.AddStatisticValue( key[1], "2total allocations", "%d", int(values_vector_t::allocator_type::allocations) );
stat.AddStatisticValue( key[2], "2total allocations", "%d", 0);
stat.AddStatisticValue( key[0], "3total alloc#items", "%d", int(timers_vector_t::allocator_type::items_allocated) );
stat.AddStatisticValue( key[1], "3total alloc#items", "%d", int(values_vector_t::allocator_type::items_allocated) );
stat.AddStatisticValue( key[2], "3total alloc#items", "%d", 0);
//remarks
stat.AddStatisticValue( key[0], "9note", "segment creation time, ns:");
stat.AddStatisticValue( key[2], "9note", "average op-time per item, ns:");
Timer last_timer(timer2); double last_value = 0;
for (size_t j = 0, i = 2; i < len; i *= 2, j++) {
stat.AddRoundResult( key[0], (dv[len-i-1]-last_value)*1000000.0 );
last_value = dv[len-i-1];
stat.AddRoundResult( key[2], last_timer.diff_time(tv[i])/double(i)*1000000.0 );
last_timer = tv[i];
stat.SetRoundTitle(j, i);
}
tv.clear(); dv.clear();
//__TBB_ASSERT(timers_vector_t::allocator_type::items_allocated == timers_vector_t::allocator_type::items_freed, NULL);
//__TBB_ASSERT(values_vector_t::allocator_type::items_allocated == values_vector_t::allocator_type::items_freed, NULL);
return *this;
}
};
/************************************************************************/
/* TEST2 */
/************************************************************************/
#define mk_vector_test2(v, a) vector_test2<v<size_t, a<size_t> > >
template<class vector_t>
class vector_test2 {
const char *mode;
static const int ntrial = 10;
StatisticsCollector &stat;
public:
vector_test2(const char *m, StatisticsCollector &s) : mode(m), stat(s) {}
vector_test2 &operator()(size_t len) {
if(Verbose) printf("test2<%s>(%u): performing standard transformation sequence on vector\n", mode, unsigned(len));
StatisticsCollector::TestCase init_key = stat.SetTestCase("allocate", mode, len);
StatisticsCollector::TestCase fill_key = stat.SetTestCase("fill", mode, len);
StatisticsCollector::TestCase proc_key = stat.SetTestCase("process", mode, len);
StatisticsCollector::TestCase full_key = stat.SetTestCase("total time", mode, len);
for (int i = 0; i < ntrial; i++) {
Timer timer0;
vector_t v1(len);
vector_t v2(len);
Timer timer1;
std::generate(v1.begin(), v1.end(), values(0));
std::generate(v2.begin(), v2.end(), values(size_t(-len)));
Timer timer2;
std::reverse(v1.rbegin(), v1.rend());
std::inner_product(v1.begin(), v1.end(), v2.rbegin(), 1);
std::sort(v1.rbegin(), v1.rend());
std::sort(v2.rbegin(), v2.rend());
std::set_intersection(v1.begin(), v1.end(), v2.rbegin(), v2.rend(), v1.begin());
Timer timer3;
stat.AddRoundResult( proc_key, timer2.diff_time(timer3)*1000.0 );
stat.AddRoundResult( fill_key, timer1.diff_time(timer2)*1000.0 );
stat.AddRoundResult( init_key, timer0.diff_time(timer1)*1000.0 );
stat.AddRoundResult( full_key, timer0.diff_time(timer3)*1000.0 );
}
stat.SetStatisticFormula("1Average", "=AVERAGE(ROUNDS)");
stat.SetStatisticFormula("2+/-", "=(MAX(ROUNDS)-MIN(ROUNDS))/2");
return *this;
}
class values
{
size_t value;
public:
values(size_t i) : value(i) {}
size_t operator()() {
return value++%(1|(value^55));
}
};
};
/************************************************************************/
/* TEST3 */
/************************************************************************/
#define mk_vector_test3(v, a) vector_test3<v<char, local_counting_allocator<a<char>, size_t > > >
template<class vector_t>
class vector_test3 {
const char *mode;
StatisticsCollector &stat;
public:
vector_test3(const char *m, StatisticsCollector &s) : mode(m), stat(s) {}
vector_test3 &operator()(size_t len) {
if(Verbose) printf("test3<%s>(%u): collecting allocator statistics\n", mode, unsigned(len));
static const size_t sz = 1024;
vector_t V[sz];
StatisticsCollector::TestCase vinst_key = stat.SetTestCase("instances number", mode, len);
StatisticsCollector::TestCase count_key = stat.SetTestCase("allocations count", mode, len);
StatisticsCollector::TestCase items_key = stat.SetTestCase("allocated items", mode, len);
//stat.ReserveRounds(sz-1);
for (size_t c = 0, i = 0, s = sz/2; s >= 1 && i < sz; s /= 2, c++)
{
const size_t count = c? 1<<(c-1) : 0;
for (size_t e = i+s; i < e; i++) {
//if(count >= 16) V[i].reserve(count);
for (size_t j = 0; j < count; j++)
V[i].push_back(j);
}
stat.SetRoundTitle ( c, count );
stat.AddRoundResult( vinst_key, s );
stat.AddRoundResult( count_key, V[i-1].get_allocator().allocations );
stat.AddRoundResult( items_key, V[i-1].get_allocator().items_allocated );
}
return *this;
}
};
/************************************************************************/
/* TYPES SET FOR TESTS */
/************************************************************************/
#define types_set(n, title, op) { StatisticsCollector Collector("time_vector"#n); Collector.SetTitle title; \
{mk_vector_test##n(tbb::concurrent_vector, tbb::cache_aligned_allocator) ("TBB:NFS", Collector)op;} \
{mk_vector_test##n(tbb::concurrent_vector, tbb::tbb_allocator) ("TBB:TBB", Collector)op;} \
{mk_vector_test##n(tbb::concurrent_vector, std::allocator) ("TBB:STD", Collector)op;} \
{mk_vector_test##n(std::vector, tbb::cache_aligned_allocator) ("STL:NFS", Collector)op;} \
{mk_vector_test##n(std::vector, tbb::tbb_allocator) ("STL:TBB", Collector)op;} \
{mk_vector_test##n(std::vector, std::allocator) ("STL:STD", Collector)op;} \
Collector.Print(StatisticsCollector::Stdout|StatisticsCollector::HTMLFile|StatisticsCollector::ExcelXML); }
/************************************************************************/
/* MAIN DRIVER */
/************************************************************************/
int main(int argc, char* argv[]) {
if(argc>1) Verbose = true;
if(argc>2) ExtraVerbose = true;
MinThread = 0; MaxThread = 500000; // use in another meaning - test#:problem size
ParseCommandLine( argc, argv );
ASSERT(tbb_allocator<int>::allocator_type() == tbb_allocator<int>::scalable, "expecting scalable allocator library to be loaded");
if(!MinThread || MinThread == 1)
types_set(1, ("Vectors performance test #1 for %d", MaxThread), (MaxThread) )
if(!MinThread || MinThread == 2)
types_set(2, ("Vectors performance test #2 for %d", MaxThread), (MaxThread) )
if(!MinThread || MinThread == 3)
types_set(3, ("Vectors performance test #3 for %d", MaxThread), (MaxThread) )
if(!Verbose) printf("done\n");
return 0;
}