2011-06-13 09:14:15 +03:00
|
|
|
#include <set>
|
|
|
|
#include <string>
|
2011-11-10 20:44:37 +02:00
|
|
|
#include <unordered_map>
|
2011-06-13 09:14:15 +03:00
|
|
|
|
|
|
|
#include "bm_common.h"
|
2011-06-14 08:24:40 +03:00
|
|
|
#include "stringpiece.h"
|
2011-06-13 09:14:15 +03:00
|
|
|
#include "mph_index.h"
|
|
|
|
|
|
|
|
using namespace cxxmph;
|
|
|
|
|
|
|
|
using std::string;
|
2011-11-10 20:44:37 +02:00
|
|
|
using std::unordered_map;
|
2011-06-13 09:14:15 +03:00
|
|
|
|
|
|
|
class BM_MPHIndexCreate : public UrlsBenchmark {
|
|
|
|
public:
|
|
|
|
BM_MPHIndexCreate(const std::string& urls_file)
|
|
|
|
: UrlsBenchmark(urls_file) { }
|
|
|
|
protected:
|
|
|
|
virtual void Run() {
|
|
|
|
SimpleMPHIndex<StringPiece> index;
|
|
|
|
index.Reset(urls_.begin(), urls_.end());
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class BM_STLIndexCreate : public UrlsBenchmark {
|
|
|
|
public:
|
|
|
|
BM_STLIndexCreate(const std::string& urls_file)
|
|
|
|
: UrlsBenchmark(urls_file) { }
|
|
|
|
protected:
|
|
|
|
virtual void Run() {
|
2011-06-14 08:24:40 +03:00
|
|
|
unordered_map<StringPiece, uint32_t> index;
|
|
|
|
int idx = 0;
|
|
|
|
for (auto it = urls_.begin(); it != urls_.end(); ++it) {
|
|
|
|
index.insert(make_pair(*it, idx++));
|
|
|
|
}
|
2011-06-13 09:14:15 +03:00
|
|
|
}
|
|
|
|
};
|
2011-11-10 20:44:37 +02:00
|
|
|
|
2011-06-13 09:14:15 +03:00
|
|
|
class BM_MPHIndexSearch : public SearchUrlsBenchmark {
|
|
|
|
public:
|
|
|
|
BM_MPHIndexSearch(const std::string& urls_file, int nsearches)
|
|
|
|
: SearchUrlsBenchmark(urls_file, nsearches) { }
|
|
|
|
virtual void Run() {
|
|
|
|
for (auto it = random_.begin(); it != random_.end(); ++it) {
|
2011-06-14 08:24:40 +03:00
|
|
|
auto idx = index_.index(*it);
|
|
|
|
// Collision check to be fair with STL
|
|
|
|
if (strcmp(urls_[idx].c_str(), it->data()) != 0) idx = -1;
|
2011-06-13 09:14:15 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
protected:
|
|
|
|
virtual bool SetUp () {
|
|
|
|
if (!SearchUrlsBenchmark::SetUp()) return false;
|
|
|
|
index_.Reset(urls_.begin(), urls_.end());
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
SimpleMPHIndex<StringPiece> index_;
|
|
|
|
};
|
|
|
|
|
|
|
|
class BM_STLIndexSearch : public SearchUrlsBenchmark {
|
|
|
|
public:
|
|
|
|
BM_STLIndexSearch(const std::string& urls_file, int nsearches)
|
|
|
|
: SearchUrlsBenchmark(urls_file, nsearches) { }
|
|
|
|
virtual void Run() {
|
|
|
|
for (auto it = random_.begin(); it != random_.end(); ++it) {
|
2011-06-14 08:24:40 +03:00
|
|
|
auto idx = index_.find(*it);
|
2011-06-13 09:14:15 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
protected:
|
|
|
|
virtual bool SetUp () {
|
|
|
|
if (!SearchUrlsBenchmark::SetUp()) return false;
|
2011-06-14 08:24:40 +03:00
|
|
|
unordered_map<StringPiece, uint32_t> index;
|
|
|
|
int idx = 0;
|
|
|
|
for (auto it = urls_.begin(); it != urls_.end(); ++it) {
|
|
|
|
index.insert(make_pair(*it, idx++));
|
|
|
|
}
|
|
|
|
index.swap(index_);
|
2011-06-13 09:14:15 +03:00
|
|
|
return true;
|
|
|
|
}
|
2011-11-10 20:44:37 +02:00
|
|
|
std::unordered_map<StringPiece, uint32_t> index_;
|
2011-06-13 09:14:15 +03:00
|
|
|
};
|
|
|
|
|
|
|
|
int main(int argc, char** argv) {
|
|
|
|
Benchmark::Register(new BM_MPHIndexCreate("URLS100k"));
|
|
|
|
Benchmark::Register(new BM_STLIndexCreate("URLS100k"));
|
2011-06-14 08:24:40 +03:00
|
|
|
Benchmark::Register(new BM_MPHIndexSearch("URLS100k", 100*1000*1000));
|
|
|
|
Benchmark::Register(new BM_STLIndexSearch("URLS100k", 100*1000*1000));
|
2011-06-13 09:14:15 +03:00
|
|
|
Benchmark::RunAll();
|
|
|
|
return 0;
|
|
|
|
}
|