turbonss/cxxmph/mph_index.cc

236 lines
7.4 KiB
C++
Raw Normal View History

#include <limits>
2010-10-28 03:17:09 +03:00
#include <iostream>
2011-05-16 02:47:42 +03:00
#include <vector>
2010-10-28 03:17:09 +03:00
using std::cerr;
using std::endl;
2010-06-28 22:01:18 +03:00
#include "mph_index.h"
2010-10-05 17:51:17 +03:00
using std::vector;
2010-10-28 03:17:09 +03:00
namespace {
2011-02-14 00:40:26 +02:00
static const uint8_t kUnassigned = 3;
2010-10-28 03:17:09 +03:00
// table used for looking up the number of assigned vertices to a 8-bit integer
static uint8_t kBdzLookupIndex[] =
2010-10-28 03:17:09 +03:00
{
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
4, 4, 4, 3, 4, 4, 4, 3, 4, 4, 4, 3, 3, 3, 3, 2,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
3, 3, 3, 2, 3, 3, 3, 2, 3, 3, 3, 2, 2, 2, 2, 1,
2, 2, 2, 1, 2, 2, 2, 1, 2, 2, 2, 1, 1, 1, 1, 0
};
2010-10-05 17:51:17 +03:00
2010-10-28 03:17:09 +03:00
} // anonymous namespace
namespace cxxmph {
const uint8_t MPHIndex::valuemask[] = { 0xfc, 0xf3, 0xcf, 0x3f};
2010-11-05 08:40:15 +02:00
MPHIndex::~MPHIndex() {
2011-05-16 05:04:30 +03:00
clear();
}
void MPHIndex::clear() {
2011-05-16 17:26:18 +03:00
if (!deserialized_) delete [] g_;
2011-05-16 05:04:30 +03:00
g_ = NULL;
g_size_ = 0;
2011-05-16 17:26:18 +03:00
if (!deserialized_) delete [] ranktable_;
2011-05-16 05:04:30 +03:00
ranktable_ = NULL;
ranktable_size_ = 0;
// TODO(davi) implement me
2010-10-29 09:26:37 +03:00
}
2011-05-16 05:04:30 +03:00
bool MPHIndex::GenerateQueue(
2011-02-14 00:40:26 +02:00
TriGraph* graph, vector<uint32_t>* queue_output) {
uint32_t queue_head = 0, queue_tail = 0;
uint32_t nedges = m_;
uint32_t nvertices = n_;
2010-10-05 17:51:17 +03:00
// Relies on vector<bool> using 1 bit per element
2010-10-28 05:45:43 +03:00
vector<bool> marked_edge(nedges + 1, false);
2011-02-14 00:40:26 +02:00
vector<uint32_t> queue(nvertices, 0);
for (uint32_t i = 0; i < nedges; ++i) {
const TriGraph::Edge& e = graph->edges()[i];
if (graph->vertex_degree()[e[0]] == 1 ||
graph->vertex_degree()[e[1]] == 1 ||
graph->vertex_degree()[e[2]] == 1) {
2010-10-05 17:51:17 +03:00
if (!marked_edge[i]) {
queue[queue_head++] = i;
2010-10-05 17:51:17 +03:00
marked_edge[i] = true;
}
}
}
2011-05-16 05:04:30 +03:00
/*
2010-10-28 05:45:43 +03:00
for (unsigned int i = 0; i < marked_edge.size(); ++i) {
2011-02-14 00:40:26 +02:00
cerr << "vertex with degree " << static_cast<uint32_t>(graph->vertex_degree()[i]) << " marked " << marked_edge[i] << endl;
2010-10-28 05:45:43 +03:00
}
for (unsigned int i = 0; i < queue.size(); ++i) {
cerr << "vertex " << i << " queued at " << queue[i] << endl;
}
2011-05-16 05:04:30 +03:00
*/
2010-10-28 05:45:43 +03:00
// At this point queue head is the number of edges touching at least one
// vertex of degree 1.
2010-11-09 07:51:33 +02:00
// cerr << "Queue head " << queue_head << " Queue tail " << queue_tail << endl;
// graph->DebugGraph();
2010-10-05 17:51:17 +03:00
while (queue_tail != queue_head) {
2011-02-14 00:40:26 +02:00
uint32_t current_edge = queue[queue_tail++];
2010-10-05 17:51:17 +03:00
graph->RemoveEdge(current_edge);
const TriGraph::Edge& e = graph->edges()[current_edge];
2010-10-05 17:51:17 +03:00
for (int i = 0; i < 3; ++i) {
2011-02-14 00:40:26 +02:00
uint32_t v = e[i];
if (graph->vertex_degree()[v] == 1) {
2011-02-14 00:40:26 +02:00
uint32_t first_edge = graph->first_edge()[v];
if (!marked_edge[first_edge]) {
2010-10-05 17:51:17 +03:00
queue[queue_head++] = first_edge;
marked_edge[first_edge] = true;
}
}
}
}
2011-05-16 05:04:30 +03:00
/*
2010-10-28 05:45:43 +03:00
for (unsigned int i = 0; i < queue.size(); ++i) {
cerr << "vertex " << i << " queued at " << queue[i] << endl;
}
2011-05-16 05:04:30 +03:00
*/
int cycles = queue_head - nedges;
if (cycles == 0) queue.swap(*queue_output);
return cycles == 0;
2010-06-28 22:01:18 +03:00
}
void MPHIndex::Assigning(
2011-02-14 00:40:26 +02:00
const vector<TriGraph::Edge>& edges, const vector<uint32_t>& queue) {
uint32_t current_edge = 0;
2010-11-09 06:29:39 +02:00
vector<bool> marked_vertices(n_ + 1);
2010-10-28 03:17:09 +03:00
// Initialize vector of half nibbles with all bits set.
2011-05-16 05:04:30 +03:00
g_size_ = static_cast<uint32_t>(ceil(n_/4.0));
2011-05-16 17:26:18 +03:00
if (!deserialized_) delete [] g_;
2011-05-16 05:24:12 +03:00
g_ = NULL;
uint8_t* g = new uint8_t[g_size_];
memset(g, std::numeric_limits<uint8_t>::max(), g_size_);
assert(g[g_size_ - 1] == 255);
2010-10-28 05:45:43 +03:00
2011-02-14 00:40:26 +02:00
uint32_t nedges = m_; // for legibility
for (int i = nedges - 1; i + 1 >= 1; --i) {
current_edge = queue[i];
const TriGraph::Edge& e = edges[current_edge];
2011-05-16 05:04:30 +03:00
/*
2011-05-16 04:02:34 +03:00
cerr << "B: " << e[0] << " " << e[1] << " " << e[2] << " -> "
<< get_2bit_value(g_, e[0]) << " "
<< get_2bit_value(g_, e[1]) << " "
<< get_2bit_value(g_, e[2]) << " edge " << current_edge << endl;
2011-05-16 05:04:30 +03:00
*/
if (!marked_vertices[e[0]]) {
if (!marked_vertices[e[1]]) {
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[1], kUnassigned);
marked_vertices[e[1]] = true;
}
if (!marked_vertices[e[2]]) {
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[2], kUnassigned);
2010-11-09 06:29:39 +02:00
assert(marked_vertices.size() > e[2]);
marked_vertices[e[2]] = true;
}
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[0], (6 - (get_2bit_value(g, e[1]) + get_2bit_value(g, e[2]))) % 3);
marked_vertices[e[0]] = true;
2010-10-28 03:17:09 +03:00
} else if (!marked_vertices[e[1]]) {
if (!marked_vertices[e[2]]) {
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[2], kUnassigned);
marked_vertices[e[2]] = true;
}
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[1], (7 - (get_2bit_value(g, e[0]) + get_2bit_value(g, e[2]))) % 3);
marked_vertices[e[1]] = true;
} else {
2011-05-16 05:24:12 +03:00
set_2bit_value(g, e[2], (8 - (get_2bit_value(g, e[0]) + get_2bit_value(g, e[1]))) % 3);
marked_vertices[e[2]] = true;
2010-10-05 17:51:17 +03:00
}
2011-05-16 05:04:30 +03:00
/*
2011-05-16 04:02:34 +03:00
cerr << "A: " << e[0] << " " << e[1] << " " << e[2] << " -> "
2011-05-16 05:24:12 +03:00
<< get_2bit_value(g, e[0]) << " "
<< get_2bit_value(g, e[1]) << " "
<< get_2bit_value(g, e[2]) << " " << endl;
2011-05-16 05:04:30 +03:00
*/
2010-10-05 17:51:17 +03:00
}
2011-05-16 05:24:12 +03:00
g_ = g;
2010-10-05 17:51:17 +03:00
}
void MPHIndex::Ranking() {
2011-02-14 00:40:26 +02:00
uint32_t nbytes_total = static_cast<uint32_t>(ceil(n_ / 4.0));
uint32_t size = k_ >> 2U;
2011-05-16 05:04:30 +03:00
ranktable_size_ = static_cast<uint32_t>(
2010-10-28 03:17:09 +03:00
ceil(n_ / static_cast<double>(k_)));
2011-05-16 17:26:18 +03:00
if (!deserialized_) delete [] ranktable_;
2011-05-16 05:24:12 +03:00
ranktable_ = NULL;
uint32_t* ranktable = new uint32_t[ranktable_size_];
memset(ranktable, 0, ranktable_size_*sizeof(uint32_t));
2011-02-14 00:40:26 +02:00
uint32_t offset = 0;
uint32_t count = 0;
uint32_t i = 1;
while (1) {
2011-05-16 05:04:30 +03:00
if (i == ranktable_size_) break;
2011-02-14 00:40:26 +02:00
uint32_t nbytes = size < nbytes_total ? size : nbytes_total;
for (uint32_t j = 0; j < nbytes; ++j) count += kBdzLookupIndex[g_[offset + j]];
2011-05-16 05:24:12 +03:00
ranktable[i] = count;
offset += nbytes;
nbytes_total -= size;
++i;
}
2011-05-16 05:24:12 +03:00
ranktable_ = ranktable;
2010-10-05 17:51:17 +03:00
}
uint32_t MPHIndex::Rank(uint32_t vertex) const {
2011-02-14 00:40:26 +02:00
uint32_t index = vertex >> b_;
uint32_t base_rank = ranktable_[index];
uint32_t beg_idx_v = index << b_;
uint32_t beg_idx_b = beg_idx_v >> 2;
uint32_t end_idx_b = vertex >> 2;
while (beg_idx_b < end_idx_b) base_rank += kBdzLookupIndex[g_[beg_idx_b++]];
beg_idx_v = beg_idx_b << 2;
2011-05-16 05:04:30 +03:00
// cerr << "beg_idx_v: " << beg_idx_v << endl;
// cerr << "base rank: " << base_rank << endl;
/*
2011-05-16 04:02:34 +03:00
cerr << "G: ";
for (unsigned int i = 0; i < n_; ++i) {
cerr << get_2bit_value(g_, i) << " ";
}
cerr << endl;
2011-05-16 05:04:30 +03:00
*/
while (beg_idx_v < vertex) {
2010-10-28 05:45:43 +03:00
if (get_2bit_value(g_, beg_idx_v) != kUnassigned) ++base_rank;
++beg_idx_v;
}
2010-11-09 07:51:33 +02:00
// cerr << "Base rank: " << base_rank << endl;
return base_rank;
2010-10-05 17:51:17 +03:00
}
2010-06-28 22:01:18 +03:00
uint32_t MPHIndex::serialize_bytes_needed() const {
return sizeof(MPHIndex) + g_size_ + ranktable_size_*sizeof(uint32_t);
2011-05-16 05:24:12 +03:00
}
void MPHIndex::serialize(char* memory) const {
memcpy(memory, this, sizeof(MPHIndex));
memcpy(memory + sizeof(MPHIndex), g_, g_size_);
memcpy(memory + sizeof(MPHIndex) + g_size_,
2011-05-16 05:24:12 +03:00
ranktable_, ranktable_size_*sizeof(uint32_t));
}
bool MPHIndex::deserialize(const char* serialized_memory) {
memcpy(this, serialized_memory, sizeof(MPHIndex));
g_ = reinterpret_cast<const uint8_t*>(serialized_memory + sizeof(MPHIndex));
2011-05-16 05:24:12 +03:00
ranktable_ = reinterpret_cast<const uint32_t*>(
serialized_memory + sizeof(MPHIndex) + g_size_);
2011-05-16 17:26:18 +03:00
deserialized_ = true;
2011-05-16 05:24:12 +03:00
return true;
}
} // namespace cxxmph