2022-02-23 15:25:55 +02:00
|
|
|
const std = @import("std");
|
|
|
|
|
2022-03-02 11:05:20 +02:00
|
|
|
// Foreign function: declared `extern`, so the implementation is not in this
// file and must be supplied at link time.
// NOTE(review): presumably the BDZ packed-search routine of the cmph C
// library -- confirm against the build configuration.
//
// packed_mphf: pointer to the packed hash-function bytes (callers in this
//              file pass a pointer 4 bytes past the start of their buffer).
// key:         pointer to the key bytes.
// len:         number of key bytes.
// Returns a u32, which the callers in this file hand back unchanged.
extern fn bdz_search_packed(packed_mphf: [*]const u8, key: [*]const u8, len: c_uint) u32;
|
2022-02-23 15:25:55 +02:00
|
|
|
|
2022-03-02 11:05:20 +02:00
|
|
|
// Looks up `key` in the packed hash function `packed_mphf` and returns
// whatever bdz_search_packed reports for it.
//
// The first 4 bytes of `packed_mphf` are skipped; only the remainder is
// handed to bdz_search_packed.
// NOTE(review): presumably those 4 bytes are a header that is not part of
// the BDZ payload -- confirm against the packing code.
//
// `key.len` must fit in a c_uint and `packed_mphf` must hold at least 4
// bytes; otherwise this is a checked failure in safe build modes.
pub fn search(packed_mphf: []const u8, key: []const u8) u32 {
    // Checked narrowing of the key length to the C-side integer type.
    const key_len = std.math.cast(c_uint, key.len).?;
    const payload = packed_mphf[4..];
    const hash: u32 = bdz_search_packed(payload.ptr, key.ptr, key_len);
    return hash;
}
|
|
|
|
|
2022-03-06 18:18:35 +02:00
|
|
|
// Number of bytes in the unzero() encoding of a u32. Used as the buffer size
// inside unzero() and as the key length passed by search_u32().
const u32len = 5;
|
|
|
|
|
2022-03-02 11:05:20 +02:00
|
|
|
// Looks up a u32 `key` in the packed hash function `packed_mphf`.
//
// The key is first converted with unzero() into a `u32len`-byte buffer, and
// that buffer is what gets passed to bdz_search_packed. As in search(), the
// first 4 bytes of `packed_mphf` are skipped, so it must hold at least 4
// bytes.
pub fn search_u32(packed_mphf: []const u8, key: u32) u32 {
    const encoded_key = unzero(key);
    const payload = packed_mphf[4..];
    return bdz_search_packed(payload.ptr, &encoded_key, u32len);
}
|
|
|
|
|
|
|
|
// Encodes a u32 as 5 bytes such that no byte is '\0'.
//
// The 32 input bits are split, most significant first, into groups of
// 7, 7, 6, 6 and 6 bits. Each group becomes the low bits of one output byte,
// and the top bit of every output byte is always set, so each byte is at
// least 0x80.
//
// TODO(motiejus) figure out how to use cmph_io_byte_vector_adapter, so cmph
// packing would accept zero bytes. For now we will be doing a dance of not
// passing zero bytes.
pub fn unzero(x: u32) [5]u8 {
    // Always-set top bit; this is what guarantees a non-zero byte.
    const marker: u8 = 0x80;
    return [u32len]u8{
        @truncate(u8, x >> 25) | marker, // bits 31..25
        @truncate(u8, (x >> 18) & 0x7f) | marker, // bits 24..18
        @truncate(u8, (x >> 12) & 0x3f) | marker, // bits 17..12
        @truncate(u8, (x >> 6) & 0x3f) | marker, // bits 11..6
        @truncate(u8, x & 0x3f) | marker, // bits 5..0
    };
}
|