+#include "db.h"
#include "vp4.h"
#include <algorithm>
#include <vector>
#include <zstd.h>
-#include "db.h"
-
#define P4NENC_BOUND(n) ((n + 127) / 128 + (n + 32) * sizeof(uint32_t))
#define dprintf(...)
//#define dprintf(...) fprintf(stderr, __VA_ARGS__);
}
for (uint32_t trgm : all_trigrams) {
// We don't know offset yet, so set it to zero.
- Trigram to_insert{trgm, uint32_t(corpus.invindex.find(trgm)->second.num_docids), 0};
+ Trigram to_insert{ trgm, uint32_t(corpus.invindex.find(trgm)->second.num_docids), 0 };
uint32_t bucket = hash_trigram(trgm, ht_size);
unsigned distance = 0;
unique_ptr<Trigram[]> hashtable;
uint32_t ht_size = next_prime(all_trigrams.size());
constexpr unsigned num_overflow_slots = 16;
- for ( ;; ) {
+ for (;;) {
hashtable = create_hashtable(corpus, all_trigrams, ht_size, num_overflow_slots);
if (hashtable == nullptr) {
dprintf("Failed creating hash table of size %u, increasing by 5%% and trying again.\n", ht_size);
#include "db.h"
-#include "vp4.h"
#include "io_uring_engine.h"
+#include "vp4.h"
#include <algorithm>
#include <arpa/inet.h>
void find_trigram(uint32_t trgm, function<void(const Trigram *trgmptr, size_t len)> cb);
void get_compressed_filename_block(uint32_t docid, function<void(string)> cb) const;
size_t get_num_filename_blocks() const;
// Returns the byte offset of the entry for `docid` in a table of
// uint64_t-sized entries that begins at hdr.filename_index_offset_bytes.
// NOTE(review): presumably this is a position in the on-disk database file,
// and each entry is the offset of a filename block -- confirm against callers.
- off_t offset_for_block(uint32_t docid) const {
+ off_t offset_for_block(uint32_t docid) const
+ {
// sizeof() yields size_t, so the multiplication is carried out in size_t
// rather than in 32-bit uint32_t arithmetic.
return hdr.filename_index_offset_bytes + docid * sizeof(uint64_t);
}
block.resize(uncompressed_len + 1);
size_t err = ZSTD_decompress(&block[0], block.size(), compressed.data(),
- compressed.size());
+ compressed.size());
if (ZSTD_isError(err)) {
fprintf(stderr, "ZSTD_decompress(): %s\n", ZSTD_getErrorName(err));
exit(1);
for (uint32_t docid = io_docid; docid < last_docid; ++docid) {
size_t relative_offset = offsets[docid] - offsets[io_docid];
size_t len = offsets[docid + 1] - offsets[docid];
- scan_file_block(needle, {&compressed[relative_offset], len}, &access_rx_cache);
+ scan_file_block(needle, { &compressed[relative_offset], len }, &access_rx_cache);
}
}
}
break;
}
engine.submit_read(fd, len, trgmptr.offset, [trgmptr, len, &done, &in1, &in2, &out](string s) {
- if (done) return;
+ if (done)
+ return;
uint32_t trgm __attribute__((unused)) = trgmptr.trgm;
size_t num = trgmptr.num_docids;
unsigned char *pldata = reinterpret_cast<unsigned char *>(s.data());