lmdb-safe/lmdb-typed.hh

563 lines
15 KiB
C++
Raw Normal View History

#pragma once
#include <iostream>
#include "lmdb-safe.hh"
#include <boost/archive/binary_oarchive.hpp>
#include <boost/archive/binary_iarchive.hpp>
#include <boost/serialization/vector.hpp>
#include <boost/serialization/string.hpp>
#include <boost/serialization/utility.hpp>
#include <boost/iostreams/stream.hpp>
#include <boost/iostreams/stream_buffer.hpp>
#include <boost/iostreams/device/back_inserter.hpp>
#include <sstream>
using std::cout;
using std::endl;
/*
Open issues:
Everything should go into a namespace
What is an error? What is an exception?
2018-12-16 15:58:38 +01:00
could id=0 be magic? ('no such id')
Is boost the best serializer?
Perhaps use the separate index concept from multi_index
A dump function would be nice (typed)
2018-12-16 21:46:53 +01:00
including indexes
perhaps get eiter to be of same type so for(auto& a : x) works
*/
2018-12-16 20:28:49 +01:00
/** Return the highest ID used in a database. Returns 0 for an empty DB.
This makes us start everything at ID=1, which might make it possible to
treat id 0 as special
*/
unsigned int getMaxID(MDBRWTransaction& txn, MDBDbi& dbi);
2018-12-16 20:28:49 +01:00
/** This is our serialization interface.
We could/should templatize this so you could pick something else
*/
template<typename T>
std::string serToString(const T& t)
{
std::string serial_str;
boost::iostreams::back_insert_device<std::string> inserter(serial_str);
boost::iostreams::stream<boost::iostreams::back_insert_device<std::string> > s(inserter);
boost::archive::binary_oarchive oa(s, boost::archive::no_header | boost::archive::no_codecvt);
oa << t;
return serial_str;
}
template<typename T>
void serFromString(const std::string& str, T& ret)
{
ret = T();
std::istringstream istr{str};
boost::archive::binary_iarchive oi(istr,boost::archive::no_header|boost::archive::no_codecvt );
oi >> ret;
}
2018-12-16 20:28:49 +01:00
/** This is a struct that implements index operations, but
only the operations that are broadcast to all indexes.
Specifically, to deal with databases with less than the maximum
number of interfaces, this only includes calls that should be
ignored for empty indexes.
2018-12-16 20:28:49 +01:00
this only needs methods that must happen for all indexes at once
so specifically, not size<t> or get<t>, people ask for those themselves, and
should no do that on indexes that don't exist */
2018-12-16 15:58:38 +01:00
template<class Class,typename Type, typename Parent>
struct LMDBIndexOps
{
explicit LMDBIndexOps(Parent* parent) : d_parent(parent){}
void put(MDBRWTransaction& txn, const Class& t, uint32_t id)
{
2018-12-16 15:58:38 +01:00
txn.put(d_idx, d_parent->getMember(t), id);
}
void del(MDBRWTransaction& txn, const Class& t, uint32_t id)
{
2018-12-16 15:58:38 +01:00
txn.del(d_idx, d_parent->getMember(t), id);
}
void openDB(std::shared_ptr<MDBEnv>& env, string_view str, int flags)
{
d_idx = env->openDB(str, flags);
}
2018-12-16 15:58:38 +01:00
MDBDbi d_idx;
Parent* d_parent;
};
2018-12-16 20:28:49 +01:00
/** This is an index on a field in a struct, it derives from the LMDBIndexOps */
2018-12-16 15:58:38 +01:00
template<class Class,typename Type,Type Class::*PtrToMember>
struct index_on : LMDBIndexOps<Class, Type, index_on<Class, Type, PtrToMember>>
{
index_on() : LMDBIndexOps<Class, Type, index_on<Class, Type, PtrToMember>>(this)
{}
static Type getMember(const Class& c)
{
return c.*PtrToMember;
}
typedef Type type;
2018-12-16 15:58:38 +01:00
};
2018-12-16 20:28:49 +01:00
/** This is a calculated index */
2018-12-16 15:58:38 +01:00
template<class Class, typename Type, class Func>
struct index_on_function : LMDBIndexOps<Class, Type, index_on_function<Class, Type, Func> >
{
index_on_function() : LMDBIndexOps<Class, Type, index_on_function<Class, Type, Func> >(this)
{}
static Type getMember(const Class& c)
{
Func f;
return f(c);
}
typedef Type type;
};
2018-12-16 20:28:49 +01:00
/** nop index, so we can fill our N indexes, even if you don't use them all */
struct nullindex_t
{
template<typename Class>
void put(MDBRWTransaction& txn, const Class& t, uint32_t id)
{}
template<typename Class>
void del(MDBRWTransaction& txn, const Class& t, uint32_t id)
{}
2018-12-14 23:46:46 +01:00
void openDB(std::shared_ptr<MDBEnv>& env, string_view str, int flags)
{
}
typedef uint32_t type; // dummy
};
2018-12-16 20:28:49 +01:00
/** The main class. Templatized only on the indexes and typename right now */
template<typename T, class I1=nullindex_t, class I2=nullindex_t, class I3 = nullindex_t, class I4 = nullindex_t>
class TypedDBI
{
public:
TypedDBI(std::shared_ptr<MDBEnv> env, string_view name)
: d_env(env), d_name(name)
{
d_main = d_env->openDB(name, MDB_CREATE | MDB_INTEGERKEY);
2018-12-16 20:28:49 +01:00
// now you might be tempted to go all MPL on this so we can get rid of the
// ugly macro. I'm not very receptive to that idea since it will make things
// EVEN uglier.
#define openMacro(N) std::get<N>(d_tuple).openDB(d_env, std::string(name)+"_"#N, MDB_CREATE | MDB_DUPFIXED | MDB_DUPSORT);
openMacro(0);
openMacro(1);
openMacro(2);
openMacro(3);
#undef openMacro
}
2018-12-16 20:28:49 +01:00
// we get a lot of our smarts from this tuple, it enables get<0> etc
typedef std::tuple<I1, I2, I3, I4> tuple_t;
tuple_t d_tuple;
2018-12-16 20:28:49 +01:00
// We support readonly and rw transactions. Here we put the Readonly operations
// which get sourced by both kinds of transactions
template<class Parent>
struct ReadonlyOperations
{
ReadonlyOperations(Parent& parent) : d_parent(parent)
{}
2018-12-16 20:28:49 +01:00
//! Number of entries in main database
2018-12-14 23:46:46 +01:00
uint32_t size()
{
MDB_stat stat;
mdb_stat(d_parent.d_txn, d_parent.d_parent->d_main, &stat);
2018-12-14 23:46:46 +01:00
return stat.ms_entries;
}
2018-12-16 20:28:49 +01:00
//! Number of entries in the various indexes - should be the same
template<int N>
uint32_t size()
{
2018-12-15 21:06:47 +01:00
MDB_stat stat;
mdb_stat(d_parent.d_txn, std::get<N>(d_parent.d_parent->d_tuple).d_idx, &stat);
return stat.ms_entries;
}
2018-12-16 20:28:49 +01:00
//! Get item with id, from main table directly
bool get(uint32_t id, T& t)
{
MDBOutVal data;
if(d_parent.d_txn.get(d_parent.d_parent->d_main, id, data))
return false;
serFromString(data.get<std::string>(), t);
return true;
}
2018-12-14 23:46:46 +01:00
2018-12-16 20:28:49 +01:00
//! Get item through index N, then via the main database
template<int N>
uint32_t get(const typename std::tuple_element<N, tuple_t>::type::type& key, T& out)
{
MDBOutVal id;
if(!d_parent.d_txn.get(std::get<N>(d_parent.d_parent->d_tuple).d_idx, key, id))
return get(id.get<uint32_t>(), out);
return 0;
}
2018-12-16 20:28:49 +01:00
//! Cardinality of index N
template<int N>
uint32_t cardinality()
{
auto cursor = d_parent.d_txn.getCursor(std::get<N>(d_parent.d_parent->d_tuple).d_idx);
bool first = true;
MDBOutVal key, data;
uint32_t count = 0;
while(!cursor.get(key, data, first ? MDB_FIRST : MDB_NEXT_NODUP)) {
++count;
first=false;
}
return count;
}
2018-12-16 20:28:49 +01:00
//! End iderator type
struct eiter_t
{};
2018-12-15 21:06:47 +01:00
// can be on main, or on an index
// when on main, return data directly
// when on index, indirect
2018-12-16 20:28:49 +01:00
// we can be limited to one key, or iterate over entire database
// iter requires you to put the cursor in the right place first!
struct iter_t
{
2018-12-15 21:06:47 +01:00
explicit iter_t(Parent* parent, typename Parent::cursor_t&& cursor, bool on_index, bool one_key, bool end=false) :
d_parent(parent),
2018-12-15 21:06:47 +01:00
d_cursor(std::move(cursor)),
2018-12-16 20:28:49 +01:00
d_on_index(on_index), // is this an iterator on main database or on index?
d_one_key(one_key), // should we stop at end of key? (equal range)
2018-12-15 21:06:47 +01:00
d_end(end)
{
2018-12-15 21:06:47 +01:00
if(d_end)
return;
if(d_cursor.get(d_key, d_id, MDB_GET_CURRENT)) {
d_end = true;
return;
}
2018-12-15 21:06:47 +01:00
if(d_on_index) {
if(d_parent->d_txn.get(d_parent->d_parent->d_main, d_id, d_data))
throw std::runtime_error("Missing id in constructor");
serFromString(d_data.get<std::string>(), d_t);
}
else
serFromString(d_id.get<std::string>(), d_t);
}
bool operator!=(const eiter_t& rhs)
{
return !d_end;
}
bool operator==(const eiter_t& rhs)
{
return d_end;
}
const T& operator*()
{
return d_t;
}
const T* operator->()
{
return &d_t;
}
2018-12-16 20:28:49 +01:00
// implements generic ++ or --
2018-12-16 15:58:38 +01:00
iter_t& genoperator(MDB_cursor_op dupop, MDB_cursor_op op)
{
2018-12-15 21:06:47 +01:00
MDBOutVal data;
2018-12-16 15:58:38 +01:00
int rc = d_cursor.get(d_key, d_id, d_one_key ? dupop : op);
if(rc == MDB_NOTFOUND) {
d_end = true;
}
else {
2018-12-15 21:06:47 +01:00
if(d_on_index) {
if(d_parent->d_txn.get(d_parent->d_parent->d_main, d_id, data))
throw std::runtime_error("Missing id field");
serFromString(data.get<std::string>(), d_t);
}
else
serFromString(d_id.get<std::string>(), d_t);
}
return *this;
}
2018-12-15 21:06:47 +01:00
2018-12-16 15:58:38 +01:00
iter_t& operator++()
{
return genoperator(MDB_NEXT_DUP, MDB_NEXT);
}
iter_t& operator--()
{
return genoperator(MDB_PREV_DUP, MDB_PREV);
}
2018-12-16 20:28:49 +01:00
// get ID this iterator points to
2018-12-15 21:06:47 +01:00
uint32_t getID()
{
if(d_on_index)
return d_id.get<uint32_t>();
else
return d_key.get<uint32_t>();
}
2018-12-16 20:28:49 +01:00
// transaction we are part of
Parent* d_parent;
typename Parent::cursor_t d_cursor;
2018-12-16 20:28:49 +01:00
// gcc complains if I don't zero-init these, which is worrying XXX
2018-12-16 15:58:38 +01:00
MDBOutVal d_key{0,0}, d_data{0,0}, d_id{0,0};
2018-12-15 21:06:47 +01:00
bool d_on_index;
bool d_one_key;
bool d_end{false};
T d_t;
};
template<int N>
2018-12-15 21:06:47 +01:00
iter_t begin()
{
2018-12-15 21:06:47 +01:00
typename Parent::cursor_t cursor = d_parent.d_txn.getCursor(std::get<N>(d_parent.d_parent->d_tuple).d_idx);
MDBOutVal out, id;
2018-12-16 15:58:38 +01:00
if(cursor.get(out, id, MDB_FIRST))
{ // on_index, one_key, end
return iter_t{&d_parent, std::move(cursor), true, false, true};
2018-12-15 21:06:47 +01:00
}
return iter_t{&d_parent, std::move(cursor), true, false};
};
iter_t begin()
{
typename Parent::cursor_t cursor = d_parent.d_txn.getCursor(d_parent.d_parent->d_main);
MDBOutVal out, id;
if(cursor.get(out, id, MDB_FIRST)) {
2018-12-16 15:58:38 +01:00
// on_index, one_key, end
return iter_t{&d_parent, std::move(cursor), false, false, true};
2018-12-15 21:06:47 +01:00
}
return iter_t{&d_parent, std::move(cursor), false, false};
};
2018-12-16 20:28:49 +01:00
eiter_t end()
{
return eiter_t();
}
// basis for find, lower_bound
2018-12-15 21:06:47 +01:00
template<int N>
2018-12-16 20:28:49 +01:00
iter_t genfind(const typename std::tuple_element<N, tuple_t>::type::type& key, MDB_cursor_op op)
2018-12-15 21:06:47 +01:00
{
typename Parent::cursor_t cursor = d_parent.d_txn.getCursor(std::get<N>(d_parent.d_parent->d_tuple).d_idx);
MDBInVal in(key);
MDBOutVal out, id;
out.d_mdbval = in.d_mdbval;
2018-12-16 20:28:49 +01:00
if(cursor.get(out, id, op)) {
2018-12-16 15:58:38 +01:00
// on_index, one_key, end
return iter_t{&d_parent, std::move(cursor), true, false, true};
}
return iter_t{&d_parent, std::move(cursor), true, false};
};
2018-12-16 20:28:49 +01:00
template<int N>
iter_t find(const typename std::tuple_element<N, tuple_t>::type::type& key)
{
return genfind<N>(key, MDB_SET);
}
template<int N>
iter_t lower_bound(const typename std::tuple_element<N, tuple_t>::type::type& key)
{
return genfind<N>(key, MDB_SET_RANGE);
}
//! equal range - could possibly be expressed through genfind
2018-12-16 15:58:38 +01:00
template<int N>
std::pair<iter_t,eiter_t> equal_range(const typename std::tuple_element<N, tuple_t>::type::type& key)
{
typename Parent::cursor_t cursor = d_parent.d_txn.getCursor(std::get<N>(d_parent.d_parent->d_tuple).d_idx);
MDBInVal in(key);
MDBOutVal out, id;
out.d_mdbval = in.d_mdbval;
if(cursor.get(out, id, MDB_SET)) {
// on_index, one_key, end
return {iter_t{&d_parent, std::move(cursor), true, true, true}, eiter_t()};
2018-12-15 21:06:47 +01:00
}
2018-12-16 15:58:38 +01:00
return {iter_t{&d_parent, std::move(cursor), true, true}, eiter_t()};
};
2018-12-16 15:58:38 +01:00
Parent& d_parent;
};
class ROTransaction : public ReadonlyOperations<ROTransaction>
{
public:
explicit ROTransaction(TypedDBI* parent) : ReadonlyOperations<ROTransaction>(*this), d_parent(parent), d_txn(d_parent->d_env->getROTransaction())
{
}
ROTransaction(ROTransaction&& rhs) :
ReadonlyOperations<ROTransaction>(*this), d_parent(rhs.d_parent),d_txn(std::move(rhs.d_txn))
{
rhs.d_parent = 0;
}
typedef MDBROCursor cursor_t;
TypedDBI* d_parent;
MDBROTransaction d_txn;
};
class RWTransaction : public ReadonlyOperations<RWTransaction>
{
public:
explicit RWTransaction(TypedDBI* parent) : ReadonlyOperations<RWTransaction>(*this), d_parent(parent), d_txn(d_parent->d_env->getRWTransaction())
{
}
RWTransaction(RWTransaction&& rhs) :
ReadonlyOperations<RWTransaction>(*this),
d_parent(rhs.d_parent), d_txn(std::move(rhs.d_txn))
{
rhs.d_parent = 0;
}
2018-12-16 20:28:49 +01:00
// insert something, with possibly a specific id
2018-12-16 21:46:53 +01:00
uint32_t put(const T& t, uint32_t id=0)
{
if(!id)
id = getMaxID(d_txn, d_parent->d_main) + 1;
d_txn.put(d_parent->d_main, id, serToString(t));
#define insertMacro(N) std::get<N>(d_parent->d_tuple).put(d_txn, t, id);
insertMacro(0);
insertMacro(1);
insertMacro(2);
insertMacro(3);
#undef insertMacro
return id;
}
2018-12-16 20:28:49 +01:00
// modify an item 'in place', plus update indexes
void modify(uint32_t id, std::function<void(T&)> func)
{
T t;
if(!this->get(id, t))
return; // XXX should be exception
func(t);
del(id); // this is the lazy way. We could test for changed index fields
2018-12-16 21:46:53 +01:00
put(t, id);
}
2018-12-16 20:28:49 +01:00
//! delete an item, and from indexes
void del(uint32_t id)
{
T t;
if(!this->get(id, t))
return;
d_txn.del(d_parent->d_main, id);
clearIndex(id, t);
}
2018-12-16 20:28:49 +01:00
//! clear database & indexes (by hand!)
void clear()
{
auto cursor = d_txn.getCursor(d_parent->d_main);
bool first = true;
MDBOutVal key, data;
while(!cursor.get(key, data, first ? MDB_FIRST : MDB_NEXT)) {
first = false;
T t;
serFromString(data.get<std::string>(), t);
clearIndex(key.get<uint32_t>(), t);
cursor.del();
}
}
2018-12-16 20:28:49 +01:00
//! commit this transaction
void commit()
{
d_txn.commit();
}
2018-12-16 20:28:49 +01:00
//! abort this transaction
void abort()
{
d_txn.abort();
}
typedef MDBRWCursor cursor_t;
2018-12-14 23:46:46 +01:00
private:
2018-12-16 20:28:49 +01:00
// clear this ID from all indexes
2018-12-14 23:46:46 +01:00
void clearIndex(uint32_t id, const T& t)
{
#define clearMacro(N) std::get<N>(d_parent->d_tuple).del(d_txn, t, id);
clearMacro(0);
clearMacro(1);
clearMacro(2);
clearMacro(3);
#undef clearMacro
2018-12-14 23:46:46 +01:00
}
public:
2018-12-14 23:46:46 +01:00
TypedDBI* d_parent;
MDBRWTransaction d_txn;
};
2018-12-16 20:28:49 +01:00
//! Get an RW transaction
2018-12-14 23:46:46 +01:00
RWTransaction getRWTransaction()
{
return RWTransaction(this);
}
2018-12-16 20:28:49 +01:00
//! Get an RO transaction
ROTransaction getROTransaction()
{
return ROTransaction(this);
}
2018-12-14 23:46:46 +01:00
private:
std::shared_ptr<MDBEnv> d_env;
MDBDbi d_main;
std::string d_name;
};