pyflo/pybtc/_lru/lru.c
2019-05-12 21:59:24 +04:00

713 lines
21 KiB
C

#include <Python.h>
/*
* This is a simple implementation of LRU Dict that uses a Python dict and an associated doubly linked
* list to keep track of recently inserted/accessed items.
*
* Dict will store: key -> Node mapping, where Node is a linked list node.
* The Node itself will contain the value as well as the key.
*
* For eg:
*
* >>> l = LRU(2)
* >>> l[0] = 'foo'
* >>> l[1] = 'bar'
*
* can be visualised as:
*
* ---+--(hash(0)--+--hash(1)--+
* self->dict ...| | |
* ---+-----|------+---------|-+
* | |
* +-----v------+ +-----v------+
* self->first--->|<'foo'>, <0>|-->|<'bar'>, <1>|<---self->last
* +--| |<--| |--+
* | +------------+ +------------+ |
* v v
* NULL NULL
*
* The invariant is to maintain the list to reflect the LRU order of items in the dict.
* self->first will point to the MRU item and self-last to LRU item. Size of list will not
* grow beyond size of LRU dict.
*
*/
#ifndef Py_TYPE
#define Py_TYPE(ob) (((PyObject*)(ob))->ob_type)
#endif
#define GET_NODE(d, key) (Node *) Py_TYPE(d)->tp_as_mapping->mp_subscript((d), (key))
#define PUT_NODE(d, key, node) Py_TYPE(d)->tp_as_mapping->mp_ass_subscript((d), (key), ((PyObject *)node))
/* If someone figures out how to enable debug builds with setuptools, you can delete this */
#if 0
#undef assert
#define str(s) #s
#define assert(v) \
do { \
if (!(v)) { \
fprintf(stderr, "Assertion failed: %s on %s:%d\n", \
str(v), __FILE__, __LINE__); \
fflush(stderr); \
abort(); \
} \
} while(0)
#endif
typedef struct _Node {
PyObject_HEAD
PyObject * value;
PyObject * key;
struct _Node * prev;
struct _Node * next;
} Node;
static void node_dealloc(Node* self)
{
Py_DECREF(self->key);
Py_DECREF(self->value);
assert(self->prev == NULL);
assert(self->next == NULL);
PyObject_Del((PyObject*)self);
}
static PyObject*node_repr(Node* self) { return PyObject_Repr(self->value);}
static PyTypeObject NodeType = {
PyVarObject_HEAD_INIT(NULL, 0)
"lru.Node", /* tp_name */
sizeof(Node), /* tp_basicsize */
0, /* tp_itemsize */
(destructor)node_dealloc,/* tp_dealloc */
0, /* tp_print */
0, /* tp_getattr */
0, /* tp_setattr */
0, /* tp_compare */
(reprfunc)node_repr, /* tp_repr */
0, /* tp_as_number */
0, /* tp_as_sequence */
0, /* tp_as_mapping */
0, /* tp_hash */
0, /* tp_call */
0, /* tp_str */
0, /* tp_getattro */
0, /* tp_setattro */
0, /* tp_as_buffer */
Py_TPFLAGS_DEFAULT, /* tp_flags */
"Linked List Node", /* tp_doc */
0, /* tp_traverse */
0, /* tp_clear */
0, /* tp_richcompare */
0, /* tp_weaklistoffset */
0, /* tp_iter */
0, /* tp_iternext */
0, /* tp_methods */
0, /* tp_members */
0, /* tp_getset */
0, /* tp_base */
0, /* tp_dict */
0, /* tp_descr_get */
0, /* tp_descr_set */
0, /* tp_dictoffset */
0, /* tp_init */
0, /* tp_alloc */
0, /* tp_new */
};
typedef struct {
PyObject_HEAD
PyObject * dict;
Node * first;
Node * last;
Py_ssize_t size;
} LRU;
static void lru_remove_node(LRU *self, Node* node)
{
if (self->first == node) {
self->first = node->next;
}
if (self->last == node) {
self->last = node->prev;
}
if (node->prev) {
node->prev->next = node->next;
}
if (node->next) {
node->next->prev = node->prev;
}
node->next = node->prev = NULL;
}
static void lru_add_node_at_head(LRU *self, Node* node)
{
node->prev = NULL;
if (!self->first) {
self->first = self->last = node;
node->next = NULL;
} else {
node->next = self->first;
if (node->next) {
node->next->prev = node;
}
self->first = node;
}
}
static void lru_add_node_at_tail(LRU *self, Node* node)
{
node->next = NULL;
if (!self->first) {
self->first = self->last = node;
node->prev = NULL;
} else {
node->prev = self->last;
if (node->prev) {
node->prev->next = node;
}
self->last = node;
}
}
static void lru_delete_last(LRU *self)
{
Node* n = self->last;
if (!self->last) return;
lru_remove_node(self, n);
PUT_NODE(self->dict, n->key, NULL);
}
static Py_ssize_t lru_length(LRU *self) { return PyDict_Size(self->dict); }
static PyObject *LRU_contains_key(LRU *self, PyObject *key)
{
if (PyDict_Contains(self->dict, key)) {
Py_RETURN_TRUE;
} else {
Py_RETURN_FALSE;
}
}
static PyObject *LRU_contains(LRU *self, PyObject *args)
{
PyObject *key;
if (!PyArg_ParseTuple(args, "O", &key)) return NULL;
return LRU_contains_key(self, key);
}
static int LRU_seq_contains(LRU *self, PyObject *key) { return PyDict_Contains(self->dict, key); }
static PyObject *lru_subscript(LRU *self, register PyObject *key)
{
Node *node = GET_NODE(self->dict, key);
if (!node) return NULL;
Py_INCREF(node->value);
Py_DECREF(node);
return node->value;
}
static PyObject *LRU_pop(LRU *self)
{
if (self->last) {
PyObject *tuple = PyTuple_New(2);
Py_INCREF(self->last->key);
PyTuple_SET_ITEM(tuple, 0, self->last->key);
Py_INCREF(self->last->value);
PyTuple_SET_ITEM(tuple, 1, self->last->value);
Node* n = self->last;
lru_remove_node(self, n);
PUT_NODE(self->dict, n->key, NULL);
return tuple;
}
else Py_RETURN_NONE;
}
static PyObject *LRU_get(LRU *self, PyObject *args)
{
PyObject *key;
PyObject *instead = NULL;
PyObject *result;
if (!PyArg_ParseTuple(args, "O|O", &key, &instead)) return NULL;
result = lru_subscript(self, key);
PyErr_Clear(); /* GET_NODE sets an exception on miss. Shut it up. */
if (result) return result;
if (!instead) { Py_RETURN_NONE; }
Py_INCREF(instead);
return instead;
}
static PyObject *LRU_delete(LRU *self, PyObject *args)
{
PyObject *key;
PyObject *instead = NULL;
PyObject *tuple = PyTuple_New(2);
if (!PyArg_ParseTuple(args, "O|O", &key, &instead)) return NULL;
Node *node = GET_NODE(self->dict, key);
if (!node) {
if (!instead) { Py_RETURN_NONE; }
Py_INCREF(instead);
return instead;
} else {
Py_INCREF(node->key);
PyTuple_SET_ITEM(tuple, 0, node->key);
Py_INCREF(node->value);
PyTuple_SET_ITEM(tuple, 1, node->value);
lru_remove_node(self, node);
PUT_NODE(self->dict, node->key, NULL);
return tuple;
}
}
static int lru_append(LRU *self, PyObject *key, PyObject *value)
{
int res = 0;
Node *node = GET_NODE(self->dict, key);
PyErr_Clear(); /* GET_NODE sets an exception on miss. Shut it up. */
if (value) {
if (node) {
Py_INCREF(value);
Py_DECREF(node->value);
node->value = value;
res = 0;
} else {
node = PyObject_NEW(Node, &NodeType);
node->key = key;
node->value = value;
node->next = node->prev = NULL;
Py_INCREF(key);
Py_INCREF(value);
res = PUT_NODE(self->dict, key, node);
if (res == 0) {
if (self->size > 0 && lru_length(self) > self->size) lru_delete_last(self);
lru_add_node_at_tail(self, node);
}
}
} else {
if (PUT_NODE(self->dict, key, NULL) == 0) lru_remove_node(self, node);
}
Py_XDECREF(node);
return res;
}
static int lru_ass_sub(LRU *self, PyObject *key, PyObject *value)
{
int res = 0;
Node *node = GET_NODE(self->dict, key);
PyErr_Clear(); /* GET_NODE sets an exception on miss. Shut it up. */
if (value) {
if (node) {
Py_INCREF(value);
Py_DECREF(node->value);
node->value = value;
res = 0;
} else {
node = PyObject_NEW(Node, &NodeType);
node->key = key;
node->value = value;
node->next = node->prev = NULL;
Py_INCREF(key);
Py_INCREF(value);
res = PUT_NODE(self->dict, key, node);
if (res == 0) {
if (self->size > 0 && lru_length(self) > self->size) lru_delete_last(self);
lru_add_node_at_head(self, node);
}
}
} else {
if (PUT_NODE(self->dict, key, NULL) == 0) lru_remove_node(self, node);
}
Py_XDECREF(node);
return res;
}
static int lru_put(LRU *self, PyObject *key, PyObject *value)
{
int res = 0;
Node *node = PyObject_NEW(Node, &NodeType);
node->key = key;
node->value = value;
node->next = node->prev = NULL;
Py_INCREF(key);
Py_INCREF(value);
res = PUT_NODE(self->dict, key, node);
if (res == 0) {
if (self->size > 0 && lru_length(self) > self->size) lru_delete_last(self);
lru_add_node_at_head(self, node);
}
Py_XDECREF(node);
return res;
}
static PyMappingMethods LRU_as_mapping = {
(lenfunc)lru_length, /*mp_length*/
(binaryfunc)lru_subscript, /*mp_subscript*/
(objobjargproc)lru_ass_sub, /*mp_ass_subscript*/
};
static PyObject *collect(LRU *self, PyObject * (*getterfunc)(Node *))
{
register PyObject *v;
Node *curr;
int i;
v = PyList_New(lru_length(self));
if (v == NULL)
return NULL;
curr = self->first;
i = 0;
while (curr) {
PyList_SET_ITEM(v, i++, getterfunc(curr));
curr = curr->next;
}
assert(i == lru_length(self));
return v;
}
static PyObject *get_key(Node *node)
{
Py_INCREF(node->key);
return node->key;
}
static PyObject *LRU_append(LRU *self, PyObject *args, PyObject *kwargs)
{
PyObject *key, *value;
PyObject *arg = NULL;
Py_ssize_t pos = 0;
if ((PyArg_ParseTuple(args, "|O", &arg))) {
if (arg && PyDict_Check(arg)) {
while (PyDict_Next(arg, &pos, &key, &value))
lru_append(self, key, value);
}
}
if (kwargs != NULL && PyDict_Check(kwargs)) {
while (PyDict_Next(kwargs, &pos, &key, &value))
lru_append(self, key, value);
}
Py_RETURN_NONE;
}
static PyObject *LRU_update(LRU *self, PyObject *args, PyObject *kwargs)
{
PyObject *key, *value;
PyObject *arg = NULL;
Py_ssize_t pos = 0;
if ((PyArg_ParseTuple(args, "|O", &arg))) {
if (arg && PyDict_Check(arg)) {
while (PyDict_Next(arg, &pos, &key, &value))
lru_ass_sub(self, key, value);
}
}
if (kwargs != NULL && PyDict_Check(kwargs)) {
while (PyDict_Next(kwargs, &pos, &key, &value))
lru_ass_sub(self, key, value);
}
Py_RETURN_NONE;
}
static PyObject *LRU_put(LRU *self, PyObject *args, PyObject *kwargs)
{
PyObject *key, *value;
PyObject *arg = NULL;
Py_ssize_t pos = 0;
if ((PyArg_ParseTuple(args, "|O", &arg))) {
if (arg && PyDict_Check(arg)) {
while (PyDict_Next(arg, &pos, &key, &value))
lru_put(self, key, value);
}
}
if (kwargs != NULL && PyDict_Check(kwargs)) {
while (PyDict_Next(kwargs, &pos, &key, &value))
lru_put(self, key, value);
}
Py_RETURN_NONE;
}
static PyObject *LRU_peek_first_item(LRU *self)
{
if (self->first) {
PyObject *tuple = PyTuple_New(2);
Py_INCREF(self->first->key);
PyTuple_SET_ITEM(tuple, 0, self->first->key);
Py_INCREF(self->first->value);
PyTuple_SET_ITEM(tuple, 1, self->first->value);
return tuple;
}
else Py_RETURN_NONE;
}
static PyObject *LRU_peek_last_item(LRU *self)
{
if (self->last) {
PyObject *tuple = PyTuple_New(2);
Py_INCREF(self->last->key);
PyTuple_SET_ITEM(tuple, 0, self->last->key);
Py_INCREF(self->last->value);
PyTuple_SET_ITEM(tuple, 1, self->last->value);
return tuple;
}
else Py_RETURN_NONE;
}
static PyObject *LRU_keys(LRU *self) { return collect(self, get_key); }
static PyObject *get_value(Node *node)
{
Py_INCREF(node->value);
return node->value;
}
static PyObject *LRU_values(LRU *self) { return collect(self, get_value); }
static PyObject *get_item(Node *node)
{
PyObject *tuple = PyTuple_New(2);
Py_INCREF(node->key);
PyTuple_SET_ITEM(tuple, 0, node->key);
Py_INCREF(node->value);
PyTuple_SET_ITEM(tuple, 1, node->value);
return tuple;
}
static PyObject *LRU_items(LRU *self) { return collect(self, get_item); }
static PyObject *LRU_set_size(LRU *self, PyObject *args, PyObject *kwds)
{
Py_ssize_t newSize;
if (!PyArg_ParseTuple(args, "n", &newSize)) return NULL;
if (newSize < 0) {
PyErr_SetString(PyExc_ValueError, "Size should be a positive number");
return NULL;
}
while (lru_length(self) > newSize) lru_delete_last(self);
self->size = newSize;
Py_RETURN_NONE;
}
static PyObject *LRU_clear(LRU *self)
{
Node *c = self->first;
while (c) {
Node* n = c;
c = c->next;
lru_remove_node(self, n);
}
PyDict_Clear(self->dict);
Py_RETURN_NONE;
}
static PyObject *LRU_get_size(LRU *self) { return Py_BuildValue("i", self->size); }
/* Hack to implement "key in lru" */
static PySequenceMethods lru_as_sequence = {
0, /* sq_length */
0, /* sq_concat */
0, /* sq_repeat */
0, /* sq_item */
0, /* sq_slice */
0, /* sq_ass_item */
0, /* sq_ass_slice */
(objobjproc) LRU_seq_contains, /* sq_contains */
0, /* sq_inplace_concat */
0, /* sq_inplace_repeat */
};
static PyMethodDef LRU_methods[] = {
{"__contains__", (PyCFunction)LRU_contains_key, METH_O | METH_COEXIST,
PyDoc_STR("L.__contains__(key) -> Check if key is there in L")},
{"keys", (PyCFunction)LRU_keys, METH_NOARGS,
PyDoc_STR("L.keys() -> list of L's keys in MRU order")},
{"values", (PyCFunction)LRU_values, METH_NOARGS,
PyDoc_STR("L.values() -> list of L's values in MRU order")},
{"items", (PyCFunction)LRU_items, METH_NOARGS,
PyDoc_STR("L.items() -> list of L's items (key,value) in MRU order")},
{"has_key", (PyCFunction)LRU_contains, METH_VARARGS,
PyDoc_STR("L.has_key(key) -> Check if key is there in L")},
{"get", (PyCFunction)LRU_get, METH_VARARGS,
PyDoc_STR("L.get(key, instead) -> If L has key return its value, otherwise instead")},
{"delete", (PyCFunction)LRU_delete, METH_VARARGS,
PyDoc_STR("L.get(key, instead) -> If L has key return its value, otherwise instead")},
{"set_size", (PyCFunction)LRU_set_size, METH_VARARGS,
PyDoc_STR("L.set_size() -> set size of LRU")},
{"get_size", (PyCFunction)LRU_get_size, METH_NOARGS,
PyDoc_STR("L.get_size() -> get size of LRU")},
{"clear", (PyCFunction)LRU_clear, METH_NOARGS,
PyDoc_STR("L.clear() -> clear LRU")},
{"peek_first_item", (PyCFunction)LRU_peek_first_item, METH_NOARGS,
PyDoc_STR("L.peek_first_item() -> returns the MRU item (key,value) without changing key order")},
{"peek_last_item", (PyCFunction)LRU_peek_last_item, METH_NOARGS,
PyDoc_STR("L.peek_last_item() -> returns the LRU item (key,value) without changing key order")},
{"pop", (PyCFunction)LRU_pop, METH_NOARGS,
PyDoc_STR("L.pop() -> returns the LRU item (key,value) without changing key order")},
{"update", (PyCFunction)LRU_update, METH_VARARGS | METH_KEYWORDS,
PyDoc_STR("L.update() -> update value for key in LRU")},
{"put", (PyCFunction)LRU_put, METH_VARARGS | METH_KEYWORDS,
PyDoc_STR("L.append() -> append value for key in LRU")},
{"append", (PyCFunction)LRU_append, METH_VARARGS | METH_KEYWORDS,
PyDoc_STR("L.append() -> append value for key in LRU")},
{NULL, NULL},
};
static PyObject*LRU_repr(LRU* self) { return PyObject_Repr(self->dict); }
static int LRU_init(LRU *self, PyObject *args, PyObject *kwds)
{
static char *kwlist[] = {"size", NULL};
if (!PyArg_ParseTupleAndKeywords(args, kwds, "|n", kwlist, &self->size)) self->size = 0;
if ((Py_ssize_t)self->size < 0) {
PyErr_SetString(PyExc_ValueError, "Size should be a positive number");
return -1;
}
self->dict = PyDict_New();
self->first = self->last = NULL;
return 0;
}
static void
LRU_dealloc(LRU *self)
{
if (self->dict) {
LRU_clear(self);
Py_DECREF(self->dict);
}
PyObject_Del((PyObject*)self);
}
PyDoc_STRVAR(lru_doc,
"LRU(size) -> new LRU dict that can store up to size elements\n"
"An LRU dict behaves like a standard dict, except that it stores only fixed\n"
"set of elements. Once the size overflows, it evicts least recently used\n"
"items. \n\n"
"Eg:\n"
">>> l = LRU(3)\n"
">>> for i in range(5):\n"
">>> l[i] = str(i)\n"
">>> l.keys()\n"
"[2,3,4]\n\n"
"Note: An LRU(n) can be thought of as a dict that will have the most\n"
"recently accessed n items.\n");
static PyTypeObject LRUType = {
PyVarObject_HEAD_INIT(NULL, 0)
"_lru.LRU", /* tp_name */
sizeof(LRU), /* tp_basicsize */
0, /* tp_itemsize */
(destructor)LRU_dealloc, /* tp_dealloc */
0, /* tp_print */
0, /* tp_getattr */
0, /* tp_setattr */
0, /* tp_compare */
(reprfunc)LRU_repr, /* tp_repr */
0, /* tp_as_number */
&lru_as_sequence, /* tp_as_sequence */
&LRU_as_mapping, /* tp_as_mapping */
0, /* tp_hash */
0, /* tp_call */
0, /* tp_str */
0, /* tp_getattro */
0, /* tp_setattro */
0, /* tp_as_buffer */
Py_TPFLAGS_DEFAULT, /* tp_flags */
lru_doc, /* tp_doc */
0, /* tp_traverse */
0, /* tp_clear */
0, /* tp_richcompare */
0, /* tp_weaklistoffset */
0, /* tp_iter */
0, /* tp_iternext */
LRU_methods, /* tp_methods */
0, /* tp_members */
0, /* tp_getset */
0, /* tp_base */
0, /* tp_dict */
0, /* tp_descr_get */
0, /* tp_descr_set */
0, /* tp_dictoffset */
(initproc)LRU_init, /* tp_init */
0, /* tp_alloc */
0, /* tp_new */
};
static struct PyModuleDef moduledef = {
PyModuleDef_HEAD_INIT,
"_lru", /* m_name */
lru_doc, /* m_doc */
-1, /* m_size */
NULL, /* m_methods */
NULL, /* m_reload */
NULL, /* m_traverse */
NULL, /* m_clear */
NULL, /* m_free */
};
static PyObject *moduleinit(void) {
PyObject *m;
NodeType.tp_new = PyType_GenericNew;
if (PyType_Ready(&NodeType) < 0) return NULL;
LRUType.tp_new = PyType_GenericNew;
if (PyType_Ready(&LRUType) < 0) return NULL;
m = PyModule_Create(&moduledef);
if (m == NULL) return NULL;
Py_INCREF(&NodeType);
Py_INCREF(&LRUType);
PyModule_AddObject(m, "LRU", (PyObject *) &LRUType);
return m;
}
PyMODINIT_FUNC PyInit__lru(void) { return moduleinit(); }