Commit 35eb95c2 authored by Kirill Smelkov's avatar Kirill Smelkov

bigfile: Python wrapper around virtual memory subsystem

Exposes BigFile - this way users can define BigFile backend in Python.

Also exposed are BigFile handles, and VMA objects which are results of
mmaping.
parent 8ba39a60
......@@ -16,3 +16,7 @@
# warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#
# See COPYING file for full licensing terms.
"""TODO big module-level picture description"""
from ._bigfile import BigFile, WRITEOUT_STORE, WRITEOUT_MARKSTORED, ram_reclaim
This diff is collapsed.
# Wendeling.core.bigfile | Basic tests
# Copyright (C) 2014-2015 Nexedi SA and Contributors.
# Kirill Smelkov <kirr@nexedi.com>
#
# This program is free software: you can Use, Study, Modify and Redistribute
# it under the terms of the GNU General Public License version 3, or (at your
# option) any later version, as published by the Free Software Foundation.
#
# You can also Link and Combine this program with other software covered by
# the terms of any of the Open Source Initiative approved licenses and Convey
# the resulting work. Corresponding source of such a combination shall include
# the source code for all other software used.
#
# This program is distributed WITHOUT ANY WARRANTY; without even the implied
# warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#
# See COPYING file for full licensing terms.
# TODO description
from wendelin.bigfile import BigFile, WRITEOUT_STORE, WRITEOUT_MARKSTORED
import struct
import weakref
import sys
from pytest import raises
from six import PY2
# read-only attributes are reported differently on py2 & py3
ROAttributeError = (PY2 and TypeError or AttributeError)
# on python2 memoryview[i] returns str, on python3 uint
bchr_py2 = (PY2 and chr or (lambda _: _))
bord_py3 = (PY2 and (lambda _: _) or ord)
# Synthetic bigfile that for #blk
# - loads generated ~ #blk bytes and
# - remembers stores #blk in .storev[]
class XBigFile(BigFile):
def __new__(cls, head, blksize):
obj = BigFile.__new__(cls, blksize)
obj.head = head
obj.storev = []
return obj
# load: fill head with head, later with #blk
def loadblk(self, blk, buf):
# head + <byte-fill> to tail...
hlen = len(self.head)
tlen = self.blksize - hlen
fillbyte = blk & 0xff
v = [self.head] + [fillbyte]*tlen
struct.pack_into("%is%iB" % (hlen, tlen), buf, 0, *v)
# store: store #blk in storev
def storeblk(self, blk, buf):
self.storev.append(blk)
# XXX hack, hardcoded
MB = 1024*1024
PS = 2*MB
# basic loadblk/storeblk test
def test_basic():
f = XBigFile(b'abcd', PS)
assert f.blksize == PS
raises(ROAttributeError, "f.blksize = 1") # RO attribute
assert f.head == b'abcd'
fh = f.fileh_open() # TODO + ram
vma = fh.mmap(100, 4)
m = memoryview(vma)
if PY2:
b = buffer(vma) # `buffer` is not available in python3
else:
b = memoryview(vma) # no harm testing with memoryview twice
assert len(m) == 4*PS
assert len(b) == 4*PS
# read
for p in range(4):
_ = p*PS
assert b[_+0:_+4] == b'abcd'
assert b[_+5] == bchr_py2(100+p)
assert b[_+PS-1] == bchr_py2(100+p)
assert m[_+0:_+4] == b'abcd'
assert m[_+5] == bchr_py2(100+p)
assert m[_+PS-1] == bchr_py2(100+p)
# write
m[2*PS + 7] = bord_py3(b'A') # write -> page[102]
assert b[2*PS + 7] == bord_py3('A') # ensure b & m point to the same memory
m[7] = bord_py3(b'B') # write -> page[100]
assert f.storev == []
fh.dirty_writeout(WRITEOUT_STORE)
assert f.storev == [100, 102] # pages we wrote in ascending order
f.storev = []
fh.dirty_writeout(WRITEOUT_STORE)
assert f.storev == [100, 102] # again, because was not marked yet
f.storev = []
fh.dirty_writeout(WRITEOUT_STORE | WRITEOUT_MARKSTORED)
assert f.storev == [100, 102] # again, because was not marked yet
f.storev = []
fh.dirty_writeout(WRITEOUT_STORE)
assert f.storev == [] # nothing wrote - all dirty were just marked
# TODO close f
# test that python exception state is preserved across pagefaulting
def test_pagefault_savestate():
class BadFile(BigFile):
def loadblk(self, blk, buf):
# simulate some errors in-between to overwrite thread exception
# state, and say we are done ok
try:
1/0
except ZeroDivisionError:
pass
exc_type, exc_value, exc_traceback = sys.exc_info()
if PY2:
assert exc_type is ZeroDivisionError
else:
# on python3 exception state is cleared upon exiting from `except`
assert exc_type is None
# NOTE there is a loop created here:
#
# exc_traceback
# | ^
# | |
# v .f_localsplus
# frame
#
# Since upon returning we can't hold a reference to buf, let's
# break the loop explicitly.
#
# Otherwise both exc_traceback and frame will be alive until next
# gc.collect() which cannot be perform in pagefault handler.
#
# Not breaking this loop will BUG with `buf.refcnt != 1` on return
del exc_traceback
self.loadblk_run = 1
f = BadFile(PS)
fh = f.fileh_open()
vma = fh.mmap(0, 1)
m = memoryview(vma)
f.loadblk_run = 0
try:
raise RuntimeError('hello')
except RuntimeError:
exc_type, exc_value, exc_tb = sys.exc_info()
assert exc_type is RuntimeError
assert exc_value.args == ('hello',)
assert m[0] == bchr_py2(0) # NOTE causes pagefault handler to run
assert f.loadblk_run == 1
exc_type2, exc_value2, exc_tb2 = sys.exc_info()
assert exc_type is exc_type2
assert exc_value is exc_value2
assert exc_tb is exc_tb2
# TODO close f
# test that vma/fileh/file correctly refcount each other
def test_refcounting():
# fileh holds file
f = XBigFile(b'abcd', PS)
wf = weakref.ref(f)
assert wf() is f
fh = f.fileh_open()
assert wf() is f
idf = id(f)
del f
f_ = wf()
assert f_ is not None
assert id(f_) == idf
del f_, fh
assert wf() is None
# vma holds fileh
f = XBigFile(b'abcd', PS)
fh = f.fileh_open()
wfh = weakref.ref(fh)
assert wfh() is fh
vma = fh.mmap(0, 1)
assert wfh() is fh
idfh = id(fh)
del fh
fh_ = wfh()
assert fh_ is not None
assert id(fh_) == idfh
del fh_, vma
assert wfh() is None
# vma is weakly-referencable too
fh = f.fileh_open()
vma = fh.mmap(0, 1)
wvma= weakref.ref(vma)
assert wvma() is vma
idvma = id(vma)
m = memoryview(vma)
del vma
vma_ = wvma()
assert vma_ is not None
assert id(vma_) == idvma
del vma_
assert wvma() is not None
del m
assert wvma() is None
#ifndef _WENDELIN_COMPAT_PY2_H
#define _WENDELIN_COMPAT_PY2_H
/* compatibility with python2 */
#include <Python.h>
/* in python2 it was indicating support for memoryview */
#ifndef Py_TPFLAGS_HAVE_NEWBUFFER
# define Py_TPFLAGS_HAVE_NEWBUFFER 0L
#endif
/* PyMemoryView_FromMemory for python2
* (taking PY2 PyMemoryView_FromBuffer, and
* PY3 PyMemoryView_FromMemory as templates)
*/
#if PY_MAJOR_VERSION < 3
static inline PyObject *
PyMemoryView_FromMemory(char *mem, Py_ssize_t size, int flags)
{
PyMemoryViewObject *mview;
int readonly;
mview = (PyMemoryViewObject *)
PyObject_GC_New(PyMemoryViewObject, &PyMemoryView_Type);
if (mview == NULL)
return NULL;
mview->base = NULL;
readonly = (flags == PyBUF_WRITE) ? 0 : 1;
(void)PyBuffer_FillInfo(&mview->view, NULL, mem, size, readonly,
PyBUF_FULL_RO);
_PyObject_GC_TRACK(mview);
return (PyObject *)mview;
}
#endif
#endif
......@@ -183,6 +183,8 @@ setup(
find_packages(exclude='3rdparty')],
install_requires = [
'numpy', # lib/mem
'six', # compat py2/py3
],
extras_require = {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment