bigfile: Basic benchmarks

- for virtual memory subsystem - for ZBigFiles They are not currently great, e.g. for virtmem we have in-kernel overhead of page clearing - in perf profiles, for bigfile_mmap compared to file_read, the kernel's clear_page_c rises significantly. That is the worker for clearing page memory and we currently cannot avoid that - any memory obtained from the kernel (MAP_ANONYMOUS, mmap(file) with hole, etc...) comes to userspace pre-initialized to zeros. This can be seen in the benchmarks as well: file_readbig differs from file_read only in that the latter uses 1 small buffer and the former allocates large memory (cleared by kernel + python does the memset). bigfile/tests/bench_virtmem.py@125::bench_file_mmap_adler32 0.47 (0.86 0.49 0.47) bigfile/tests/bench_virtmem.py@126::bench_file_read_adler32 0.69 (1.11 0.71 0.69) bigfile/tests/bench_virtmem.py@127::bench_file_readbig_adler32 1.41 (1.70 1.42 1.41) bigfile/tests/bench_virtmem.py@128::bench_bigfile_mmap_adler32 1.42 (1.45 1.42 1.51) bigfile/tests/bench_virtmem.py@130::bench_file_mmap_md5 1.52 (1.91 1.54 1.52) bigfile/tests/bench_virtmem.py@131::bench_file_read_md5 1.73 (2.10 1.75 1.73) bigfile/tests/bench_virtmem.py@132::bench_file_readbig_md5 2.44 (2.73 2.46 2.44) bigfile/tests/bench_virtmem.py@133::bench_bigfile_mmap_md5 2.40 (2.48 2.40 2.53) There is MAP_UNINITIALIZED which works only for non-mmu targets and only if explicitly allowed when configuring the kernel (off by default). There were patches to disable that page zeroing, as it gives significant speedup for people's workloads, e.g. [1,2], but none of them got merged for security reasons. [1] http://marc.info/?t=132691315900001&r=1&w=2 [2] http://thread.gmane.org/gmane.linux.kernel/548926 ~~~~ For ZBigFile - it is the storage that dominates in profiles.

bigfile: Basic benchmarks
- for virtual memory subsystem - for ZBigFiles They are not currently great, e.g. for virtmem we have in-kernel overhead of page clearing - in perf profiles, for bigfile_mmap compared to file_read, the kernel's clear_page_c rises significantly. That is the worker for clearing page memory and we currently cannot avoid that - any memory obtained from the kernel (MAP_ANONYMOUS, mmap(file) with hole, etc...) comes to userspace pre-initialized to zeros. This can be seen in the benchmarks as well: file_readbig differs from file_read only in that the latter uses 1 small buffer and the former allocates large memory (cleared by kernel + python does the memset). bigfile/tests/bench_virtmem.py@125::bench_file_mmap_adler32 0.47 (0.86 0.49 0.47) bigfile/tests/bench_virtmem.py@126::bench_file_read_adler32 0.69 (1.11 0.71 0.69) bigfile/tests/bench_virtmem.py@127::bench_file_readbig_adler32 1.41 (1.70 1.42 1.41) bigfile/tests/bench_virtmem.py@128::bench_bigfile_mmap_adler32 1.42 (1.45 1.42 1.51) bigfile/tests/bench_virtmem.py@130::bench_file_mmap_md5 1.52 (1.91 1.54 1.52) bigfile/tests/bench_virtmem.py@131::bench_file_read_md5 1.73 (2.10 1.75 1.73) bigfile/tests/bench_virtmem.py@132::bench_file_readbig_md5 2.44 (2.73 2.46 2.44) bigfile/tests/bench_virtmem.py@133::bench_bigfile_mmap_md5 2.40 (2.48 2.40 2.53) There is MAP_UNINITIALIZED which works only for non-mmu targets and only if explicitly allowed when configuring the kernel (off by default). There were patches to disable that page zeroing, as it gives significant speedup for people's workloads, e.g. [1,2], but none of them got merged for security reasons. [1] http://marc.info/?t=132691315900001&r=1&w=2 [2] http://thread.gmane.org/gmane.linux.kernel/548926 ~~~~ For ZBigFile - it is the storage that dominates in profiles.
bb9d8bf1 · Kirill Smelkov · bcab1246 · bb9d8bf1 · bb9d8bf1 · bb9d8bf1
Commit bb9d8bf1 authored Apr 03, 2015 by Kirill Smelkov
Showing with 400 additions and 0 deletions

bigfile/tests/bench_0virtmem.py bigfile/tests/bench_0virtmem.py +177 -0

bigfile/tests/bench_1filezodb.py bigfile/tests/bench_1filezodb.py +68 -0

lib/testing.py lib/testing.py +155 -0

No files found.
--- a/bigfile/tests/bench_0virtmem.py
+++ b/bigfile/tests/bench_0virtmem.py
+# Wendelin.bigfile | benchmarks for virtmem
+#
+# benchmark computing adler32 sum of a whole-hole file via BigFile_File backend
+# and compare that to baseline of doing the same via standard OS services.
+#
+# then do the same benchmarks for file with data.
+import os
+from os import ftruncate, close, unlink, O_RDONLY, O_RDWR, O_TRUNC
+from mmap import mmap, MAP_SHARED, MAP_ANONYMOUS, PROT_READ, PROT_WRITE
+from io import FileIO
+from wendelin.bigfile.file_file import BigFile_File
+from wendelin.bigfile import WRITEOUT_STORE, WRITEOUT_MARKSTORED
+from wendelin.lib.testing import Adler32, nulladler32_bysize, ffadler32_bysize
+from wendelin.lib.mem import bzero, memset
+from tempfile import NamedTemporaryFile
+
+from six import PY2
+from six.moves import range as xrange
+
+# view onto part of obj, of the type the running python handles best:
+#   PY2 -> buffer
+#   PY3 -> memoryview
+# (rationale: a lot of functions do not accept memoryview on py2 - e.g. adler32)
+def xbuffer(obj, offset=0, size=None):
+    """Return a view of `size` items of `obj` starting at `offset`.
+
+    When `size` is omitted the view runs up to the end of `obj`.
+    """
+    nitems = (len(obj) - offset) if size is None else size
+    if not PY2:
+        return memoryview(obj)[offset:offset+nitems]
+    return buffer(obj, offset, nitems)
+
+
+# temporary OS file shared by all benchmarks here; assigned in setup_module
+tmpf = None
+blksize  =   2*1024*1024   # XXX hardcoded
+filesize = 512*1024*1024
+# precomputed adler32 digests looked up by filesize: for all-\0 and all-\xff content
+nulladler32 = nulladler32_bysize(filesize)
+ffadler32   = ffadler32_bysize(filesize)
+
+
+
+# setup whole-hole OS file
+def setup_module():
+    """Create the temporary file and extend it to `filesize` via ftruncate."""
+    global tmpf
+    tmpf = NamedTemporaryFile(prefix='hole.', delete=False)
+    tmpf.close()
+
+    # no data is written - the file is only truncated/extended to its final size
+    holefd = os.open(tmpf.name, O_RDWR | O_TRUNC)
+    ftruncate(holefd, filesize)
+    close(holefd)
+
+def teardown_module():
+    """Remove the temporary file created by setup_module."""
+    os.unlink(tmpf.name)
+
+
+# compute hash via mmaping the file at OS-level
+def _bench_file_mmapread(hasher, expect):
+    """Hash the whole temporary file through a read-only shared mmap.
+
+    `hasher` is called with no arguments to create a hashlib-like object;
+    its digest must equal `expect`.
+    """
+    rfd = os.open(tmpf.name, O_RDONLY)
+    mapping = mmap(rfd, filesize, MAP_SHARED, PROT_READ)
+
+    digester = hasher()
+    digester.update(mapping)
+
+    # release the mapping and the descriptor before checking the result
+    mapping.close()
+    close(rfd)
+    assert digester.digest() == expect
+
+
+# compute hash via reading the file at OS-level
+# uses intermediate 1-blksize buffer
+def _bench_file_read(hasher, expect):
+    """Hash the temporary file by reading it blksize bytes at a time.
+
+    `hasher` is called with no arguments to create a hashlib-like object;
+    its digest must equal `expect`.
+    """
+    src = FileIO(tmpf.name, 'r')
+    chunk = bytearray(blksize)
+
+    digester = hasher()
+    # readinto() returning 0 ends the loop
+    for nread in iter(lambda: src.readinto(chunk), 0):
+        digester.update(xbuffer(chunk, 0, nread))  # NOTE chunk[:nread] does copy
+
+    src.close()
+    assert digester.digest() == expect
+
+
+# compute hash via reading the file at OS-level
+# uses memory buffer ~ filesize
+def _bench_file_readbig(hasher, expect):
+    """Hash the temporary file by reading it into one filesize-long buffer.
+
+    `hasher` is called with no arguments to create a hashlib-like object;
+    its digest must equal `expect`.
+    """
+    f = FileIO(tmpf.name, 'r')
+    # alternative buffer (anonymous mmap) - kept for reference, not used:
+    #b = mmap(-1, filesize, MAP_SHARED | MAP_ANONYMOUS, PROT_READ | PROT_WRITE)
+    b = bytearray(filesize)
+    bm= memoryview(b)   # view used to let readinto() fill b starting at pos
+
+    h = hasher()
+    pos = 0
+    while 1:
+        # read into the not-yet-filled tail of the buffer
+        n = f.readinto(bm[pos:])
+        if n == 0:
+            break
+
+        # hash only the part that was just read
+        h.update(xbuffer(b, pos,n)) # NOTE b[pos:pos+n] does copy
+        pos += n
+
+    # drop the view first, then the big buffer itself
+    del bm
+    del b
+    f.close()
+    assert h.digest() == expect
+
+
+# compute hash via mmaped BigFile_File
+def _bench_bigf_read(hasher, expect):
+    """Hash the temporary file through a BigFile_File mapping.
+
+    `hasher` is called with no arguments to create a hashlib-like object;
+    its digest must equal `expect`.
+    """
+    # bigfile & mapping
+    f   = BigFile_File(tmpf.name, blksize)
+    fh  = f.fileh_open()
+    # NOTE(review): arguments look like (first block, number of blocks) - confirm
+    vma = fh.mmap(0, filesize//blksize)
+
+    # hash of the whole content
+    h = hasher()
+    h.update(vma)
+
+    # TODO cleanup
+    # no explicit close() is called yet - references are dropped in the order
+    # mapping -> file handle -> file
+    del vma #vma.close()
+    del fh  #fh.close()
+    del f   #f.close()
+    assert h.digest() == expect
+
+
+# read benchmarks checked against the all-\0 digest
+# (presumably run while the file is still a hole, i.e. before the write benchmarks below)
+def bench_file_mmapread_hole():
+    _bench_file_mmapread(Adler32, nulladler32)
+
+def bench_file_read_hole():
+    _bench_file_read(Adler32, nulladler32)
+
+def bench_file_readbig_hole():
+    _bench_file_readbig(Adler32, nulladler32)
+
+def bench_bigf_read_hole():
+    _bench_bigf_read(Adler32, nulladler32)
+
+
+# write to file via mmap at OS-level
+def bench_file_mmapwrite0():
+    """Zero the whole temporary file through a writable shared mmap."""
+    wfd = os.open(tmpf.name, O_RDWR)
+    mapping = mmap(wfd, filesize, MAP_SHARED, PROT_READ | PROT_WRITE)
+    bzero(mapping)
+    # NOTE close() calls munmap - thus no mapping.flush() is needed (and flush
+    # calls msync(MS_SYNC) which also does fsync() which we don't want here)
+    mapping.close()
+    del mapping
+    close(wfd)
+
+
+# write to file via OS write
+def bench_file_write55():
+    """Overwrite the temporary file with \\x55 bytes, one blksize block at a time."""
+    out = FileIO(tmpf.name, 'r+')
+    blk55 = b'\x55' * blksize
+    for _ in xrange(filesize // blksize):
+        # write() may accept less than requested - continue from where it stopped
+        written = 0
+        while written < blksize:
+            nwrote = out.write(memoryview(blk55)[written:])
+            assert nwrote != 0
+            written += nwrote
+    out.close()
+
+
+# write to file via mmaped BigFile_File
+def bench_bigf_writeff():
+    """Fill the temporary file with \\xff bytes through a BigFile_File mapping."""
+    # bigfile & mapping
+    f   = BigFile_File(tmpf.name, blksize)
+    fh  = f.fileh_open()
+    # NOTE(review): arguments look like (first block, number of blocks) - confirm
+    vma = fh.mmap(0, filesize//blksize)
+
+    memset(vma, 0xff)
+    # presumably stores the dirtied pages to the file and marks them as stored
+    # - verify against dirty_writeout documentation
+    fh.dirty_writeout(WRITEOUT_STORE | WRITEOUT_MARKSTORED)
+
+    # TODO cleanup
+    # no explicit close() is called yet - references are dropped in the order
+    # mapping -> file handle -> file
+    del vma #vma.close()
+    del fh  #fh.close()
+    del f   #f.close()
+
+
+
+# read benchmarks checked against the all-\xff digest
+# (presumably run after bench_bigf_writeff has filled the file with \xff)
+def bench_file_mmapread():
+    _bench_file_mmapread(Adler32, ffadler32)
+
+def bench_file_read():
+    _bench_file_read(Adler32, ffadler32)
+
+def bench_file_readbig():
+    _bench_file_readbig(Adler32, ffadler32)
+
+def bench_bigf_read():
+    _bench_bigf_read(Adler32, ffadler32)
--- a/bigfile/tests/bench_1filezodb.py
+++ b/bigfile/tests/bench_1filezodb.py
+# Wendelin.bigfile | benchmarks for zodb backend
+#
+# TODO text
+from wendelin.bigfile.file_zodb import ZBigFile
+from wendelin.lib.mem import memset
+from wendelin.lib.testing import Adler32, nulladler32_bysize, ffadler32_bysize
+from wendelin.bigfile.tests.common_zodb import dbopen, dbclose
+import transaction
+from tempfile import mkdtemp
+from shutil import rmtree
+
+# temporary directory holding the database; assigned in setup_module
+tmpd = None
+from wendelin.bigfile.tests.bench_0virtmem import filesize, blksize # to get comparable timings
+blen = filesize // blksize  # file length in blocks
+# precomputed adler32 digests for blen*blksize bytes of \0 and of \xff
+nulladler32 = nulladler32_bysize(blen * blksize)
+ffadler32   = ffadler32_bysize(blen * blksize)
+
+
+def setup_module():
+    """Create the temporary directory and commit a new ZBigFile as root['zfile']."""
+    global tmpd
+    tmpd = mkdtemp(suffix='', prefix='bigzodb.')
+
+    dbroot = dbopen('%s/1.fs' % tmpd)
+    dbroot['zfile'] = ZBigFile(blksize)
+    transaction.commit()
+
+    dbclose(dbroot)
+
+
+def teardown_module():
+    """Remove the temporary directory created by setup_module."""
+    rmtree(tmpd)
+
+
+# NOTE runs before _writeff
+def bench_bigz_readhole():
+    """Hash the not-yet-written file; the all-\\0 digest is expected."""
+    _bench_bigz_hash(Adler32, nulladler32)
+
+def bench_bigz_writeff():
+    """Fill the ZBigFile stored as root['zfile'] with \\xff bytes and commit."""
+    root = dbopen('%s/1.fs' % tmpd)
+    f   = root['zfile']
+    fh  = f.fileh_open()    # TODO + ram
+    vma = fh.mmap(0, blen)  # XXX assumes blksize == pagesize
+
+    memset(vma, 0xff)
+    transaction.commit()
+
+    # no explicit close() is called yet - references are dropped in the order
+    # mapping -> file handle -> file, and only then the database is closed
+    del vma # TODO vma.close()
+    del fh  # TODO fh.close()
+    del f   # XXX  f.close() ?
+    dbclose(root)
+
+
+def _bench_bigz_hash(hasher, expect):
+    """Hash the whole ZBigFile stored as root['zfile'] through its mapping.
+
+    `hasher` is called with no arguments to create a hashlib-like object;
+    its digest must equal `expect`.
+    """
+    root = dbopen('%s/1.fs' % tmpd)
+    f   = root['zfile']
+    fh  = f.fileh_open()    # TODO + ram
+    vma = fh.mmap(0, blen)  # XXX assumes blksize == pagesize
+
+    h = hasher()
+    h.update(vma)
+
+    # no explicit close() is called yet - references are dropped in the order
+    # mapping -> file handle -> file, and only then the database is closed
+    del vma # vma.close()
+    del fh  # fh.close()
+    del f   # f.close()
+    dbclose(root)
+    assert h.digest() == expect
+
+
+# presumably runs after bench_bigz_writeff - the all-\xff digest is expected
+def bench_bigz_read():
+    _bench_bigz_hash(Adler32, ffadler32)
--- a/lib/testing.py
+++ b/lib/testing.py
+# Wendelin. Testing utilities
+# Copyright (C) 2014-2015  Nexedi SA and Contributors.
+#                          Kirill Smelkov <kirr@nexedi.com>
+#
+# This program is free software: you can Use, Study, Modify and Redistribute
+# it under the terms of the GNU General Public License version 3, or (at your
+# option) any later version, as published by the Free Software Foundation.
+#
+# You can also Link and Combine this program with other software covered by
+# the terms of any of the Open Source Initiative approved licenses and Convey
+# the resulting work. Corresponding source of such a combination shall include
+# the source code for all other software used.
+#
+# This program is distributed WITHOUT ANY WARRANTY; without even the implied
+# warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
+#
+# See COPYING file for full licensing terms.
+
+from zlib import adler32
+from struct import pack
+import codecs
+import math
+
+# hashlib-like interface to adler32
+class Adler32:
+    """Incremental adler32 checksum with hashlib-style update()/digest()."""
+
+    def __init__(self):
+        # checksum of empty input is the starting value
+        self.v = adler32(b'')
+
+    def update(self, data):
+        """Fold `data` into the running checksum."""
+        self.v = adler32(data, self.v)
+
+    def digest(self):
+        """Return the current checksum packed as 4 big-endian bytes."""
+        # see zlib docs about 0xffffffff
+        checksum = self.v & 0xffffffff
+        return pack('>I', checksum)
+
+
+def _hex(*args):
+    """Decode every hex string in `args`; return the results as a tuple."""
+    decoded = [codecs.decode(hexstr, 'hex') for hexstr in args]
+    return tuple(decoded)
+
+# adler32('\0' * 2^n) for n = 0..30, indexed by n
+_nulladler32_byorder = _hex(
+    '00010001',    # 0
+    '00020001',    # 1
+    '00040001',    # 2
+    '00080001',    # 3
+    '00100001',    # 4
+    '00200001',    # 5
+    '00400001',    # 6
+    '00800001',    # 7
+    '01000001',    # 8
+    '02000001',    # 9
+    '04000001',    # 10
+    '08000001',    # 11
+    '10000001',    # 12
+    '20000001',    # 13
+    '40000001',    # 14
+    '80000001',    # 15
+    '000f0001',    # 16
+    '001e0001',    # 17
+    '003c0001',    # 18
+    '00780001',    # 19
+    '00f00001',    # 20
+    '01e00001',    # 21
+    '03c00001',    # 22
+    '07800001',    # 23
+    '0f000001',    # 24
+    '1e000001',    # 25
+    '3c000001',    # 26
+    '78000001',    # 27
+    'f0000001',    # 28
+    'e00f0001',    # 29
+    'c02d0001',    # 30
+)
+
+# adler32('\xff' * 2^n) for n = 0..30, indexed by n
+_ffadler32_byorder = _hex(
+    '01000100',    # 0
+    '02ff01ff',    # 1
+    '09fa03fd',    # 2
+    '23e407f9',    # 3
+    '87880ff1',    # 4
+    '0e2e1fe1',    # 5
+    '18983fc1',    # 6
+    '22207f81',    # 7
+    '0800ff01',    # 8
+    '1ef1fe10',    # 9
+    '79a6fc2e',    # 10
+    'e26bf86a',    # 11
+    '8161f0e2',    # 12
+    'f4a3e1d2',    # 13
+    'b0d9c3b2',    # 14
+    '7fc28772',    # 15
+    '77970ef2',    # 16
+    'cf5c1de3',    # 17
+    '1f7f3bc5',    # 18
+    '41c07789',    # 19
+    '8e88ef11',    # 20
+    '493fde30',    # 21
+    '430dbc6e',    # 22
+    '484778ea',    # 23
+    '9933f1d3',    # 24
+    '5509e3b4',    # 25
+    '3471c776',    # 26
+    '92408efa',    # 27
+    'ca071e02',    # 28
+    '2a2a3c03',    # 29
+    'ac6a7805',    # 30
+)
+
+
+# md5sum('\0' * (2^n)) for n = 0..30, indexed by n
+_nullmd5_byorder = _hex(
+    '93b885adfe0da089cdf634904fd59f71',    # 0
+    'c4103f122d27677c9db144cae1394a66',    # 1
+    'f1d3ff8443297732862df21dc4e57262',    # 2
+    '7dea362b3fac8e00956a4952a3d4f474',    # 3
+    '4ae71336e44bf9bf79d2752e234818a5',    # 4
+    '70bc8f4b72a86921468bf8e8441dce51',    # 5
+    '3b5d3c7d207e37dceeedd301e35e2e58',    # 6
+    'f09f35a5637839458e462e6350ecbce4',    # 7
+    '348a9791dc41b89796ec3808b5b5262f',    # 8
+    'bf619eac0cdf3f68d496ea9344137e8b',    # 9
+    '0f343b0931126a20f133d67c2b018a3b',    # 10
+    'c99a74c555371a433d121f551d6c6398',    # 11
+    '620f0b67a91f7f74151bc5be745b7110',    # 12
+    '0829f71740aab1ab98b33eae21dee122',    # 13
+    'ce338fe6899778aacfc28414f2d9498b',    # 14
+    'bb7df04e1b0a2570657527a7e108ae23',    # 15
+    'fcd6bcb56c1689fcef28b57c22475bad',    # 16
+    '0dfbe8aa4c20b52e1b8bf3cb6cbdf193',    # 17
+    'ec87a838931d4d5d2e94a04644788a55',    # 18
+    '59071590099d21dd439896592338bf95',    # 19
+    'b6d81b360a5672d80c27430f39153e2c',    # 20
+    'b2d1236c286a3c0704224fe4105eca49',    # 21
+    'b5cfa9d6c8febd618f91ac2843d50a1c',    # 22
+    '96995b58d4cbf6aaa9041b4f00c7f6ae',    # 23
+    '2c7ab85a893283e98c931e9511add182',    # 24
+    '58f06dd588d8ffb3beb46ada6309436b',    # 25
+    '7f614da9329cd3aebf59b91aadc30bf0',    # 26
+    'fde9e0818281836e4fc0edfede2b8762',    # 27
+    '1f5039e50bd66b290c56684d8550c6c2',    # 28
+    'aa559b4e3523a6c931f08f4df52d58f2',    # 29
+    'cd573cfaace07e7949bc0c46028904ff',    # 30
+)
+
+
+def ilog2_exact(x):
+    """Return n such that x == 2^n.
+
+    Raises ValueError if x is not a positive integral power of two.
+    """
+    n = int(x)
+    # n & (n-1) clears the lowest set bit - the result is 0 only when exactly
+    # one bit is set, i.e. n is a power of two
+    if n != x or n <= 0 or n & (n - 1):
+        raise ValueError('Only 2^n supported')
+    # computed on integers - int(math.log(x, 2)) goes through floats and can
+    # truncate to a wrong exponent when the quotient rounds just below n
+    return n.bit_length() - 1
+
+# lookup of precomputed digests by data size; size must be 2^n (see ilog2_exact)
+def nulladler32_bysize(size):
+    """Return the precomputed adler32 digest of `size` \\0 bytes."""
+    order = ilog2_exact(size)
+    return _nulladler32_byorder[order]
+
+def nullmd5_bysize(size):
+    """Return the precomputed md5 digest of `size` \\0 bytes."""
+    order = ilog2_exact(size)
+    return _nullmd5_byorder[order]
+
+def ffadler32_bysize(size):
+    """Return the precomputed adler32 digest of `size` \\xff bytes."""
+    order = ilog2_exact(size)
+    return _ffadler32_byorder[order]