Commit a54b1631 authored by Mark Florisson's avatar Mark Florisson

Support atomics in acquisition counting

parent 0e579823
...@@ -723,11 +723,15 @@ memviewslice_declare_code = load_memview_c_utility( ...@@ -723,11 +723,15 @@ memviewslice_declare_code = load_memview_c_utility(
proto_block='utility_code_proto_before_types', proto_block='utility_code_proto_before_types',
context=context) context=context)
atomic_utility = load_memview_c_utility("Atomics", context,
proto_block='utility_code_proto_before_types')
memviewslice_init_code = load_memview_c_utility( memviewslice_init_code = load_memview_c_utility(
"MemviewSliceInit", "MemviewSliceInit",
context=dict(context, BUF_MAX_NDIMS=Options.buffer_max_dims), context=dict(context, BUF_MAX_NDIMS=Options.buffer_max_dims),
requires=[memviewslice_declare_code, requires=[memviewslice_declare_code,
Buffer.acquire_utility_code], Buffer.acquire_utility_code,
atomic_utility],
) )
memviewslice_index_helpers = load_memview_c_utility("MemviewSliceIndex") memviewslice_index_helpers = load_memview_c_utility("MemviewSliceIndex")
...@@ -737,7 +741,11 @@ typeinfo_to_format_code = load_memview_cy_utility( ...@@ -737,7 +741,11 @@ typeinfo_to_format_code = load_memview_cy_utility(
is_contig_utility = load_memview_c_utility("MemviewSliceIsContig", context) is_contig_utility = load_memview_c_utility("MemviewSliceIsContig", context)
overlapping_utility = load_memview_c_utility("OverlappingSlices", context) overlapping_utility = load_memview_c_utility("OverlappingSlices", context)
copy_contents_new_utility = load_memview_c_utility("MemviewSliceCopyTemplate", context) copy_contents_new_utility = load_memview_c_utility(
"MemviewSliceCopyTemplate",
context,
requires=[], # require cython_array_utility_code
)
view_utility_code = load_memview_cy_utility( view_utility_code = load_memview_cy_utility(
"View.MemoryView", "View.MemoryView",
...@@ -756,6 +764,8 @@ cython_array_utility_code = load_memview_cy_utility( ...@@ -756,6 +764,8 @@ cython_array_utility_code = load_memview_cy_utility(
context=context, context=context,
requires=[view_utility_code]) requires=[view_utility_code])
copy_contents_new_utility.requires.append(cython_array_utility_code)
# memview_fromslice_utility_code = load_memview_cy_utility( # memview_fromslice_utility_code = load_memview_cy_utility(
# "MemviewFromSlice", # "MemviewFromSlice",
# context=context, # context=context,
......
...@@ -237,6 +237,9 @@ cdef extern from *: ...@@ -237,6 +237,9 @@ cdef extern from *:
PyBUF_STRIDES PyBUF_STRIDES
PyBUF_INDIRECT PyBUF_INDIRECT
cdef extern from *:
ctypedef int __pyx_atomic_int
cdef extern from "stdlib.h": cdef extern from "stdlib.h":
void *malloc(size_t) nogil void *malloc(size_t) nogil
void free(void *) nogil void free(void *) nogil
...@@ -283,7 +286,7 @@ cdef class memoryview(object): ...@@ -283,7 +286,7 @@ cdef class memoryview(object):
cdef object _size cdef object _size
cdef object _array_interface cdef object _array_interface
cdef PyThread_type_lock lock cdef PyThread_type_lock lock
cdef int acquisition_count cdef __pyx_atomic_int acquisition_count
cdef Py_buffer view cdef Py_buffer view
cdef int flags cdef int flags
......
...@@ -11,6 +11,113 @@ typedef struct { ...@@ -11,6 +11,113 @@ typedef struct {
Py_ssize_t suboffsets[{{max_dims}}]; Py_ssize_t suboffsets[{{max_dims}}];
} {{memviewslice_name}}; } {{memviewslice_name}};
/////////// Atomics.proto /////////////
#include <pythread.h>
#ifndef CYTHON_ATOMICS
#define CYTHON_ATOMICS 1
#endif
/* todo: Portland pgcc, maybe OS X's OSAtomicIncrement32,
libatomic + autotools-like distutils support? Such a pain... */
#if CYTHON_ATOMICS && __GNUC__ >= 4 && (__GNUC_MINOR__ > 1 || \
(__GNUC_MINOR__ == 1 && __GNUC_PATHLEVEL >= 2))
/* gcc >= 4.1.2 */
typedef volatile int __pyx_atomic_int;
#define __pyx_atomic_incr_aligned(value, lock) __sync_fetch_and_add(value, 1)
#define __pyx_atomic_decr_aligned(value, lock) __sync_fetch_and_sub(value, 1)
#ifdef __PYX_DEBUG_ATOMICS
#warning "Using GNU atomics"
#endif
#elif CYTHON_ATOMICS && MSC_VER
/* msvc */
#include <Windows.h>
typedef volatile LONG __pyx_atomic_int;
#define __pyx_atomic_incr_aligned(value, lock) InterlockedIncrement(value)
#define __pyx_atomic_decr_aligned(value, lock) InterlockedDecrement(value)
#ifdef __PYX_DEBUG_ATOMICS
#warning "Using MSVC atomics"
#endif
#elif CYTHON_ATOMICS && (defined(__ICC) || defined(__INTEL_COMPILER))
typedef volatile int __pyx_atomic_int;
#define __pyx_atomic_incr_aligned(value, lock) _InterlockedIncrement(value)
#define __pyx_atomic_decr_aligned(value, lock) _InterlockedDecrement(value)
#ifdef __PYX_DEBUG_ATOMICS
#warning "Using Intel atomics"
#endif
#else
typedef volatile int __pyx_atomic_int;
#define CYTHON_ATOMICS 0
#ifdef __PYX_DEBUG_ATOMICS
#warning "Not using atomics"
#endif
#endif
#if CYTHON_ATOMICS
__pyx_atomic_int CYTHON_INLINE
__pyx_atomic_incr_maybealigned(__pyx_atomic_int *value, PyThread_type_lock lock);
__pyx_atomic_int CYTHON_INLINE
__pyx_atomic_decr_maybealigned(__pyx_atomic_int *value, PyThread_type_lock lock);
#define __pyx_add_acquisition_count(memview) \
__pyx_atomic_incr_maybealigned(&memview->acquisition_count, memview->lock)
#define __pyx_sub_acquisition_count(memview) \
__pyx_atomic_decr_maybealigned(&memview->acquisition_count, memview->lock)
#else
#define __pyx_add_acquisition_count(memview) \
__pyx_add_acquisition_count_locked(&memview->acquisition_count, memview->lock)
#define __pyx_sub_acquisition_count(memview) \
__pyx_sub_acquisition_count_locked(&memview->acquisition_count, memview->lock)
#endif
////////// Atomics //////////
#if CYTHON_ATOMICS
#define __pyx_check_unaligned(type, pointer) \
(((type) pointer) & (sizeof(pointer) - 1))
int CYTHON_INLINE
__pyx_atomic_unaligned(__pyx_atomic_int *p)
{
/* uintptr_t is optional in C99, try other stuff */
if (sizeof(unsigned long) >= sizeof(p))
return __pyx_check_unaligned(unsigned long, p);
else if (sizeof(size_t) >= sizeof(p))
return __pyx_check_unaligned(size_t, p);
#if __STDC_VERSION__ >= 199901L
if (sizeof(unsigned long long) >= sizeof(p))
return __pyx_check_unaligned(unsigned long long, p);
#endif
return 1;
}
__pyx_atomic_int CYTHON_INLINE
__pyx_atomic_incr_maybealigned(__pyx_atomic_int *value, PyThread_type_lock lock)
{
if (unlikely(__pyx_atomic_unaligned(value)))
return __pyx_add_acquisition_count_locked(value, lock);
else
return __pyx_atomic_incr_aligned(value, lock);
}
__pyx_atomic_int CYTHON_INLINE
__pyx_atomic_decr_maybealigned(__pyx_atomic_int *value, PyThread_type_lock lock)
{
if (unlikely(__pyx_atomic_unaligned(value)))
return __pyx_sub_acquisition_count_locked(value, lock);
else
return __pyx_atomic_decr_aligned(value, lock);
}
#endif
/////////////// ObjectToMemviewSlice.proto /////////////// /////////////// ObjectToMemviewSlice.proto ///////////////
static CYTHON_INLINE {{memviewslice_name}} {{funcname}}(PyObject *); static CYTHON_INLINE {{memviewslice_name}} {{funcname}}(PyObject *);
...@@ -37,8 +144,10 @@ static int __Pyx_init_memviewslice( ...@@ -37,8 +144,10 @@ static int __Pyx_init_memviewslice(
int ndim, int ndim,
__Pyx_memviewslice *memviewslice); __Pyx_memviewslice *memviewslice);
static int CYTHON_INLINE __pyx_add_acquisition_count(struct {{memview_struct_name}} *memview); static int CYTHON_INLINE __pyx_add_acquisition_count_locked(__pyx_atomic_int *acquisition_count,
static int CYTHON_INLINE __pyx_del_acquisition_count(struct {{memview_struct_name}} *memview); PyThread_type_lock lock);
static int CYTHON_INLINE __pyx_sub_acquisition_count_locked(__pyx_atomic_int *acquisition_count,
PyThread_type_lock lock);
#define __PYX_INC_MEMVIEW(slice, have_gil) __Pyx_INC_MEMVIEW(slice, have_gil, __LINE__) #define __PYX_INC_MEMVIEW(slice, have_gil) __Pyx_INC_MEMVIEW(slice, have_gil, __LINE__)
#define __PYX_XDEC_MEMVIEW(slice, have_gil) __Pyx_XDEC_MEMVIEW(slice, have_gil, __LINE__) #define __PYX_XDEC_MEMVIEW(slice, have_gil) __Pyx_XDEC_MEMVIEW(slice, have_gil, __LINE__)
static CYTHON_INLINE void __Pyx_INC_MEMVIEW({{memviewslice_name}} *, int, int); static CYTHON_INLINE void __Pyx_INC_MEMVIEW({{memviewslice_name}} *, int, int);
...@@ -277,22 +386,24 @@ static CYTHON_INLINE void __pyx_fatalerror(const char *fmt, ...) { ...@@ -277,22 +386,24 @@ static CYTHON_INLINE void __pyx_fatalerror(const char *fmt, ...) {
} }
static int CYTHON_INLINE static int CYTHON_INLINE
__pyx_add_acquisition_count(struct {{memview_struct_name}} *memview) __pyx_add_acquisition_count_locked(__pyx_atomic_int *acquisition_count,
PyThread_type_lock lock)
{ {
int result; int result;
PyThread_acquire_lock(memview->lock, 1); PyThread_acquire_lock(lock, 1);
result = memview->acquisition_count++; result = (*acquisition_count)++;
PyThread_release_lock(memview->lock); PyThread_release_lock(lock);
return result; return result;
} }
static int CYTHON_INLINE static int CYTHON_INLINE
__pyx_del_acquisition_count(struct {{memview_struct_name}} *memview) __pyx_sub_acquisition_count_locked(__pyx_atomic_int *acquisition_count,
PyThread_type_lock lock)
{ {
int result; int result;
PyThread_acquire_lock(memview->lock, 1); PyThread_acquire_lock(lock, 1);
result = memview->acquisition_count--; result = (*acquisition_count)--;
PyThread_release_lock(memview->lock); PyThread_release_lock(lock);
return result; return result;
} }
...@@ -333,7 +444,7 @@ static CYTHON_INLINE void __Pyx_XDEC_MEMVIEW({{memviewslice_name}} *memslice, ...@@ -333,7 +444,7 @@ static CYTHON_INLINE void __Pyx_XDEC_MEMVIEW({{memviewslice_name}} *memslice,
__pyx_fatalerror("Acquisition count is %d (line %d)", __pyx_fatalerror("Acquisition count is %d (line %d)",
memview->acquisition_count, lineno); memview->acquisition_count, lineno);
last_time = __pyx_del_acquisition_count(memview) == 1; last_time = __pyx_sub_acquisition_count(memview) == 1;
memslice->data = NULL; memslice->data = NULL;
if (last_time) { if (last_time) {
if (have_gil) { if (have_gil) {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment