Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 20 additions & 1 deletion meson.build
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ project(
check: true
).stdout().strip(),
default_options: [
'c_std=c11',
'buildtype=release',
]
)
Expand All @@ -18,6 +19,13 @@ c_args = ['-DNDEBUG']
thread_dep = dependency('threads')

cc = meson.get_compiler('c')
if cc.get_id() == 'msvc'
add_project_arguments(
'/experimental:c11atomics',
language: 'c'
)
endif

mkl_dep = dependency('MKL', method: 'cmake',
modules: ['MKL::MKL'],
cmake_args: [
Expand All @@ -43,7 +51,7 @@ py.extension_module(
subdir: 'mkl'
)

# Cython extension
# Cython extensions
py.extension_module(
'_py_mkl_service',
sources: ['mkl/_py_mkl_service.pyx'],
Expand All @@ -54,6 +62,17 @@ py.extension_module(
subdir: 'mkl'
)

py.extension_module(
'_mkl_memory',
sources: ['mkl/_mkl_memory.pyx'],
dependencies: [mkl_dep],
c_args: c_args,
install_rpath: rpath,
install: true,
subdir: 'mkl'
)


# Python sources
py.install_sources(
[
Expand Down
1 change: 1 addition & 0 deletions mkl/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -57,6 +57,7 @@ def __exit__(self, *args):
del RTLD_for_MKL
del sys

from ._mkl_memory import MKLMemory
from ._py_mkl_service import *
from ._version import __version__

Expand Down
231 changes: 231 additions & 0 deletions mkl/_mkl_memory.pyx
Original file line number Diff line number Diff line change
@@ -0,0 +1,231 @@
# Copyright (c) 2018, Intel Corporation
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# * Redistributions of source code must retain the above copyright notice,
# this list of conditions and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
# * Neither the name of Intel Corporation nor the names of its contributors
# may be used to endorse or promote products derived from this software
# without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

# distutils: language = c
# cython: language_level=3

import numbers

from cpython cimport Py_buffer
from libc.string cimport memcpy

from mkl._mkl_service cimport mkl_calloc, mkl_free, mkl_malloc, mkl_realloc


cdef extern from "stdatomic.h" nogil:
ctypedef int atomic_int "_Atomic int"
void atomic_init(atomic_int *obj, int value)
int atomic_fetch_add(atomic_int *obj, int value)
int atomic_fetch_sub(atomic_int *obj, int value)
int atomic_load(atomic_int *obj)


def _mkl_memory_from_bytes(bytes data, Py_ssize_t alignment):
cdef Py_ssize_t nbytes = len(data)
cdef MKLMemory mem = MKLMemory(nbytes, alignment=alignment)

cdef void *dst = mem._memory_ptr
cdef char *src = data

with nogil:
memcpy(dst, src, nbytes)

return mem


cdef class MKLMemory:
cdef void *_memory_ptr
cdef Py_ssize_t nbytes
cdef Py_ssize_t alignment
cdef atomic_int exported_buffers

cdef _cinit_empty(self):
self._memory_ptr = NULL
self.nbytes = 0
self.alignment = 0
atomic_init(&self.exported_buffers, 0)

cdef _cinit_malloc(self, Py_ssize_t nbytes, Py_ssize_t alignment):
self._cinit_empty()

if (nbytes > 0):
with nogil:
p = mkl_malloc(nbytes, alignment)

if (p):
self._memory_ptr = p
self.nbytes = nbytes
self.alignment = alignment
else:
raise MemoryError(
"MKL memory allocation failed."
)
else:
raise ValueError(
"Number of bytes of requested allocation must be positive."
)

cdef _cinit_calloc(self, Py_ssize_t num, Py_ssize_t size, Py_ssize_t alignment):
self._cinit_empty()

if (num > 0 and size > 0):
with nogil:
p = mkl_calloc(num, size, alignment)

if (p):
self._memory_ptr = p
self.nbytes = num * size
self.alignment = alignment
else:
raise MemoryError(
"MKL memory allocation failed."
)
else:
raise ValueError(
"Number of elements and size of requested allocation must be "
"positive."
)

cdef _cinit_mklmemory(self, object other, Py_ssize_t alignment):
other_mem = <MKLMemory> other

self._cinit_malloc(other_mem.nbytes, alignment)
with nogil:
memcpy(self._memory_ptr, other_mem._memory_ptr, self.nbytes)

def __cinit__(self, *args, **kwargs):
cdef Py_ssize_t alignment

n_args = len(args)
if not (0 < n_args < 3):
raise TypeError(
"MKLMemory constructor takes 1 or 2 arguments, but "
f"{n_args} were given"
)
if n_args == 1:
arg = args[0]
if isinstance(arg, numbers.Integral):
alignment = kwargs.get("alignment", 64)
self._cinit_malloc(arg, alignment)
elif isinstance(arg, MKLMemory):
alignment = kwargs.get("alignment", arg.alignment)
self._cinit_mklmemory(arg, alignment)
else:
raise TypeError(
"MKLMemory single argument constructor expects an integer "
f"or MKLMemory instance, but got {type(arg)}"
)

elif n_args == 2:
arg0, arg1 = args[0], args[1]
alignment = kwargs.get("alignment", 64)
if not isinstance(arg0, numbers.Integral):
raise TypeError(
"MKLMemory constructor expects first argument "
f"to be an integer, but got {type(arg0)}"
)
if not isinstance(arg1, numbers.Integral):
raise TypeError(
"MKLMemory constructor expects second argument "
f"to be an integer, but got {type(arg1)}"
)
self._cinit_calloc(arg0, arg1, alignment)

def __dealloc__(self):
if not (self._memory_ptr is NULL):
mkl_free(self._memory_ptr)
self._cinit_empty()

cdef void *get_data_ptr(self):
return self._memory_ptr

def __getbuffer__(self, Py_buffer *buffer, int flags):
buffer.buf = <void *>self._memory_ptr
buffer.format = "B" # byte
buffer.internal = NULL # see References
buffer.itemsize = 1
buffer.len = self.nbytes
buffer.ndim = 1
buffer.obj = self
buffer.readonly = 0
buffer.shape = &self.nbytes
buffer.strides = &buffer.itemsize
buffer.suboffsets = NULL # for pointer arrays only

atomic_fetch_add(&self.exported_buffers, 1)

def __releasebuffer__(self, Py_buffer *buffer):
atomic_fetch_sub(&self.exported_buffers, 1)

def realloc(self, Py_ssize_t new_nbytes):
if atomic_load(&self.exported_buffers) > 0:
raise BufferError("Cannot realloc memory while there are exported buffers.")
if new_nbytes <= 0:
raise ValueError("New number of bytes must be positive.")

cdef void *p
with nogil:
p = mkl_realloc(self._memory_ptr, new_nbytes)

if not p:
raise MemoryError("MKL memory reallocation failed.")

self._memory_ptr = p
self.nbytes = new_nbytes

def tobytes(self):
cdef char* data_ptr = <char*>self._memory_ptr
return data_ptr[:self.nbytes]

@property
def nbytes(self):
return self.nbytes

@property
def size(self):
return self.nbytes

@property
def alignment(self):
return self.alignment

@property
def _pointer(self):
return <size_t>(self._memory_ptr)

def __repr__(self):
return (
f"<MKL memory allocation of {self.nbytes} bytes at "
f"{hex(<object>(<size_t>self._memory_ptr))}>"
)

def __len__(self):
return self.nbytes

def __sizeof__(self):
return self.nbytes

def __reduce__(self):
return (_mkl_memory_from_bytes, (self.tobytes(), self.alignment))
6 changes: 5 additions & 1 deletion mkl/_mkl_service.pxd
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ ctypedef unsigned long long MKL_UINT64
ctypedef int MKL_INT


cdef extern from "mkl.h":
cdef extern from "mkl.h" nogil:
# MKL Function Domains Constants
int MKL_DOMAIN_BLAS
int MKL_DOMAIN_FFT
Expand Down Expand Up @@ -151,6 +151,10 @@ cdef extern from "mkl.h":
MKL_INT64 mkl_mem_stat(int* buf)
MKL_INT64 mkl_peak_mem_usage(int mode)
int mkl_set_memory_limit(int mem_type, size_t limit)
void *mkl_malloc(size_t size, int alignment)
void *mkl_realloc(void *ptr, size_t size)
void *mkl_calloc(size_t num, size_t size, int alignment)
void mkl_free(void *ptr)

# Conditional Numerical Reproducibility
int mkl_cbwr_set(int settings)
Expand Down
6 changes: 4 additions & 2 deletions mkl/_py_mkl_service.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -601,7 +601,8 @@ cdef inline void __free_buffers() noexcept:
"""
Frees unused memory allocated by the Intel(R) MKL Memory Allocator.
"""
mkl.mkl_free_buffers()
with nogil:
mkl.mkl_free_buffers()
return


Expand All @@ -610,7 +611,8 @@ cdef inline void __thread_free_buffers() noexcept:
Frees unused memory allocated by the Intel(R) MKL Memory Allocator in the current
thread.
"""
mkl.mkl_thread_free_buffers()
with nogil:
mkl.mkl_thread_free_buffers()
return


Expand Down
Loading
Loading