Skip to content
Snippets Groups Projects

Fix field size

Merged Markus Holzer requested to merge holzer/pystencils:FixFieldSize into master
Files
3
+ 37
9
@@ -59,6 +59,7 @@ from appdirs import user_cache_dir, user_config_dir
@@ -59,6 +59,7 @@ from appdirs import user_cache_dir, user_config_dir
from pystencils import FieldType
from pystencils import FieldType
from pystencils.backends.cbackend import generate_c, get_headers
from pystencils.backends.cbackend import generate_c, get_headers
 
from pystencils.data_types import cast_func, VectorType
from pystencils.include import get_pystencils_include_path
from pystencils.include import get_pystencils_include_path
from pystencils.kernel_wrapper import KernelWrapper
from pystencils.kernel_wrapper import KernelWrapper
from pystencils.utils import atomic_file_write, file_handle_for_atomic_write, recursive_dict_update
from pystencils.utils import atomic_file_write, file_handle_for_atomic_write, recursive_dict_update
@@ -266,7 +267,6 @@ type_mapping = {
@@ -266,7 +267,6 @@ type_mapping = {
np.complex128: (('PyComplex_RealAsDouble', 'PyComplex_ImagAsDouble'), 'ComplexDouble'),
np.complex128: (('PyComplex_RealAsDouble', 'PyComplex_ImagAsDouble'), 'ComplexDouble'),
}
}
template_extract_scalar = """
template_extract_scalar = """
PyObject * obj_{name} = PyDict_GetItemString(kwargs, "{name}");
PyObject * obj_{name} = PyDict_GetItemString(kwargs, "{name}");
if( obj_{name} == NULL) {{ PyErr_SetString(PyExc_TypeError, "Keyword argument '{name}' missing"); return NULL; }};
if( obj_{name} == NULL) {{ PyErr_SetString(PyExc_TypeError, "Keyword argument '{name}' missing"); return NULL; }};
@@ -357,7 +357,7 @@ def equal_size_check(fields):
@@ -357,7 +357,7 @@ def equal_size_check(fields):
return template_size_check.format(cond=cond)
return template_size_check.format(cond=cond)
def create_function_boilerplate_code(parameter_info, name, insert_checks=True):
def create_function_boilerplate_code(parameter_info, name, ast_node, insert_checks=True):
pre_call_code = ""
pre_call_code = ""
parameters = []
parameters = []
post_call_code = ""
post_call_code = ""
@@ -375,6 +375,25 @@ def create_function_boilerplate_code(parameter_info, name, insert_checks=True):
@@ -375,6 +375,25 @@ def create_function_boilerplate_code(parameter_info, name, insert_checks=True):
np_dtype = field.dtype.numpy_dtype
np_dtype = field.dtype.numpy_dtype
item_size = np_dtype.itemsize
item_size = np_dtype.itemsize
 
aligned = False
 
if ast_node.assignments:
 
aligned = any([a.lhs.args[2] for a in ast_node.assignments
 
if hasattr(a, 'lhs') and isinstance(a.lhs, cast_func)
 
and hasattr(a.lhs, 'dtype') and isinstance(a.lhs.dtype, VectorType)])
 
 
if ast_node.instruction_set and aligned:
 
byte_width = ast_node.instruction_set['width'] * item_size
 
offset = max(max(ast_node.ghost_layers)) * item_size
 
offset_cond = f"(((uintptr_t) buffer_{field.name}.buf) + {offset}) % {byte_width} == 0"
 
 
message = str(offset) + ". This is probably due to a different number of ghost_layers chosen for " \
 
"the arrays and the kernel creation. If the number of ghost layers for " \
 
"the kernel creation is not specified it will choose a suitable value " \
 
"automatically. This value might not " \
 
"be compatible with the allocated arrays."
 
pre_call_code += template_check_array.format(cond=offset_cond, what="offset", name=field.name,
 
expected=message)
 
if (np_dtype.isbuiltin and FieldType.is_generic(field)
if (np_dtype.isbuiltin and FieldType.is_generic(field)
and not np.issubdtype(field.dtype.numpy_dtype, np.complexfloating)):
and not np.issubdtype(field.dtype.numpy_dtype, np.complexfloating)):
dtype_cond = "buffer_{name}.format[0] == '{format}'".format(name=field.name,
dtype_cond = "buffer_{name}.format[0] == '{format}'".format(name=field.name,
@@ -418,7 +437,7 @@ def create_function_boilerplate_code(parameter_info, name, insert_checks=True):
@@ -418,7 +437,7 @@ def create_function_boilerplate_code(parameter_info, name, insert_checks=True):
extract_function_imag=extract_function[1],
extract_function_imag=extract_function[1],
target_type=target_type,
target_type=target_type,
real_type="float" if target_type == "ComplexFloat"
real_type="float" if target_type == "ComplexFloat"
else "double",
else "double",
name=param.symbol.name)
name=param.symbol.name)
else:
else:
pre_call_code += template_extract_scalar.format(extract_function=extract_function,
pre_call_code += template_extract_scalar.format(extract_function=extract_function,
@@ -475,12 +494,13 @@ def run_compile_step(command):
@@ -475,12 +494,13 @@ def run_compile_step(command):
class ExtensionModuleCode:
class ExtensionModuleCode:
def __init__(self, module_name='generated', custom_backend=None):
def __init__(self, module_name='generated', custom_backend=None, generated_code=None):
self.module_name = module_name
self.module_name = module_name
self._ast_nodes = []
self._ast_nodes = []
self._function_names = []
self._function_names = []
self._custom_backend = custom_backend
self._custom_backend = custom_backend
 
self._generated_code = generated_code
def add_function(self, ast, name=None):
def add_function(self, ast, name=None):
self._ast_nodes.append(ast)
self._ast_nodes.append(ast)
@@ -504,8 +524,11 @@ class ExtensionModuleCode:
@@ -504,8 +524,11 @@ class ExtensionModuleCode:
for ast, name in zip(self._ast_nodes, self._function_names):
for ast, name in zip(self._ast_nodes, self._function_names):
old_name = ast.function_name
old_name = ast.function_name
ast.function_name = "kernel_" + name
ast.function_name = "kernel_" + name
print(generate_c(ast, custom_backend=self._custom_backend), file=file)
if self._generated_code:
print(create_function_boilerplate_code(ast.get_parameters(), name), file=file)
print(self._generated_code, file=file)
 
else:
 
print(generate_c(ast, custom_backend=self._custom_backend), file=file)
 
print(create_function_boilerplate_code(ast.get_parameters(), name, ast), file=file)
ast.function_name = old_name
ast.function_name = old_name
print(create_module_boilerplate_code(self.module_name, self._function_names), file=file)
print(create_module_boilerplate_code(self.module_name, self._function_names), file=file)
@@ -564,9 +587,14 @@ def compile_module(code, code_hash, base_dir):
@@ -564,9 +587,14 @@ def compile_module(code, code_hash, base_dir):
def compile_and_load(ast, custom_backend=None):
def compile_and_load(ast, custom_backend=None):
cache_config = get_cache_config()
cache_config = get_cache_config()
code_hash_str = "mod_" + hashlib.sha256(generate_c(ast, dialect='c',
custom_backend=custom_backend).encode()).hexdigest()
generated_code = generate_c(ast, dialect='c', custom_backend=custom_backend)
code = ExtensionModuleCode(module_name=code_hash_str, custom_backend=custom_backend)
fields_accessed = str(ast.fields_accessed)
 
 
# The hash string must also include the field information (and thus the field sizes): due to padding,

# the generated code can look the same for different field sizes.
 
code_hash_str = "mod_" + hashlib.sha256((generated_code + fields_accessed).encode()).hexdigest()
 
code = ExtensionModuleCode(module_name=code_hash_str, custom_backend=custom_backend, generated_code=generated_code)
code.add_function(ast, ast.function_name)
code.add_function(ast, ast.function_name)
if cache_config['object_cache'] is False:
if cache_config['object_cache'] is False:
Loading