Add extra_source_files, extra_cuda_flags and with_cuda options to TorchModule.compile and comment out the GOOGLE_CUDA/Eigen block in the module template

26df2dfb · Stephan Seitz · c143c626 · 26df2dfb · 26df2dfb · 26df2dfb
Commit 26df2dfb authored 5 years ago by Stephan Seitz
--- a/src/pystencils_autodiff/backends/astnodes.py
+++ b/src/pystencils_autodiff/backends/astnodes.py
@@ -137,7 +137,7 @@ class TorchModule(JinjaCppFile):
        return WrapperFunction(cls.DESTRUCTURING_CLASS(generate_kernel_call(kernel_ast)),
                               function_name='call_' + kernel_ast.function_name)
-    def compile(self):
+    def compile(self, extra_source_files=[], extra_cuda_flags=[], with_cuda=None):
        from torch.utils.cpp_extension import load
        file_extension = '.cu' if self.is_cuda else '.cpp'
        source_code = str(self)
@@ -155,10 +155,12 @@ class TorchModule(JinjaCppFile):
        os.environ['CXX'] = get_compiler_config()['command']
        torch_extension = load(hash,
-                               [file_name],
+                               [file_name] + extra_source_files,
-                               with_cuda=self.is_cuda,
+                               with_cuda=self.is_cuda or with_cuda,
-                               extra_cflags=['--std=c++14', get_compiler_config()['flags'].replace('--std=c++11', '')],
+                               extra_cflags=['--std=c++14', get_compiler_config()
-                               extra_cuda_cflags=['-std=c++14', '-ccbin', get_compiler_config()['command']],
+                                             ['flags'].replace('--std=c++11', '')],
+                               extra_cuda_cflags=['-std=c++14', '-ccbin',
+                                                  get_compiler_config()['command']] + extra_cuda_flags,
                               build_directory=build_dir,
                               extra_include_paths=[get_pycuda_include_path(),
                                                    get_pystencils_include_path(),

--- a/src/pystencils_autodiff/backends/module.tmpl.cpp
+++ b/src/pystencils_autodiff/backends/module.tmpl.cpp
 #define RESTRICT __restrict__
-#if GOOGLE_CUDA
+//#if GOOGLE_CUDA
-#define EIGEN_USE_GPU
+//#define EIGEN_USE_GPU
-#include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor"
+//#include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor"
-#endif
+//#endif
 {% for header in headers -%}
 #include {{ header }}

--- a/src/pystencils_autodiff/framework_integration/astnodes.py
+++ b/src/pystencils_autodiff/framework_integration/astnodes.py
@@ -369,14 +369,18 @@ class CustomFunctionDeclaration(JinjaCppFile):
 class CustomFunctionCall(JinjaCppFile):
    TEMPLATE = jinja2.Template("""{{function_name}}({{ args | join(', ') }});""", undefined=jinja2.StrictUndefined)
-    def __init__(self, function_name, *args, fields_accessed=[]):
+    def __init__(self, function_name, *args, fields_accessed=[], custom_signature=None):
        ast_dict = {
            'function_name': function_name,
            'args': args,
            'fields_accessed': [f.center for f in fields_accessed]
        }
        super().__init__(ast_dict)
-        self.required_global_declarations = [CustomFunctionDeclaration(self.ast_dict.function_name, self.ast_dict.args)]
+        if custom_signature:
+            self.required_global_declarations = [CustomCodeNode(custom_signature, (), ())]
+        else:
+            self.required_global_declarations = [CustomFunctionDeclaration(
+                self.ast_dict.function_name, self.ast_dict.args)]
    @property
    def symbols_defined(self):