Bugfixes in pystencils_walberla and lbmpy_walberla

- Added missing `#pragma once`.
- Changed a static variable to a class member in the overlap sweep; when the sweep was called with changing block sizes, the static variable led to wrong results.

Bugfixes in pystencils_walberla and lbmpy_walberla
b83706cd · Martin Bauer · 2712293e · b83706cd · b83706cd · b83706cd
Commit b83706cd authored 6 years ago by Martin Bauer
--- a/pystencils_walberla/templates/GpuPackInfo.tmpl.h
+++ b/pystencils_walberla/templates/GpuPackInfo.tmpl.h
+#pragma once
 #include "stencil/Directions.h"
 #include "core/cell/CellInterval.h"
 #include "cuda/GPUField.h"

--- a/pystencils_walberla/templates/SweepInnerOuter.tmpl.cpp
+++ b/pystencils_walberla/templates/SweepInnerOuter.tmpl.cpp
@@ -85,38 +85,36 @@ void {{class_name}}::inner( IBlock * block{%if target is equalto 'gpu'%} , cudaS
 void {{class_name}}::outer( IBlock * block{%if target is equalto 'gpu'%} , cudaStream_t stream {% endif %} )
 {
-    static std::vector<CellInterval> layers;
    {{kernel|generate_block_data_to_field_extraction|indent(4)}}
-    if( layers.size() == 0 )
+    if( layers_.size() == 0 )
    {
        CellInterval ci;
        {{field}}->getSliceBeforeGhostLayer(stencil::T, ci, 1, false);
-        layers.push_back(ci);
+        layers_.push_back(ci);
        {{field}}->getSliceBeforeGhostLayer(stencil::B, ci, 1, false);
-        layers.push_back(ci);
+        layers_.push_back(ci);
        {{field}}->getSliceBeforeGhostLayer(stencil::N, ci, 1, false);
        ci.expand(Cell(0, 0, -1));
-        layers.push_back(ci);
+        layers_.push_back(ci);
        {{field}}->getSliceBeforeGhostLayer(stencil::S, ci, 1, false);
        ci.expand(Cell(0, 0, -1));
-        layers.push_back(ci);
+        layers_.push_back(ci);
        {{field}}->getSliceBeforeGhostLayer(stencil::E, ci, 1, false);
        ci.expand(Cell(0, -1, -1));
-        layers.push_back(ci);
+        layers_.push_back(ci);
        {{field}}->getSliceBeforeGhostLayer(stencil::W, ci, 1, false);
        ci.expand(Cell(0, -1, -1));
-        layers.push_back(ci);
+        layers_.push_back(ci);
    }
    {%if target is equalto 'gpu'%}
    {
        auto parallelSection_ = parallelStreams_.parallelSection( stream );
-        for( auto & ci: layers )
+        for( auto & ci: layers_ )
        {
            parallelSection_.run([&]( auto s ) {
                {{kernel|generate_call(stream='s', cell_interval='ci')|indent(16)}}
@@ -124,7 +122,7 @@ void {{class_name}}::outer( IBlock * block{%if target is equalto 'gpu'%} , cudaS
        }
    }
    {% else %}
-    for( auto & ci: layers )
+    for( auto & ci: layers_ )
    {
        {{kernel|generate_call(cell_interval='ci')|indent(8)}}
    }

--- a/pystencils_walberla/templates/SweepInnerOuter.tmpl.h
+++ b/pystencils_walberla/templates/SweepInnerOuter.tmpl.h
@@ -97,6 +97,8 @@ private:
    {%if target is equalto 'gpu'%}
    cuda::ParallelStreams parallelStreams_;
    {% endif %}
+    std::vector<CellInterval> layers_;
 };