Skip to content
Snippets Groups Projects
Select Git revision
  • c78e6088ed55249ae77678472accfd7a4300ad45
  • master default protected
  • v2.0-dev protected
  • zikeliml/Task-96-dotExporterForAST
  • zikeliml/124-rework-tutorials
  • fma
  • fhennig/v2.0-deprecations
  • holzer-master-patch-46757
  • 66-absolute-access-is-probably-not-copied-correctly-after-_eval_subs
  • gpu_bufferfield_fix
  • hyteg
  • vectorization_sqrt_fix
  • target_dh_refactoring
  • const_fix
  • improved_comm
  • gpu_liveness_opts
  • release/1.3.7 protected
  • release/1.3.6 protected
  • release/2.0.dev0 protected
  • release/1.3.5 protected
  • release/1.3.4 protected
  • release/1.3.3 protected
  • release/1.3.2 protected
  • release/1.3.1 protected
  • release/1.3 protected
  • release/1.2 protected
  • release/1.1.1 protected
  • release/1.1 protected
  • release/1.0.1 protected
  • release/1.0 protected
  • release/0.4.4 protected
  • last/Kerncraft
  • last/OpenCL
  • last/LLVM
  • release/0.4.3 protected
  • release/0.4.2 protected
36 results

test_fd_derivation.ipynb

Blame
  • test_blocking.py 3.37 KiB
    import numpy as np
    import sympy as sp
    import pytest
    
    import pystencils as ps
    
    
    def jacobi(dst, src):
        """Build the assignment ``dst.center = mean of src's direct neighbors``.

        For every spatial dimension of ``src`` the neighbors at offsets +1 and -1
        are collected; their sum divided by their count is assigned to the
        center of ``dst``.

        Both fields must have the same number of spatial dimensions and no
        index dimensions (checked with assertions).
        """
        assert dst.spatial_dimensions == src.spatial_dimensions
        assert src.index_dimensions == 0
        assert dst.index_dimensions == 0
        # Order matches the nested iteration: dimension-major, +1 before -1.
        stencil_accesses = [
            src.neighbor(axis, step)
            for axis in range(src.spatial_dimensions)
            for step in (1, -1)
        ]
        target = dst.center
        average = sp.Add(*stencil_accesses) / len(stencil_accesses)
        return ps.Assignment(target, average)
    
    
    def check_equivalence(assignments, src_arr):
        """Check that blocked and OpenMP-only kernels match the plain kernel.

        For each combination of ``cpu_openmp`` (off/on) and ``cpu_vectorize_info``
        (off / ``assume_inner_stride_one``) two kernels are compiled: one with
        ``cpu_blocking=(8, 16, 4)`` and one with ``cpu_blocking=(0, 16, 0)``.
        Their output, and the output of a kernel created with ``cpu_openmp=2``,
        is compared against a kernel created with default settings.

        Args:
            assignments: Passed unchanged to ``ps.create_kernel``.
            src_arr: Array passed as the ``src`` kernel argument. It is
                overwritten in place with fresh random values in every
                iteration; destination arrays are made with ``np.zeros_like``
                from it.

        Raises:
            AssertionError: Raised by ``np.testing.assert_almost_equal`` when a
                result differs from the reference.
        """
        # Neither of these kernels depends on the loop variables below, so they
        # are created and compiled once instead of once per combination.
        without_blocking = ps.create_kernel(assignments).compile()
        only_omp = ps.create_kernel(assignments, cpu_openmp=2).compile()

        for openmp in (False, True):
            for vectorization in [False, {'assume_inner_stride_one': True}]:
                with_blocking = ps.create_kernel(assignments, cpu_blocking=(8, 16, 4), cpu_openmp=openmp,
                                                 cpu_vectorize_info=vectorization).compile()
                with_blocking_only_over_y = ps.create_kernel(assignments, cpu_blocking=(0, 16, 0), cpu_openmp=openmp,
                                                             cpu_vectorize_info=vectorization).compile()

                print(f"  openmp {openmp}, vectorization {vectorization}")
                dst_arr = np.zeros_like(src_arr)
                dst2_arr = np.zeros_like(src_arr)
                dst3_arr = np.zeros_like(src_arr)
                ref_arr = np.zeros_like(src_arr)
                # Fresh random input for every configuration.
                np.copyto(src_arr, np.random.rand(*src_arr.shape))
                with_blocking(src=src_arr, dst=dst_arr)
                with_blocking_only_over_y(src=src_arr, dst=dst2_arr)
                without_blocking(src=src_arr, dst=ref_arr)
                only_omp(src=src_arr, dst=dst3_arr)
                np.testing.assert_almost_equal(ref_arr, dst_arr)
                np.testing.assert_almost_equal(ref_arr, dst2_arr)
                np.testing.assert_almost_equal(ref_arr, dst3_arr)
    
    
    @pytest.mark.xfail(reason="CPU blocking is not yet implemented in the new backend")
    def test_jacobi3d_var_size():
        """Run the equivalence check for ``double[3D]`` fields on three array shapes."""
        src, dst = ps.fields("src, dst: double[3D]", layout='c')
        # (printed label, array shape) pairs, processed in this order.
        scenarios = (
            ("Var Size: Smaller than block sizes", [4, 5, 6]),
            ("Var Size: Large non divisible sizes", [100, 80, 9]),
            ("Var Size: Multiples of block sizes", [8*4, 16*2, 4*3]),
        )
        for label, shape in scenarios:
            print(label)
            data = np.empty(shape)
            check_equivalence(jacobi(dst, src), data)
    
    
    @pytest.mark.xfail(reason="CPU blocking is not yet implemented in the new backend")
    def test_jacobi3d_fixed_size():
        """Run the equivalence check with fields created from concrete arrays.

        For each shape a new array is allocated and both ``src`` and ``dst``
        fields are created from it before the check runs.
        """
        # (printed label, array shape) pairs, processed in this order.
        scenarios = (
            ("Fixed Size: Large non divisible sizes", [10, 10, 9]),
            ("Fixed Size: Smaller than block sizes", [4, 5, 6]),
            ("Fixed Size: Multiples of block sizes", [8*4, 16*2, 4*3]),
        )
        for label, shape in scenarios:
            print(label)
            data = np.empty(shape)
            src, dst = ps.fields("src, dst: double[3D]", src=data, dst=data)
            check_equivalence(jacobi(dst, src), data)
    
    
    @pytest.mark.xfail(reason="CPU blocking is not yet implemented in the new backend")
    def test_jacobi3d_fixed_field_size():
        """Run the equivalence check for fields declared as ``double[3, 5, 6]``."""
        src, dst = ps.fields("src, dst: double[3, 5, 6]", layout='c')
        print("Fixed Field Size: Smaller than block sizes")
        # Array shape matches the size given in the field declaration.
        data = np.empty([3, 5, 6])
        update_rule = jacobi(dst, src)
        check_equivalence(update_rule, data)