Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
pystencils
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Wiki
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Model registry
Operate
Environments
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
Alexander Reinauer
pystencils
Commits
269c0bfa
Commit
269c0bfa
authored
4 years ago
by
Markus Holzer
Browse files
Options
Downloads
Plain Diff
Merge branch 'qemu' into 'master'
Add CI job for non-x86 vectorization. See merge request
!244
parents
0b740d1f
78c2cbc0
Branches
Branches containing commit
Tags
release/0.3.3
Tags containing commit
No related merge requests found
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
.gitlab-ci.yml
+46
-0
46 additions, 0 deletions
.gitlab-ci.yml
pystencils/backends/simd_instruction_sets.py
+3
-0
3 additions, 0 deletions
pystencils/backends/simd_instruction_sets.py
pystencils/include/arm_neon_helpers.h
+1
-1
1 addition, 1 deletion
pystencils/include/arm_neon_helpers.h
with
50 additions
and
1 deletion
.gitlab-ci.yml
+
46
−
0
View file @
269c0bfa
...
@@ -124,6 +124,52 @@ ubuntu:
...
@@ -124,6 +124,52 @@ ubuntu:
reports
:
reports
:
junit
:
report.xml
junit
:
report.xml
.multiarch_template
:
stage
:
test
except
:
variables
:
-
$ENABLE_NIGHTLY_BUILDS
before_script
:
&multiarch_before_script
-
python3 -c "import pystencils as ps; ps.cpu.cpujit.read_config()"
-
sed -i '/^fail_under.*/d' pytest.ini
script
:
-
export NUM_CORES=$(nproc --all)
-
mkdir -p ~/.config/matplotlib
-
echo "backend:template" > ~/.config/matplotlib/matplotlibrc
-
sed -i 's/--doctest-modules //g' pytest.ini
-
env
-
pip3 list
-
pytest-3 -v -n $NUM_CORES --cov-report html --cov-report term --cov=. --junitxml=report.xml pystencils_tests/test_*vec*.py pystencils_tests/test_random.py
-
python3 -m coverage xml
tags
:
-
docker
artifacts
:
when
:
always
paths
:
-
coverage_report
reports
:
cobertura
:
coverage.xml
junit
:
report.xml
arm64
:
extends
:
.multiarch_template
image
:
i10git.cs.fau.de:5005/pycodegen/pycodegen/arm64
variables
:
PYSTENCILS_SIMD
:
"
neon"
QEMU_CPU
:
"
cortex-a72"
before_script
:
-
*multiarch_before_script
-
sed -i s/march=native/march=armv8-a/g ~/.config/pystencils/config.json
ppc64le
:
extends
:
.multiarch_template
image
:
i10git.cs.fau.de:5005/pycodegen/pycodegen/ppc64le
variables
:
PYSTENCILS_SIMD
:
"
vsx"
before_script
:
-
*multiarch_before_script
-
sed -i s/mcpu=native/mcpu=power8/g ~/.config/pystencils/config.json
minimal-conda
:
minimal-conda
:
stage
:
test
stage
:
test
except
:
except
:
...
...
This diff is collapsed.
Click to expand it.
pystencils/backends/simd_instruction_sets.py
+
3
−
0
View file @
269c0bfa
import
math
import
math
import
os
import
platform
import
platform
from
ctypes
import
CDLL
from
ctypes
import
CDLL
...
@@ -25,6 +26,8 @@ def get_supported_instruction_sets():
...
@@ -25,6 +26,8 @@ def get_supported_instruction_sets():
global
_cache
global
_cache
if
_cache
is
not
None
:
if
_cache
is
not
None
:
return
_cache
.
copy
()
return
_cache
.
copy
()
if
'
PYSTENCILS_SIMD
'
in
os
.
environ
:
return
os
.
environ
[
'
PYSTENCILS_SIMD
'
].
split
(
'
,
'
)
if
platform
.
system
()
==
'
Darwin
'
and
platform
.
machine
()
==
'
arm64
'
:
# not supported by cpuinfo
if
platform
.
system
()
==
'
Darwin
'
and
platform
.
machine
()
==
'
arm64
'
:
# not supported by cpuinfo
return
[
'
neon
'
]
return
[
'
neon
'
]
elif
platform
.
machine
().
startswith
(
'
ppc64
'
):
# no flags reported by cpuinfo
elif
platform
.
machine
().
startswith
(
'
ppc64
'
):
# no flags reported by cpuinfo
...
...
This diff is collapsed.
Click to expand it.
pystencils/include/arm_neon_helpers.h
+
1
−
1
View file @
269c0bfa
...
@@ -32,7 +32,7 @@ inline int32x4_t makeVec_s32(int a, int b, int c, int d)
...
@@ -32,7 +32,7 @@ inline int32x4_t makeVec_s32(int a, int b, int c, int d)
#endif
#endif
inline
void
cachelineZero
(
void
*
p
)
{
inline
void
cachelineZero
(
void
*
p
)
{
__asm__
volatile
(
"dc zva, %0"
::
"r"
(
p
));
__asm__
volatile
(
"dc zva, %0"
::
"r"
(
p
)
:
"memory"
);
}
}
inline
size_t
_cachelineSize
()
{
inline
size_t
_cachelineSize
()
{
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment