Skip to content
Snippets Groups Projects
Commit 374d0fd5 authored by Stephan Seitz's avatar Stephan Seitz
Browse files

Make Torch CUDA compilation pass

parent e47d321f
Branches
Tags
No related merge requests found
...@@ -20,10 +20,12 @@ __global__ void {{ kernel_name }}_cuda_forward_kernel( ...@@ -20,10 +20,12 @@ __global__ void {{ kernel_name }}_cuda_forward_kernel(
{% for i in range(tensor.spatial_dimensions )-%} {% for i in range(tensor.spatial_dimensions )-%}
int _stride_{{ tensor.name }}_{{ i }} {{- ", " }} int _stride_{{ tensor.name }}_{{ i }} {{- ", " }}
{% endfor -%} {% endfor -%}
{% for i in range(tensor.spatial_dimensions )-%}
int _size_{{ tensor.name }}_{{ i }} {{- ", " }}
{% endfor -%}
{% endfor -%} {% endfor -%}
{% for i in range(forward_output_tensors[0].spatial_dimensions )-%} int _unused
int _size_{{ forward_output_tensors[0] }}_{{ i }} {{- "," if not loop.last }} )
{% endfor %})
{ {
{{forward_kernel}} {{forward_kernel}}
} }
...@@ -36,10 +38,12 @@ __global__ void {{ kernel_name }}_cuda_backward_kernel( ...@@ -36,10 +38,12 @@ __global__ void {{ kernel_name }}_cuda_backward_kernel(
{% for i in range(tensor.spatial_dimensions )-%} {% for i in range(tensor.spatial_dimensions )-%}
int _stride_{{ tensor.name }}_{{ i }} {{- ", " }} int _stride_{{ tensor.name }}_{{ i }} {{- ", " }}
{% endfor -%} {% endfor -%}
{% for i in range(tensor.spatial_dimensions )-%}
int _size_{{ tensor.name }}_{{ i }} {{- ", " }}
{% endfor -%}
{% endfor -%} {% endfor -%}
{% for i in range(forward_output_tensors[0].spatial_dimensions )-%} int _unused
int _size_{{ forward_output_tensors[0].name }}_{{ i }} {{- "," if not loop.last }} )
{% endfor %})
{ {
{{backward_kernel}} {{backward_kernel}}
} }
...@@ -50,9 +54,14 @@ void {{ kernel_name }}_cuda_forward( ...@@ -50,9 +54,14 @@ void {{ kernel_name }}_cuda_forward(
{%- endfor -%}) {%- endfor -%})
{ {
{% for i in range(forward_output_tensors[0].spatial_dimensions )-%} {% for tensor in forward_tensors -%}
int _size_{{ forward_output_tensors[0].name }}_{{ i }} = {{ forward_output_tensors[0].name }}.size({{ i }}); {% for i in dimensions -%}
{% endfor %} int _stride_{{tensor}}_{{i}} = {{tensor}}.strides()[{{ i }}];
{% endfor -%}
{% for i in dimensions -%}
int _size_{{tensor}}_{{i}} = {{tensor}}.size({{ i }});
{% endfor -%}
{% endfor -%}
/*at:: at::device(at::kCUDA).dtype(k{{ dtype }})*/ /*at:: at::device(at::kCUDA).dtype(k{{ dtype }})*/
AT_DISPATCH_FLOATING_TYPES({{ forward_input_tensors[0].name }}.type(), "{{ kernel_name }}_forward_cuda", ([&] { AT_DISPATCH_FLOATING_TYPES({{ forward_input_tensors[0].name }}.type(), "{{ kernel_name }}_forward_cuda", ([&] {
...@@ -63,10 +72,11 @@ void {{ kernel_name }}_cuda_forward( ...@@ -63,10 +72,11 @@ void {{ kernel_name }}_cuda_forward(
{% for i in range(tensor.spatial_dimensions) -%} {% for i in range(tensor.spatial_dimensions) -%}
{{tensor.name}}.strides()[{{ i }}] {{- "," }} {{tensor.name}}.strides()[{{ i }}] {{- "," }}
{% endfor -%} {% endfor -%}
{% for i in range(tensor.spatial_dimensions) -%}
{{tensor.name}}.size({{ i }}) {{- "," }}
{% endfor -%}
{% endfor -%} {% endfor -%}
{% for i in range(forward_output_tensors[0].spatial_dimensions) -%} 0
{{ forward_output_tensors[0].name }}.size({{ i }}) {{- "," if not loop.last }}
{% endfor %}
); );
})); }));
cudaError_t err = cudaGetLastError(); cudaError_t err = cudaGetLastError();
...@@ -82,9 +92,14 @@ void {{ kernel_name }}_cuda_backward( ...@@ -82,9 +92,14 @@ void {{ kernel_name }}_cuda_backward(
{%- endfor %}) {%- endfor %})
{ {
{% for i in range(backward_output_tensors[0].spatial_dimensions )-%} {% for tensor in backward_tensors -%}
int _size_{{ backward_output_tensors[0].name }}_{{ i }} = {{ backward_output_tensors[0].name }}.size({{ i }}); {% for i in dimensions -%}
{% endfor %} int _stride_{{tensor}}_{{i}} = {{tensor}}.strides()[{{ i }}];
{% endfor -%}
{% for i in dimensions -%}
int _size_{{tensor}}_{{i}} = {{tensor}}.size({{ i }});
{% endfor -%}
{% endfor -%}
/*at:: at::device(at::kCUDA).dtype(k{{ dtype }})*/ /*at:: at::device(at::kCUDA).dtype(k{{ dtype }})*/
AT_DISPATCH_FLOATING_TYPES({{ backward_input_tensors[0].name }}.type(), "{{ kernel_name }}_backward_cuda", ([&] { AT_DISPATCH_FLOATING_TYPES({{ backward_input_tensors[0].name }}.type(), "{{ kernel_name }}_backward_cuda", ([&] {
...@@ -95,10 +110,11 @@ void {{ kernel_name }}_cuda_backward( ...@@ -95,10 +110,11 @@ void {{ kernel_name }}_cuda_backward(
{% for i in range(tensor.spatial_dimensions )-%} {% for i in range(tensor.spatial_dimensions )-%}
{{tensor.name}}.strides()[{{ i }}]{{- ", " }} {{tensor.name}}.strides()[{{ i }}]{{- ", " }}
{% endfor -%} {% endfor -%}
{% for i in range(tensor.spatial_dimensions )-%}
{{tensor.name}}.size({{ i }}){{- ", " }}
{% endfor -%}
{% endfor -%} {% endfor -%}
{% for i in range(backward_output_tensors[0].spatial_dimensions )-%} 0
{{ backward_output_tensors[0].name }}.size({{ i }}) {{- "," if not loop.last }}
{% endfor %}
); );
})); }));
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or to comment