Skip to content
Snippets Groups Projects
Commit 04fd3c7a authored by Andreas Klöckner, committed by GitHub
Browse files

Merge pull request #167 from hightower8083/bugfix-apple-radeon-scan

Apple AMD Radeon GPU bug-fix
parents 52610646 3021f0fb
No related branches found
No related tags found
No related merge requests found
Pipeline #
@@ -295,8 +295,11 @@ void ${kernel_name}(
 if (LID_0 == 0 && unit_base != interval_begin)
 {
+    scan_type tmp = ldata[K][WG_SIZE - 1].value;
+    scan_type tmp_aux = ldata[0][0].value;
     ldata[0][0].value = SCAN_EXPR(
-        ldata[K][WG_SIZE - 1].value, ldata[0][0].value,
+        tmp, tmp_aux,
 %if is_segmented:
     (l_segment_start_flags[0][0])
 %else:
@@ -760,7 +763,7 @@ _PREFIX_WORDS = set("""
 group_base seg_end my_val DEBUG ARGS
 ints_to_store ints_per_wg scan_types_per_int linear_index
 linear_scan_data_idx dest src store_base wrapped_scan_type
-dummy scan_tmp
+dummy scan_tmp tmp_aux
 LID_2 LID_1 LID_0
 LDIM_0 LDIM_1 LDIM_2
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment