diff --git a/MEMO b/MEMO index 05cc2f804837eaab69d3b997d50cd0af1f7a7fae..511306dbab09ec61559443629b1b5ab904b88cae 100644 --- a/MEMO +++ b/MEMO @@ -49,6 +49,10 @@ To-do - Make tests run on GPUs +- Fuse: store/fetch elimination? + +- divisibility constraints + Fixes: - Group instructions by dependency/inames for scheduling, to @@ -62,8 +66,6 @@ Fixes: Future ideas ^^^^^^^^^^^^ -- Fuse: store/fetch elimination? - - Expose iname-duplicate-and-rename as a primitive. - Array language diff --git a/loopy/codegen/loop.py b/loopy/codegen/loop.py index 650ce34f4562ae36ba4e9ac2342cb57b690d3d75..efb70c5389b1c95c8ad24ab20b8dd1313a0b8174 100644 --- a/loopy/codegen/loop.py +++ b/loopy/codegen/loop.py @@ -61,11 +61,11 @@ def get_slab_decomposition(kernel, iname, sched_index, codegen_state): .add_constraint( isl.Constraint.inequality_from_aff( iname_rel_aff(space, - iname, ">=", upper_bound_aff-upper_incr)))) + iname, ">", upper_bound_aff-upper_incr)))) upper_bulk_bound = ( isl.Constraint.inequality_from_aff( iname_rel_aff(space, - iname, "<", upper_bound_aff-upper_incr))) + iname, "<=", upper_bound_aff-upper_incr))) else: lower_slab = None