diff --git a/test/test_linalg.py b/test/test_linalg.py index cfc3df7da4ef30a5ffb511aa8e966e1b19a690f7..b1ebacb1e477e2cb2529fed263b94faa787e334d 100644 --- a/test/test_linalg.py +++ b/test/test_linalg.py @@ -106,8 +106,8 @@ def test_axpy(ctx_factory): outer_tag="unr", inner_tag="l.0") return knl - for variant in [variant_cpu, variant_gpu]: #for variant in [ variant_gpu]: + for variant in [variant_cpu, variant_gpu]: lp.auto_test_vs_ref(seq_knl, ctx, variant(knl), op_count=[np.dtype(dtype).itemsize*n*3/1e9], op_label=["GBytes"], @@ -218,6 +218,41 @@ def test_variable_size_matrix_mul(ctx_factory): parameters={"n": n}) +def test_funny_shape_matrix_mul(ctx_factory): + ctx = ctx_factory() + + n = get_suitable_size(ctx) + m = n+12 + l = m+12 + + knl = lp.make_kernel( + "[n,m,l] -> {[i,k,j]: 0<=i