diff --git a/test.py b/test.py index 84ce34cd09065f089a920d1a8778f269720d3a1a..0a73b472fe00649a513dfe68b3078548658b50f4 100644 --- a/test.py +++ b/test.py @@ -114,6 +114,8 @@ def test_compute_flux_derivatives_gpu(ctx_factory): flux_derivatives_dev = cl.array.empty(queue, (nvars, ndim, nx+6, ny+6, nz+6), dtype=np.float32, order="F") + prg = prg.copy(target=lp.PyOpenCLTarget(queue.device)) + if 1: with open("gen-code.cl", "w") as outf: outf.write(lp.generate_code_v2(prg).device_code()) @@ -146,11 +148,12 @@ def benchmark_compute_flux_derivatives_gpu(ctx_factory): flux_derivatives_dev = cl.array.empty(queue, (nvars, ndim, nx+6, ny+6, nz+6), dtype=np.float32, order="F") + prg = prg.copy(target=lp.PyOpenCLTarget(queue.device)) + if 0: with open("gen-code.cl", "w") as outf: outf.write(lp.generate_code_v2(prg).device_code()) - prg = prg.copy(target=lp.PyOpenCLTarget(queue.device)) prg = lp.set_options(prg, ignore_boostable_into=True, write_wrapper=True) #op_map = lp.get_op_map(prg, count_redundant_work=False) #print(op_map)