Only use 'go-faster' compiler options (-cl-mad-enable, -cl-fast-relaxed-math) in the matrix multiply example on NVIDIA devices.

0ec05353 · Andreas Klöckner · 819c807e · 0ec05353
Commit 0ec05353 authored 14 years ago by Andreas Klöckner
--- a/examples/matrix-multiply.py
+++ b/examples/matrix-multiply.py
@@ -161,8 +161,12 @@ h_c = numpy.empty((c_height, c_width)).astype(numpy.float32)
 kernel_params = {"block_size": block_size,
        "w_a":a_width, "h_a":a_height, "w_b":b_width}
+if "NVIDIA" in queue.device.vendor:
+    options = "-cl-mad-enable -cl-fast-relaxed-math"
+else:
+    options = None
 prg = cl.Program(ctx, KERNEL_CODE % kernel_params,
-        ).build(options="-cl-mad-enable -cl-fast-relaxed-math")
+        ).build(options=options)
 kernel = prg.matrixMul
 #print prg.binaries[0]