We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
:fastmath
1 parent f42d1cf, commit 5d88d3c (Copy full SHA for 5d88d3c)
1 file changed
src/ptx.jl
@@ -291,9 +291,11 @@ function optimize_module!(@nospecialize(job::CompilerJob{PTXCompilerTarget}),
291
register!(pb, NVVMReflectPass())
292
add!(pb, NVVMReflectPass())
293
end
294
- add!(pb, PTXRSqrtFastPass())
295
- add!(pb, PTXFDivFastPass())
296
- add!(pb, PTXFSqrtFastPass())
+ if get(optimization_options(job), :fastmath, true)
+ add!(pb, PTXRSqrtFastPass())
+ add!(pb, PTXFDivFastPass())
297
+ add!(pb, PTXFSqrtFastPass())
298
+ end
299
300
add!(pb, NewPMFunctionPassManager()) do fpm
301
# needed by GemmKernels.jl-like code
0 commit comments