Skip to content

Commit

Permalink
[Intel] Add fast_dividef (#902)
Browse files Browse the repository at this point in the history
Signed-off-by: Whitney Tsang <whitney.tsang@intel.com>
  • Loading branch information
whitneywhtsang authored Apr 17, 2024
1 parent 9a0605c commit b10a970
Showing 1 changed file with 7 additions and 0 deletions.
7 changes: 7 additions & 0 deletions python/triton/language/extra/intel/libdevice.py
Original file line number Diff line number Diff line change
Expand Up @@ -127,6 +127,13 @@ def saturatef(arg0, _builder=None):
}, is_pure=True, _builder=_builder)


@core.extern
def fast_dividef(arg0, arg1, _builder=None):
    """Elementwise extern call to ``__imf_fast_fdividef`` on two fp32 operands.

    Only the ``(fp32, fp32)`` signature is registered; it maps to the extern
    symbol ``__imf_fast_fdividef`` and yields an fp32 result. The call is
    declared pure (``is_pure=True``).

    NOTE(review): presumably computes a fast/approximate ``arg0 / arg1`` --
    confirm against the Intel device math library documentation.

    Args:
        arg0: First operand (presumably the dividend -- TODO confirm).
        arg1: Second operand (presumably the divisor -- TODO confirm).
        _builder: Builder object forwarded unchanged to
            ``core.extern_elementwise``.

    Returns:
        Whatever ``core.extern_elementwise`` returns for this dispatch.
    """
    fp32 = core.dtype("fp32")
    # Maps the accepted argument dtypes to (extern symbol, result dtype).
    dispatch_table = {
        (fp32, fp32): ("__imf_fast_fdividef", fp32),
    }
    # Library name and path are intentionally left empty, as in the sibling
    # wrappers visible in this file.
    return core.extern_elementwise(
        "",
        "",
        [arg0, arg1],
        dispatch_table,
        is_pure=True,
        _builder=_builder,
    )


@core.extern
def div_rn(arg0, arg1, _builder=None):
return core.extern_elementwise(
Expand Down

0 comments on commit b10a970

Please sign in to comment.