mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-28 22:56:32 +00:00
use __hmul2 instead of __hmul2_rn (#15852)
### Description <!-- Describe your changes. --> ### Motivation and Context <!-- - Why is this change required? What problem does it solve? - If it fixes an open issue, please link to the issue here. --> https://github.com/microsoft/onnxruntime/issues/15840
This commit is contained in:
parent
34cb293c6b
commit
475f661acd
1 changed file with 1 addition and 1 deletion
|
|
@@ -156,7 +156,7 @@ struct TypeMapper : public V_vec_m_<T, size> {};
|
|||
// The following operator overloading is not common, so we put it in an anonymous namespace
|
||||
#if defined(__CUDA_ARCH__) && __CUDA_ARCH__ > 530
|
||||
inline __device__ half2 operator*(const float a, const half2 b) {
|
||||
return __hmul2_rn(__float2half2_rn(a), b);
|
||||
return __hmul2(__float2half2_rn(a), b);
|
||||
}
|
||||
#else
|
||||
inline __device__ half2 operator*(const float a, const half2 b) {
|
||||
|
|
|
|||
Loading…
Reference in a new issue