We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 23f944c, commit 4102c9b (Copy full SHA for 4102c9b)
fbgemm_gpu/include/fbgemm_gpu/utils/float.cuh
@@ -51,10 +51,9 @@ struct Half4 {
51
52
__device__ inline void store(at::Half* p) {
53
#ifdef USE_ROCM
54
- p[0] = __low2half(a);
55
- p[1] = __high2half(a);
56
- p[2] = __low2half(b);
57
- p[3] = __high2half(b);
+ *reinterpret_cast<unsigned int*>(p) = *reinterpret_cast<unsigned int*>(&a);
+ *reinterpret_cast<unsigned int*>(p + 2) =
+ *reinterpret_cast<unsigned int*>(&b);
58
#elif CUDA_VERSION >= 9000
59
60
#ifndef __HALF2_TO_UI
0 commit comments