mirror of https://github.com/NVIDIA/nccl.git
Merge 51f51741d5
into 593de54e52
This commit is contained in:
commit
2b3b197e35
|
@ -260,7 +260,7 @@ struct Apply_Cast<float ,__nv_bfloat16, /*EltPerPack=*/2> {
|
|||
template<> \
|
||||
struct Apply_Cast<A, B, EltPerPack> { \
|
||||
__device__ __forceinline__ static BytePack<sizeof(B)*EltPerPack> cast(BytePack<sizeof(A)*EltPerPack> a) { \
|
||||
return toPack(VecB(fromPack<VecA>(a))); \
|
||||
return toPack(static_cast<VecB>(fromPack<VecA>(a))); \
|
||||
} \
|
||||
}; \
|
||||
template<> \
|
||||
|
|
Loading…
Reference in New Issue