Skip to content

Commit 49e625b

Browse files
committed
Enable the transpose_last2dim copy path for MI series GPUs only
1 parent ddc83ad commit 49e625b

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

aten/src/ATen/native/cuda/Copy.cu

+1-1
Original file line number | Diff line number | Diff line change
@@ -341,7 +341,7 @@ void direct_copy_kernel_cuda(TensorIteratorBase &iter) {
341 341
AT_DISPATCH_BIT_TYPES(dtype, "copy_", [&] {
342 342
gpu_kernel_nocast(iter, [] GPU_LAMBDA(scalar_t x) { return x; });
343 343
});
344-
} else if (is_permute_021(iter) && (dtype == kBFloat16 || dtype == kHalf) && !at::detail::getCUDAHooks().isGPUArch({"gfx1100"})) {
344+
} else if (is_permute_021(iter) && (dtype == kBFloat16 || dtype == kHalf) && at::detail::getCUDAHooks().isGPUArch({{"gfx94", "gfx942", "gfx950"}})) {
345 345
transpose_last2dim(iter);
346 346
} else {
347 347
AT_DISPATCH_V2(

0 commit comments

Comments
 (0)