Skip to content

Commit 85c5880

Browse files
zjing14 authored and carlushuang committed
disable tensor contraction f64 on MI100 (#602)
1 parent c84efbc commit 85c5880

File tree

2 files changed: 7 additions (+7) and 2 deletions (-2)

include/ck/tensor_operation/gpu/device/impl/device_contraction_multiple_d_xdl_cshuffle.hpp

Lines changed: 5 additions & 0 deletions
@@ -586,6 +586,11 @@ struct DeviceContractionMultipleD_Xdl_CShuffle
             return false;
         }
 
+        if(ck::get_device_name() != "gfx90a" && std::is_same<ADataType, double>::value)
+        {
+            return false;
+        }
+
         if(!GridwiseGemm::CheckValidity(arg.a_grid_desc_m_k_,
                                         arg.b_grid_desc_n_k_,
                                         arg.ds_grid_desc_m_n_,

script/cmake-ck-dev.sh

Lines changed: 2 additions & 2 deletions
@@ -10,8 +10,8 @@ cmake
 -D CMAKE_CXX_COMPILER=/opt/rocm/bin/hipcc \
 -D CMAKE_CXX_FLAGS="-O3 -ftemplate-backtrace-limit=0 -gline-tables-only -save-temps=$PWD" \
 -D CMAKE_BUILD_TYPE=Release \
--D BUILD_DEV=OFF \
--D GPU_TARGETS="gfx90a" \
+-D BUILD_DEV=ON \
+-D GPU_TARGETS="gfx908;gfx90a" \
 -D CMAKE_VERBOSE_MAKEFILE:BOOL=ON \
 -D USE_BITINT_EXTENSION_INT4=OFF \
 ${MY_PROJECT_SOURCE}

0 commit comments

Comments
 (0)