Skip to content

Commit

Permalink
update cuda archCoresPerSM
Browse files Browse the repository at this point in the history
  • Loading branch information
yhmtsai committed Nov 3, 2022
1 parent 1fd207a commit 2ce0fb8
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion common/cuda_hip/base/executor.hpp.inc
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ namespace {


// The function is copied from _ConvertSMVer2Cores of
- // cuda-11.0/samples/common/inc/helper_cuda.h
+ // cuda-samples:Common/helper_cuda.h
inline int convert_sm_ver_to_cores(int major, int minor)
{
// Defines for GPU Architecture types (using the SM version to determine
Expand All @@ -60,6 +60,9 @@ inline int convert_sm_ver_to_cores(int major, int minor)
{0x72, 64}, // Volta Generation (SM 7.2) GV11b class
{0x75, 64}, // Turing Generation (SM 7.5) TU1xx class
{0x80, 64}, // Ampere Generation (SM 8.0) GA100 class
{0x86, 128}, // Ampere Generation (SM 8.6)
{0x87, 128}, // Ampere Generation (SM 8.7)
{0x90, 128}, // Hopper Generation (SM 9.0)
{-1, -1}};

int index = 0;
Expand Down

0 comments on commit 2ce0fb8

Please sign in to comment.