Skip to content

Commit

Permalink
Use a default of 128 cores per SM instead of throwing an error (#3884)
Browse files Browse the repository at this point in the history
Use a default of 128 cores per SM instead of throwing an error
  • Loading branch information
liqiangxl authored Feb 17, 2025
1 parent 53bd0a7 commit 2e755b7
Showing 1 changed file with 6 additions and 20 deletions.
26 changes: 6 additions & 20 deletions csrc/scheduler/utils.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2822,30 +2822,16 @@ namespace {
// Returns the number of cores per SM for the GPU architecture identified by
// the given compute capability (major.minor).
//
// The lookup key packs the version as (major << 4) + minor, so compute
// capability 8.6 becomes 0x86 and 12.0 becomes 0xc0.
//
// Architectures missing from the table do not raise an error; they fall back
// to 128 cores per SM.
int getCoresPerSM(int major, int minor) {
  // Built once on first use and shared by all later calls, instead of
  // reconstructing the table on every invocation.
  static const std::unordered_map<int, int> cores_per_sm_map = {
      {0x30, 192}, {0x32, 192}, {0x35, 192}, {0x37, 192}, {0x50, 128},
      {0x52, 128}, {0x53, 128}, {0x60, 64},  {0x61, 128}, {0x62, 128},
      {0x70, 64},  {0x72, 64},  {0x75, 64},  {0x80, 64},  {0x86, 128},
      {0x87, 128}, {0x89, 128}, {0x90, 128}, {0xa0, 128}, {0xc0, 128}};

  const int sm_version = (major << 4) + minor;
  const auto it = cores_per_sm_map.find(sm_version);
  if (it != cores_per_sm_map.end()) {
    return it->second;
  }
  // Use the default value of 128 for any architecture not listed,
  // applicable to all current Blackwell GPUs.
  return 128;
}
} // namespace
Expand Down

0 comments on commit 2e755b7

Please sign in to comment.