Skip to content

Commit 0894698

Browse files
authored
Merge pull request #271 from Hezcriko/master
Add support for RTX 50 Series
2 parents 0b0593b + 0f3be52 commit 0894698

File tree

1 file changed: 4 additions (+4), 3 deletions (-3)

src/cudart/gpucard.cpp

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,7 @@ static void getDeviceAttribute(DeviceAttribute& a, int device = 0)
101101
bool found_cc = true;
102102

103103
// Maximum number of resident blocks per multiprocessor
104-
if (a.cc > 90)
104+
if (a.cc > 120)
105105
found_cc = false;
106106
else if (a.cc >= 90)
107107
a.max_blocks_per_multiprocessor = 32;
@@ -122,16 +122,17 @@ static void getDeviceAttribute(DeviceAttribute& a, int device = 0)
122122

123123
// Number of CUDA cores (FP32) per multiprocessor, not tabulated;
124124
// documented in "Compute Capability - architecture"
125+
// 12.0: 128
125126
// 9.0: 128
126127
// 8.6, 8.7, 8.9: 128
127128
// 7.0 7.2 7.5 8.0: 64
128129
// 6.1 6.2: 128
129130
// 6.0: 64
130131
// 5.0 5.2: 128
131132
// 3.0 3.5 3.7: 192
132-
if (a.cc > 90)
133+
if (a.cc > 120)
133134
found_cc = false;
134-
else if (a.cc >= 90)
135+
else if (a.cc >= 86)
135136
a.cores_per_multiprocessor = 128;
136137
else if (a.cc >= 80)
137138
a.cores_per_multiprocessor = 64;

Comments (0): no commit comments