2 files changed: +3 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -182,9 +182,6 @@ namespace ctranslate2 {
182182
183183 bool gpu_supports_int8 (int device) {
184184 const cudaDeviceProp& device_prop = get_device_properties (device);
185- // Disable INT8 for sm120: https://github.com/OpenNMT/CTranslate2/issues/1865
186- if (device_prop.major == 12 && device_prop.minor == 0 )
187- return false ;
188185 return device_prop.major > 6 || (device_prop.major == 6 && device_prop.minor == 1 );
189186 }
190187
Original file line number | Diff line number | Diff line change
@@ -350,6 +350,9 @@ namespace ctranslate2 {
350350 if ((compute_type == ComputeType::FLOAT16 || compute_type == ComputeType::BFLOAT16)
351351 && cuda::gpu_has_fp16_tensor_cores (device_index))
352352 return 8 ;
353+ else if ((compute_type == ComputeType::INT8_FLOAT16 || compute_type == ComputeType::INT8_BFLOAT16 || compute_type == ComputeType::INT8_FLOAT32)
354+ && cuda::gpu_has_int8_tensor_cores (device_index))
355+ return 16 ;
353356 }
354357#else
355358 (void )compute_type;
You can’t perform that action at this time.
0 commit comments