CUDA: verify CC is supported by target library (#13298)

This commit is contained in:
Daniel Hiltgen
2025-12-02 09:28:41 -08:00
committed by GitHub
parent d3e0a0dee4
commit f8f1071818

View File

@@ -509,11 +509,9 @@ func GetVisibleDevicesEnv(l []DeviceInfo) map[string]string {
 // to crash at inference time and requires deeper validation before we include
 // it in the supported devices list.
 func (d DeviceInfo) NeedsInitValidation() bool {
-	// At this time the only library we know needs a 2nd pass is ROCm since
-	// rocblas will crash on unsupported devices. We want to find those crashes
-	// during bootstrap discovery so we can eliminate those GPUs before the user
-	// tries to run inference on them
-	return d.Library == "ROCm"
+	// ROCm: rocblas will crash on unsupported devices.
+	// CUDA: verify CC is supported by the version of the library
+	return d.Library == "ROCm" || d.Library == "CUDA"
 }
 
 // Set the init validation environment variable