Enable Vulkan Flash attention in FlashAttentionSupported
This commit is contained in:
parent
e6da524ab7
commit
49c4d154ae
|
|
@@ -422,8 +422,7 @@ func GetGPUInfo() GpuInfoList {
|
|||
C.free(unsafe.Pointer(memInfo.err))
|
||||
continue
|
||||
}
|
||||
|
||||
gpuInfo.FlashAttention = true
|
||||
|
||||
gpuInfo.TotalMemory = uint64(memInfo.total)
|
||||
gpuInfo.FreeMemory = uint64(memInfo.free)
|
||||
gpuInfo.ID = C.GoString(&memInfo.gpu_id[0])
|
||||
|
|
|
|||
|
|
@@ -182,7 +182,8 @@ func (l GpuInfoList) FlashAttentionSupported() bool {
|
|||
supportsFA := gpu.Library == "cpu" ||
|
||||
gpu.Library == "metal" ||
|
||||
(gpu.Library == "cuda" && gpu.DriverMajor >= 7) ||
|
||||
gpu.Library == "rocm"
|
||||
gpu.Library == "rocm" ||
|
||||
gpu.Library == "vulkan"
|
||||
|
||||
if !supportsFA {
|
||||
return false
|
||||
|
|
|
|||
Loading…
Reference in New Issue