Last active
August 19, 2025 07:39
-
-
Save ugovaretto/89474f357f80f3130c96f4db18d37df8 to your computer and use it in GitHub Desktop.
Patch to make Ollama work with gfx1151 GPUs that use 128 GB of GTT memory
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
diff --git a/discover/amd_linux.go b/discover/amd_linux.go | |
index ebffbdf6..bbb5ec49 100644 | |
--- a/discover/amd_linux.go | |
+++ b/discover/amd_linux.go | |
@@ -315,15 +315,15 @@ func AMDGetGPUInfo() ([]RocmGPUInfo, error) { | |
gpuOrdinalID += 1 | |
// iGPU detection, remove this check once we can support an iGPU variant of the rocm library | |
- if totalMemory < IGPUMemLimit { | |
- reason := "unsupported Radeon iGPU detected skipping" | |
- slog.Info(reason, "id", gpuInfo.ID, "total", format.HumanBytes2(totalMemory)) | |
- unsupportedGPUs = append(unsupportedGPUs, UnsupportedGPUInfo{ | |
- GpuInfo: gpuInfo.GpuInfo, | |
- Reason: reason, | |
- }) | |
- continue | |
- } | |
+ // if totalMemory < IGPUMemLimit { | |
+ // reason := "unsupported Radeon iGPU detected skipping" | |
+ // slog.Info(reason, "id", gpuInfo.ID, "total", format.HumanBytes2(totalMemory)) | |
+ // unsupportedGPUs = append(unsupportedGPUs, UnsupportedGPUInfo{ | |
+ // GpuInfo: gpuInfo.GpuInfo, | |
+ // Reason: reason, | |
+ // }) | |
+ // continue | |
+ // } | |
minVer, err := strconv.Atoi(RocmComputeMajorMin) | |
if err != nil { | |
slog.Error("invalid RocmComputeMajorMin setting", "value", RocmComputeMajorMin, "error", err) | |
@@ -437,7 +437,9 @@ func AMDValidateLibDir() (string, error) { | |
} | |
// Well known ollama installer path | |
- installedRocmDir := "/usr/share/ollama/lib/rocm" | |
+// installedRocmDir := "/usr/share/ollama/lib/rocm" | |
+ installedRocmDir := "~/opt/rocm-6.4" | |
+ return installedRocmDir, nil | |
if rocmLibUsable(installedRocmDir) { | |
return installedRocmDir, nil | |
} | |
diff --git a/server/routes.go b/server/routes.go | |
index 99b1b300..647001db 100644 | |
--- a/server/routes.go | |
+++ b/server/routes.go | |
@@ -53,7 +53,7 @@ var useClient2 = experimentEnabled("client2") | |
// Low VRAM mode is based on the sum of total VRAM (not free) and triggers | |
// reduced context length on some models | |
-var lowVRAMThreshold uint64 = 20 * format.GibiByte | |
+var lowVRAMThreshold uint64 = 0; //20 * format.GibiByte |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment