Skip to content

Instantly share code, notes, and snippets.

@ugovaretto
Last active August 19, 2025 07:39
Show Gist options
  • Save ugovaretto/89474f357f80f3130c96f4db18d37df8 to your computer and use it in GitHub Desktop.
Save ugovaretto/89474f357f80f3130c96f4db18d37df8 to your computer and use it in GitHub Desktop.
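Patch to make Ollama work on gfx1151 with 128 GB of GTT memory (disables the iGPU skip check and the low-VRAM threshold, and hard-codes the ROCm library directory)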
diff --git a/discover/amd_linux.go b/discover/amd_linux.go
index ebffbdf6..bbb5ec49 100644
--- a/discover/amd_linux.go
+++ b/discover/amd_linux.go
@@ -315,15 +315,15 @@ func AMDGetGPUInfo() ([]RocmGPUInfo, error) {
gpuOrdinalID += 1
// iGPU detection, remove this check once we can support an iGPU variant of the rocm library
- if totalMemory < IGPUMemLimit {
- reason := "unsupported Radeon iGPU detected skipping"
- slog.Info(reason, "id", gpuInfo.ID, "total", format.HumanBytes2(totalMemory))
- unsupportedGPUs = append(unsupportedGPUs, UnsupportedGPUInfo{
- GpuInfo: gpuInfo.GpuInfo,
- Reason: reason,
- })
- continue
- }
+ // if totalMemory < IGPUMemLimit {
+ // reason := "unsupported Radeon iGPU detected skipping"
+ // slog.Info(reason, "id", gpuInfo.ID, "total", format.HumanBytes2(totalMemory))
+ // unsupportedGPUs = append(unsupportedGPUs, UnsupportedGPUInfo{
+ // GpuInfo: gpuInfo.GpuInfo,
+ // Reason: reason,
+ // })
+ // continue
+ // }
minVer, err := strconv.Atoi(RocmComputeMajorMin)
if err != nil {
slog.Error("invalid RocmComputeMajorMin setting", "value", RocmComputeMajorMin, "error", err)
@@ -437,7 +437,9 @@ func AMDValidateLibDir() (string, error) {
}
// Well known ollama installer path
- installedRocmDir := "/usr/share/ollama/lib/rocm"
+// installedRocmDir := "/usr/share/ollama/lib/rocm"
+ installedRocmDir := "~/opt/rocm-6.4"
+ return installedRocmDir, nil
if rocmLibUsable(installedRocmDir) {
return installedRocmDir, nil
}
diff --git a/server/routes.go b/server/routes.go
index 99b1b300..647001db 100644
--- a/server/routes.go
+++ b/server/routes.go
@@ -53,7 +53,7 @@ var useClient2 = experimentEnabled("client2")
// Low VRAM mode is based on the sum of total VRAM (not free) and triggers
// reduced context length on some models
-var lowVRAMThreshold uint64 = 20 * format.GibiByte
+var lowVRAMThreshold uint64 = 0; //20 * format.GibiByte
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment