|
7 | 7 | "log/slog"
|
8 | 8 | "os"
|
9 | 9 | "path/filepath"
|
10 |
| - "strconv" |
| 10 | + "runtime" |
11 | 11 | "strings"
|
12 | 12 | )
|
13 | 13 |
|
@@ -35,22 +35,64 @@ func GetSupportedGFX(libDir string) ([]string, error) {
|
35 | 35 | return ret, nil
|
36 | 36 | }
|
37 | 37 |
|
38 |
| -func amdSetVisibleDevices(ids []int, skip map[int]interface{}) { |
39 |
| - // Set the visible devices if not already set |
40 |
| - // TODO - does sort order matter? |
41 |
| - devices := []string{} |
42 |
| - for i := range ids { |
43 |
| - if _, skipped := skip[i]; skipped { |
| 38 | +func rocmGetVisibleDevicesEnv(gpuInfo []GpuInfo) (string, string) { |
| 39 | + ids := []string{} |
| 40 | + for _, info := range gpuInfo { |
| 41 | + if info.Library != "rocm" { |
| 42 | + // TODO shouldn't happen if things are wired correctly... |
| 43 | + slog.Debug("rocmGetVisibleDevicesEnv skipping over non-rocm device", "library", info.Library) |
44 | 44 | continue
|
45 | 45 | }
|
46 |
| - devices = append(devices, strconv.Itoa(i)) |
| 46 | + ids = append(ids, info.ID) |
47 | 47 | }
|
| 48 | + return "HIP_VISIBLE_DEVICES", strings.Join(ids, ",") |
| 49 | +} |
48 | 50 |
|
49 |
| - val := strings.Join(devices, ",") |
50 |
| - err := os.Setenv("HIP_VISIBLE_DEVICES", val) |
51 |
| - if err != nil { |
52 |
| - slog.Warn(fmt.Sprintf("failed to set env: %s", err)) |
53 |
| - } else { |
54 |
| - slog.Info("Setting HIP_VISIBLE_DEVICES=" + val) |
| 51 | +func commonAMDValidateLibDir() (string, error) { |
| 52 | + // We try to favor system paths first, so that we can wire up the subprocess to use |
| 53 | + // the system version. Only use our bundled version if the system version doesn't work |
| 54 | + // This gives users a more recovery options if versions have subtle problems at runtime |
| 55 | + |
| 56 | + // Prefer explicit HIP env var |
| 57 | + hipPath := os.Getenv("HIP_PATH") |
| 58 | + if hipPath != "" { |
| 59 | + hipLibDir := filepath.Join(hipPath, "bin") |
| 60 | + if rocmLibUsable(hipLibDir) { |
| 61 | + slog.Debug("detected ROCM via HIP_PATH=" + hipPath) |
| 62 | + return hipLibDir, nil |
| 63 | + } |
| 64 | + } |
| 65 | + |
| 66 | + // Scan the LD_LIBRARY_PATH or PATH |
| 67 | + pathEnv := "LD_LIBRARY_PATH" |
| 68 | + if runtime.GOOS == "windows" { |
| 69 | + pathEnv = "PATH" |
| 70 | + } |
| 71 | + |
| 72 | + paths := os.Getenv(pathEnv) |
| 73 | + for _, path := range filepath.SplitList(paths) { |
| 74 | + d, err := filepath.Abs(path) |
| 75 | + if err != nil { |
| 76 | + continue |
| 77 | + } |
| 78 | + if rocmLibUsable(d) { |
| 79 | + return d, nil |
| 80 | + } |
| 81 | + } |
| 82 | + |
| 83 | + // Well known location(s) |
| 84 | + if rocmLibUsable(RocmStandardLocation) { |
| 85 | + return RocmStandardLocation, nil |
| 86 | + } |
| 87 | + |
| 88 | + // Installer payload location if we're running the installed binary |
| 89 | + exe, err := os.Executable() |
| 90 | + if err == nil { |
| 91 | + rocmTargetDir := filepath.Join(filepath.Dir(exe), "rocm") |
| 92 | + if rocmLibUsable(rocmTargetDir) { |
| 93 | + slog.Debug("detected ROCM next to ollama executable " + rocmTargetDir) |
| 94 | + return rocmTargetDir, nil |
| 95 | + } |
55 | 96 | }
|
| 97 | + return "", fmt.Errorf("no suitable rocm found, falling back to CPU") |
56 | 98 | }
|
0 commit comments