Centralize GPU configuration vars #4264

Open · wants to merge 1 commit into base: main
9 changes: 5 additions & 4 deletions gpu/amd_linux.go
@@ -13,6 +13,7 @@ import (
"strings"

"github.com/ollama/ollama/format"
"github.com/ollama/ollama/server/envconfig"
)

// Discovery logic for AMD/ROCm GPUs
@@ -51,9 +52,9 @@ func AMDGetGPUInfo() []GpuInfo {

// Determine if the user has already pre-selected which GPUs to look at, then ignore the others
var visibleDevices []string
- hipVD := os.Getenv("HIP_VISIBLE_DEVICES") // zero based index only
- rocrVD := os.Getenv("ROCR_VISIBLE_DEVICES") // zero based index or UUID, but consumer cards seem to not support UUID
- gpuDO := os.Getenv("GPU_DEVICE_ORDINAL") // zero based index
+ hipVD := envconfig.HipVisibleDevices // zero based index only
+ rocrVD := envconfig.RocrVisibleDevices // zero based index or UUID, but consumer cards seem to not support UUID
+ gpuDO := envconfig.GpuDeviceOrdinal // zero based index
switch {
// TODO is this priority order right?
case hipVD != "":
@@ -66,7 +67,7 @@ func AMDGetGPUInfo() []GpuInfo {
visibleDevices = strings.Split(gpuDO, ",")
}

- gfxOverride := os.Getenv("HSA_OVERRIDE_GFX_VERSION")
+ gfxOverride := envconfig.HsaOverrideGfxVersion
var supported []string
libDir := ""

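The hunk above shows only the first and last arms of the selection switch. As a hedged illustration, here is a condensed sketch of the precedence it implies (HIP_VISIBLE_DEVICES, then ROCR_VISIBLE_DEVICES, then GPU_DEVICE_ORDINAL), reading the centralized envconfig values instead of calling os.Getenv; the switch arms elided from the diff are assumptions, not the repository's exact code.

// Condensed sketch, not the repository's exact code: the device pre-selection
// implied by the hunk above, reading the centralized envconfig values. The
// switch arms elided from the diff are assumptions.
package gpu

import (
	"strings"

	"github.com/ollama/ollama/server/envconfig"
)

func visibleAMDDevices() []string {
	hipVD := envconfig.HipVisibleDevices   // zero based index only
	rocrVD := envconfig.RocrVisibleDevices // zero based index or UUID
	gpuDO := envconfig.GpuDeviceOrdinal    // zero based index

	switch {
	case hipVD != "":
		return strings.Split(hipVD, ",")
	case rocrVD != "":
		return strings.Split(rocrVD, ",")
	case gpuDO != "":
		return strings.Split(gpuDO, ",")
	}
	return nil // no pre-selection: consider every discovered GPU
}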
3 changes: 2 additions & 1 deletion gpu/amd_windows.go
@@ -11,6 +11,7 @@ import (
"strings"

"github.com/ollama/ollama/format"
"github.com/ollama/ollama/server/envconfig"
)

const (
@@ -54,7 +55,7 @@ func AMDGetGPUInfo() []GpuInfo {
}

var supported []string
- gfxOverride := os.Getenv("HSA_OVERRIDE_GFX_VERSION")
+ gfxOverride := envconfig.HsaOverrideGfxVersion
if gfxOverride == "" {
supported, err = GetSupportedGFX(libDir)
if err != nil {
30 changes: 28 additions & 2 deletions server/envconfig/config.go
@@ -31,10 +31,21 @@ var (
RunnersDir string
// Set via OLLAMA_TMPDIR in the environment
TmpDir string

+ // Set via CUDA_VISIBLE_DEVICES in the environment
+ CudaVisibleDevices string
+ // Set via HIP_VISIBLE_DEVICES in the environment
+ HipVisibleDevices string
+ // Set via ROCR_VISIBLE_DEVICES in the environment
+ RocrVisibleDevices string
+ // Set via GPU_DEVICE_ORDINAL in the environment
+ GpuDeviceOrdinal string
+ // Set via HSA_OVERRIDE_GFX_VERSION in the environment
+ HsaOverrideGfxVersion string
)

func AsMap() map[string]string {
- return map[string]string{
+ ret := map[string]string{
"OLLAMA_ORIGINS": fmt.Sprintf("%v", AllowOrigins),
"OLLAMA_DEBUG": fmt.Sprintf("%v", Debug),
"OLLAMA_LLM_LIBRARY": fmt.Sprintf("%v", LLMLibrary),
@@ -46,6 +57,14 @@ func AsMap() map[string]string {
"OLLAMA_RUNNERS_DIR": fmt.Sprintf("%v", RunnersDir),
"OLLAMA_TMPDIR": fmt.Sprintf("%v", TmpDir),
}
if runtime.GOOS != "darwin" {
ret["CUDA_VISIBLE_DEVICES"] = fmt.Sprintf("%v", CudaVisibleDevices)
ret["HIP_VISIBLE_DEVICES"] = fmt.Sprintf("%v", HipVisibleDevices)
ret["ROCR_VISIBLE_DEVICES"] = fmt.Sprintf("%v", RocrVisibleDevices)
ret["GPU_DEVICE_ORDINAL"] = fmt.Sprintf("%v", GpuDeviceOrdinal)
ret["HSA_OVERRIDE_GFX_VERSION"] = fmt.Sprintf("%v", HsaOverrideGfxVersion)
}
return ret
}

var defaultAllowOrigins = []string{
@@ -163,12 +182,19 @@ func LoadConfig() {
}
}

- if onp := os.Getenv("OLLAMA_MAX_QUEUE"); onp != "" {
+ if onp := clean("OLLAMA_MAX_QUEUE"); onp != "" {
p, err := strconv.Atoi(onp)
if err != nil || p <= 0 {
slog.Error("invalid setting", "OLLAMA_MAX_QUEUE", onp, "error", err)
} else {
MaxQueuedRequests = p
}
}

+ CudaVisibleDevices = clean("CUDA_VISIBLE_DEVICES")
Review comment on this line:
@dhiltgen is this public variable CudaVisibleDevices meant to be used in cudaGetVisibleDevicesEnv?

func cudaGetVisibleDevicesEnv(gpuInfo []GpuInfo) (string, string) {

Collaborator Author replied:

Good question.

For NVIDIA GPUs, we use their C libraries to discover the GPUs. We've recently switched to using the Driver API as our primary source, and fall back to the CUDA runtime library if that fails (most likely we'll remove the CUDA runtime code in a few releases, as long as the Driver API looks reliable). Those libraries already implement filtering based on this environment variable, so the calls here and here will only return a subset of GPUs based on that variable if the user has set it.

In our scheduler, we pick which GPU (of the GPUs exposed) to run a model on, and when we run the subprocess for inference, we wire up the environment variable to ensure that subprocess uses exactly the set of GPUs we want it to use.
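As a hedged sketch of that last step (not the actual ollama scheduler code), wiring a chosen GPU set into the inference subprocess environment could look like this; runOnGPUs and its parameters are illustrative names:

// Hypothetical sketch: pin an inference subprocess to a chosen set of GPUs by
// overriding the vendor visibility variable in the child's environment.
package sched

import (
	"fmt"
	"os"
	"os/exec"
	"strings"
)

func runOnGPUs(binary string, args []string, gpuIDs []string) error {
	cmd := exec.Command(binary, args...)
	// Inherit the parent environment, then force CUDA_VISIBLE_DEVICES to the
	// scheduler's selection so the child only sees those devices.
	cmd.Env = append(os.Environ(),
		fmt.Sprintf("CUDA_VISIBLE_DEVICES=%s", strings.Join(gpuIDs, ",")))
	cmd.Stdout = os.Stdout
	cmd.Stderr = os.Stderr
	return cmd.Run()
}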

+ HipVisibleDevices = clean("HIP_VISIBLE_DEVICES")
+ RocrVisibleDevices = clean("ROCR_VISIBLE_DEVICES")
+ GpuDeviceOrdinal = clean("GPU_DEVICE_ORDINAL")
+ HsaOverrideGfxVersion = clean("HSA_OVERRIDE_GFX_VERSION")

}
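LoadConfig reads these values through a clean(key string) helper that the diff references but does not include. A plausible sketch, assuming it simply normalizes the raw environment value (the real implementation may differ):

// Assumed sketch of the clean helper used above; the actual implementation in
// server/envconfig is not shown in this diff.
package envconfig

import (
	"os"
	"strings"
)

// clean reads an environment variable and strips surrounding whitespace and
// stray quote characters that users sometimes include when exporting values.
func clean(key string) string {
	return strings.Trim(os.Getenv(key), "\"' ")
}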