Skip to content

Commit bda5f60

Browse files
committed
feat: add ability to pass request-specific env vars to chat completion
This enables per-request authentication in model providers. Signed-off-by: Donnie Adams <[email protected]>
1 parent 50489f2 commit bda5f60

File tree

11 files changed

+54
-52
lines changed

11 files changed

+54
-52
lines changed

go.mod

+1-1
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ require (
1515
github.com/google/shlex v0.0.0-20191202100458-e7afc7fbc510
1616
github.com/google/uuid v1.6.0
1717
github.com/gptscript-ai/broadcaster v0.0.0-20240625175512-c43682019b86
18-
github.com/gptscript-ai/chat-completion-client v0.0.0-20240813051153-a440ada7e3c3
18+
github.com/gptscript-ai/chat-completion-client v0.0.0-20241104122544-5fe75f07c131
1919
github.com/gptscript-ai/cmd v0.0.0-20240802230653-326b7baf6fcb
2020
github.com/gptscript-ai/go-gptscript v0.9.5-rc5.0.20240927213153-2af51434b93e
2121
github.com/gptscript-ai/tui v0.0.0-20240923192013-172e51ccf1d6

go.sum

+2-2
Original file line numberDiff line numberDiff line change
@@ -200,8 +200,8 @@ github.com/gorilla/css v1.0.0 h1:BQqNyPTi50JCFMTw/b67hByjMVXZRwGha6wxVGkeihY=
200200
github.com/gorilla/css v1.0.0/go.mod h1:Dn721qIggHpt4+EFCcTLTU/vk5ySda2ReITrtgBl60c=
201201
github.com/gptscript-ai/broadcaster v0.0.0-20240625175512-c43682019b86 h1:m9yLtIEd0z1ia8qFjq3u0Ozb6QKwidyL856JLJp6nbA=
202202
github.com/gptscript-ai/broadcaster v0.0.0-20240625175512-c43682019b86/go.mod h1:lK3K5EZx4dyT24UG3yCt0wmspkYqrj4D/8kxdN3relk=
203-
github.com/gptscript-ai/chat-completion-client v0.0.0-20240813051153-a440ada7e3c3 h1:EQiFTZv+BnOWJX2B9XdF09fL2Zj7h19n1l23TpWCafc=
204-
github.com/gptscript-ai/chat-completion-client v0.0.0-20240813051153-a440ada7e3c3/go.mod h1:7P/o6/IWa1KqsntVf68hSnLKuu3+xuqm6lYhch1w4jo=
203+
github.com/gptscript-ai/chat-completion-client v0.0.0-20241104122544-5fe75f07c131 h1:y2FcmT4X8U606gUS0teX5+JWX9K/NclsLEhHiyrd+EU=
204+
github.com/gptscript-ai/chat-completion-client v0.0.0-20241104122544-5fe75f07c131/go.mod h1:7P/o6/IWa1KqsntVf68hSnLKuu3+xuqm6lYhch1w4jo=
205205
github.com/gptscript-ai/cmd v0.0.0-20240802230653-326b7baf6fcb h1:ky2J2CzBOskC7Jgm2VJAQi2x3p7FVGa+2/PcywkFJuc=
206206
github.com/gptscript-ai/cmd v0.0.0-20240802230653-326b7baf6fcb/go.mod h1:DJAo1xTht1LDkNYFNydVjTHd576TC7MlpsVRl3oloVw=
207207
github.com/gptscript-ai/go-gptscript v0.9.5-rc5.0.20240927213153-2af51434b93e h1:WpNae0NBx+Ri8RB3SxF8DhadDKU7h+jfWPQterDpbJA=

pkg/context/context.go

-11
Original file line numberDiff line numberDiff line change
@@ -46,14 +46,3 @@ func GetLogger(ctx context.Context) mvl.Logger {
4646

4747
return l
4848
}
49-
50-
type envKey struct{}
51-
52-
func WithEnv(ctx context.Context, env []string) context.Context {
53-
return context.WithValue(ctx, envKey{}, env)
54-
}
55-
56-
func GetEnv(ctx context.Context) []string {
57-
l, _ := ctx.Value(envKey{}).([]string)
58-
return l
59-
}

pkg/engine/engine.go

+2-3
Original file line numberDiff line numberDiff line change
@@ -8,14 +8,13 @@ import (
88
"sync"
99

1010
"github.com/gptscript-ai/gptscript/pkg/config"
11-
gcontext "github.com/gptscript-ai/gptscript/pkg/context"
1211
"github.com/gptscript-ai/gptscript/pkg/counter"
1312
"github.com/gptscript-ai/gptscript/pkg/types"
1413
"github.com/gptscript-ai/gptscript/pkg/version"
1514
)
1615

1716
type Model interface {
18-
Call(ctx context.Context, messageRequest types.CompletionRequest, status chan<- types.CompletionStatus) (*types.CompletionMessage, error)
17+
Call(ctx context.Context, messageRequest types.CompletionRequest, env []string, status chan<- types.CompletionStatus) (*types.CompletionMessage, error)
1918
ProxyInfo() (string, string, error)
2019
}
2120

@@ -389,7 +388,7 @@ func (e *Engine) complete(ctx context.Context, state *State) (*Return, error) {
389388
}
390389
}()
391390

392-
resp, err := e.Model.Call(gcontext.WithEnv(ctx, e.Env), state.Completion, progress)
391+
resp, err := e.Model.Call(ctx, state.Completion, e.Env, progress)
393392
if err != nil {
394393
return nil, err
395394
}

pkg/llm/proxy.go

+2-2
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,7 @@ func (r *Registry) ServeHTTP(w http.ResponseWriter, req *http.Request) {
5454

5555
var (
5656
model string
57-
data = map[string]any{}
57+
data map[string]any
5858
)
5959

6060
if json.Unmarshal(inBytes, &data) == nil {
@@ -65,7 +65,7 @@ func (r *Registry) ServeHTTP(w http.ResponseWriter, req *http.Request) {
6565
model = builtin.GetDefaultModel()
6666
}
6767

68-
c, err := r.getClient(req.Context(), model)
68+
c, err := r.getClient(req.Context(), model, nil)
6969
if err != nil {
7070
http.Error(w, err.Error(), http.StatusInternalServerError)
7171
return

pkg/llm/registry.go

+8-8
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ import (
1515
)
1616

1717
type Client interface {
18-
Call(ctx context.Context, messageRequest types.CompletionRequest, status chan<- types.CompletionStatus) (*types.CompletionMessage, error)
18+
Call(ctx context.Context, messageRequest types.CompletionRequest, env []string, status chan<- types.CompletionStatus) (*types.CompletionMessage, error)
1919
ListModels(ctx context.Context, providers ...string) (result []string, _ error)
2020
Supports(ctx context.Context, modelName string) (bool, error)
2121
}
@@ -78,7 +78,7 @@ func (r *Registry) fastPath(modelName string) Client {
7878
return r.clients[0]
7979
}
8080

81-
func (r *Registry) getClient(ctx context.Context, modelName string) (Client, error) {
81+
func (r *Registry) getClient(ctx context.Context, modelName string, env []string) (Client, error) {
8282
if c := r.fastPath(modelName); c != nil {
8383
return c, nil
8484
}
@@ -101,7 +101,7 @@ func (r *Registry) getClient(ctx context.Context, modelName string) (Client, err
101101

102102
if len(errs) > 0 && oaiClient != nil {
103103
// Prompt the user to enter their OpenAI API key and try again.
104-
if err := oaiClient.RetrieveAPIKey(ctx); err != nil {
104+
if err := oaiClient.RetrieveAPIKey(ctx, env); err != nil {
105105
return nil, err
106106
}
107107
ok, err := oaiClient.Supports(ctx, modelName)
@@ -119,13 +119,13 @@ func (r *Registry) getClient(ctx context.Context, modelName string) (Client, err
119119
return nil, errors.Join(errs...)
120120
}
121121

122-
func (r *Registry) Call(ctx context.Context, messageRequest types.CompletionRequest, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
122+
func (r *Registry) Call(ctx context.Context, messageRequest types.CompletionRequest, env []string, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
123123
if messageRequest.Model == "" {
124124
return nil, fmt.Errorf("model is required")
125125
}
126126

127127
if c := r.fastPath(messageRequest.Model); c != nil {
128-
return c.Call(ctx, messageRequest, status)
128+
return c.Call(ctx, messageRequest, env, status)
129129
}
130130

131131
var errs []error
@@ -140,20 +140,20 @@ func (r *Registry) Call(ctx context.Context, messageRequest types.CompletionRequ
140140

141141
errs = append(errs, err)
142142
} else if ok {
143-
return client.Call(ctx, messageRequest, status)
143+
return client.Call(ctx, messageRequest, env, status)
144144
}
145145
}
146146

147147
if len(errs) > 0 && oaiClient != nil {
148148
// Prompt the user to enter their OpenAI API key and try again.
149-
if err := oaiClient.RetrieveAPIKey(ctx); err != nil {
149+
if err := oaiClient.RetrieveAPIKey(ctx, env); err != nil {
150150
return nil, err
151151
}
152152
ok, err := oaiClient.Supports(ctx, messageRequest.Model)
153153
if err != nil {
154154
return nil, err
155155
} else if ok {
156-
return oaiClient.Call(ctx, messageRequest, status)
156+
return oaiClient.Call(ctx, messageRequest, env, status)
157157
}
158158
}
159159

pkg/openai/client.go

+27-12
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@ import (
1313

1414
openai "github.com/gptscript-ai/chat-completion-client"
1515
"github.com/gptscript-ai/gptscript/pkg/cache"
16-
gcontext "github.com/gptscript-ai/gptscript/pkg/context"
1716
"github.com/gptscript-ai/gptscript/pkg/counter"
1817
"github.com/gptscript-ai/gptscript/pkg/credentials"
1918
"github.com/gptscript-ai/gptscript/pkg/hash"
@@ -303,9 +302,9 @@ func toMessages(request types.CompletionRequest, compat bool) (result []openai.C
303302
return
304303
}
305304

306-
func (c *Client) Call(ctx context.Context, messageRequest types.CompletionRequest, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
305+
func (c *Client) Call(ctx context.Context, messageRequest types.CompletionRequest, env []string, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
307306
if err := c.ValidAuth(); err != nil {
308-
if err := c.RetrieveAPIKey(ctx); err != nil {
307+
if err := c.RetrieveAPIKey(ctx, env); err != nil {
309308
return nil, err
310309
}
311310
}
@@ -401,15 +400,15 @@ func (c *Client) Call(ctx context.Context, messageRequest types.CompletionReques
401400
if err != nil {
402401
return nil, err
403402
} else if !ok {
404-
result, err = c.call(ctx, request, id, status)
403+
result, err = c.call(ctx, request, id, env, status)
405404

406405
// If we got back a context length exceeded error, keep retrying and shrinking the message history until we pass.
407406
var apiError *openai.APIError
408407
if errors.As(err, &apiError) && apiError.Code == "context_length_exceeded" && messageRequest.Chat {
409408
// Decrease maxTokens by 10% to make garbage collection more aggressive.
410409
// The retry loop will further decrease maxTokens if needed.
411410
maxTokens := decreaseTenPercent(messageRequest.MaxTokens)
412-
result, err = c.contextLimitRetryLoop(ctx, request, id, maxTokens, status)
411+
result, err = c.contextLimitRetryLoop(ctx, request, id, env, maxTokens, status)
413412
}
414413
if err != nil {
415414
return nil, err
@@ -443,7 +442,7 @@ func (c *Client) Call(ctx context.Context, messageRequest types.CompletionReques
443442
return &result, nil
444443
}
445444

446-
func (c *Client) contextLimitRetryLoop(ctx context.Context, request openai.ChatCompletionRequest, id string, maxTokens int, status chan<- types.CompletionStatus) (types.CompletionMessage, error) {
445+
func (c *Client) contextLimitRetryLoop(ctx context.Context, request openai.ChatCompletionRequest, id string, env []string, maxTokens int, status chan<- types.CompletionStatus) (types.CompletionMessage, error) {
447446
var (
448447
response types.CompletionMessage
449448
err error
@@ -452,7 +451,7 @@ func (c *Client) contextLimitRetryLoop(ctx context.Context, request openai.ChatC
452451
for range 10 { // maximum 10 tries
453452
// Try to drop older messages again, with a decreased max tokens.
454453
request.Messages = dropMessagesOverCount(maxTokens, request.Messages)
455-
response, err = c.call(ctx, request, id, status)
454+
response, err = c.call(ctx, request, id, env, status)
456455
if err == nil {
457456
return response, nil
458457
}
@@ -542,7 +541,7 @@ func override(left, right string) string {
542541
return left
543542
}
544543

545-
func (c *Client) call(ctx context.Context, request openai.ChatCompletionRequest, transactionID string, partial chan<- types.CompletionStatus) (types.CompletionMessage, error) {
544+
func (c *Client) call(ctx context.Context, request openai.ChatCompletionRequest, transactionID string, env []string, partial chan<- types.CompletionStatus) (types.CompletionMessage, error) {
546545
streamResponse := os.Getenv("GPTSCRIPT_INTERNAL_OPENAI_STREAMING") != "false"
547546

548547
partial <- types.CompletionStatus{
@@ -553,11 +552,27 @@ func (c *Client) call(ctx context.Context, request openai.ChatCompletionRequest,
553552
},
554553
}
555554

555+
var (
556+
headers map[string]string
557+
modelProviderEnv []string
558+
)
559+
for _, e := range env {
560+
if strings.HasPrefix(e, "GPTSCRIPT_MODEL_PROVIDER_") {
561+
modelProviderEnv = append(modelProviderEnv, e)
562+
}
563+
}
564+
565+
if len(modelProviderEnv) > 0 {
566+
headers = map[string]string{
567+
"X-GPTScript-Env": strings.Join(modelProviderEnv, ","),
568+
}
569+
}
570+
556571
slog.Debug("calling openai", "message", request.Messages)
557572

558573
if !streamResponse {
559574
request.StreamOptions = nil
560-
resp, err := c.c.CreateChatCompletion(ctx, request)
575+
resp, err := c.c.CreateChatCompletion(ctx, request, headers)
561576
if err != nil {
562577
return types.CompletionMessage{}, err
563578
}
@@ -582,7 +597,7 @@ func (c *Client) call(ctx context.Context, request openai.ChatCompletionRequest,
582597
}), nil
583598
}
584599

585-
stream, err := c.c.CreateChatCompletionStream(ctx, request)
600+
stream, err := c.c.CreateChatCompletionStream(ctx, request, headers)
586601
if err != nil {
587602
return types.CompletionMessage{}, err
588603
}
@@ -614,8 +629,8 @@ func (c *Client) call(ctx context.Context, request openai.ChatCompletionRequest,
614629
}
615630
}
616631

617-
func (c *Client) RetrieveAPIKey(ctx context.Context) error {
618-
k, err := prompt.GetModelProviderCredential(ctx, c.credStore, BuiltinCredName, "OPENAI_API_KEY", "Please provide your OpenAI API key:", gcontext.GetEnv(ctx))
632+
func (c *Client) RetrieveAPIKey(ctx context.Context, env []string) error {
633+
k, err := prompt.GetModelProviderCredential(ctx, c.credStore, BuiltinCredName, "OPENAI_API_KEY", "Please provide your OpenAI API key:", env)
619634
if err != nil {
620635
return err
621636
}

pkg/remote/remote.go

+9-10
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,6 @@ import (
1010
"sync"
1111

1212
"github.com/gptscript-ai/gptscript/pkg/cache"
13-
gcontext "github.com/gptscript-ai/gptscript/pkg/context"
1413
"github.com/gptscript-ai/gptscript/pkg/credentials"
1514
"github.com/gptscript-ai/gptscript/pkg/engine"
1615
env2 "github.com/gptscript-ai/gptscript/pkg/env"
@@ -42,13 +41,13 @@ func New(r *runner.Runner, envs []string, cache *cache.Client, credStore credent
4241
}
4342
}
4443

45-
func (c *Client) Call(ctx context.Context, messageRequest types.CompletionRequest, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
44+
func (c *Client) Call(ctx context.Context, messageRequest types.CompletionRequest, env []string, status chan<- types.CompletionStatus) (*types.CompletionMessage, error) {
4645
_, provider := c.parseModel(messageRequest.Model)
4746
if provider == "" {
4847
return nil, fmt.Errorf("failed to find remote model %s", messageRequest.Model)
4948
}
5049

51-
client, err := c.load(ctx, provider)
50+
client, err := c.load(ctx, provider, env...)
5251
if err != nil {
5352
return nil, err
5453
}
@@ -60,7 +59,7 @@ func (c *Client) Call(ctx context.Context, messageRequest types.CompletionReques
6059
modelName = toolName
6160
}
6261
messageRequest.Model = modelName
63-
return client.Call(ctx, messageRequest, status)
62+
return client.Call(ctx, messageRequest, env, status)
6463
}
6564

6665
func (c *Client) ListModels(ctx context.Context, providers ...string) (result []string, _ error) {
@@ -111,7 +110,7 @@ func isHTTPURL(toolName string) bool {
111110
strings.HasPrefix(toolName, "https://")
112111
}
113112

114-
func (c *Client) clientFromURL(ctx context.Context, apiURL string) (*openai.Client, error) {
113+
func (c *Client) clientFromURL(ctx context.Context, apiURL string, envs []string) (*openai.Client, error) {
115114
parsed, err := url.Parse(apiURL)
116115
if err != nil {
117116
return nil, err
@@ -121,7 +120,7 @@ func (c *Client) clientFromURL(ctx context.Context, apiURL string) (*openai.Clie
121120

122121
if key == "" && !isLocalhost(apiURL) {
123122
var err error
124-
key, err = c.retrieveAPIKey(ctx, env, apiURL)
123+
key, err = c.retrieveAPIKey(ctx, env, apiURL, envs)
125124
if err != nil {
126125
return nil, err
127126
}
@@ -134,7 +133,7 @@ func (c *Client) clientFromURL(ctx context.Context, apiURL string) (*openai.Clie
134133
})
135134
}
136135

137-
func (c *Client) load(ctx context.Context, toolName string) (*openai.Client, error) {
136+
func (c *Client) load(ctx context.Context, toolName string, env ...string) (*openai.Client, error) {
138137
c.clientsLock.Lock()
139138
defer c.clientsLock.Unlock()
140139

@@ -144,7 +143,7 @@ func (c *Client) load(ctx context.Context, toolName string) (*openai.Client, err
144143
}
145144

146145
if isHTTPURL(toolName) {
147-
remoteClient, err := c.clientFromURL(ctx, toolName)
146+
remoteClient, err := c.clientFromURL(ctx, toolName, env)
148147
if err != nil {
149148
return nil, err
150149
}
@@ -183,8 +182,8 @@ func (c *Client) load(ctx context.Context, toolName string) (*openai.Client, err
183182
return oClient, nil
184183
}
185184

186-
func (c *Client) retrieveAPIKey(ctx context.Context, env, url string) (string, error) {
187-
return prompt.GetModelProviderCredential(ctx, c.credStore, url, env, fmt.Sprintf("Please provide your API key for %s", url), append(gcontext.GetEnv(ctx), c.envs...))
185+
func (c *Client) retrieveAPIKey(ctx context.Context, env, url string, envs []string) (string, error) {
186+
return prompt.GetModelProviderCredential(ctx, c.credStore, url, env, fmt.Sprintf("Please provide your API key for %s", url), append(envs, c.envs...))
188187
}
189188

190189
func isLocalhost(url string) bool {

pkg/runner/output.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -84,7 +84,7 @@ func (r *Runner) handleOutput(callCtx engine.Context, monitor Monitor, env []str
8484
if err != nil {
8585
return nil, fmt.Errorf("marshaling input for output filter: %w", err)
8686
}
87-
res, err := r.subCall(callCtx.Ctx, callCtx, monitor, env, outputToolRef.ToolID, string(inputData), "", engine.OutputToolCategory)
87+
res, err := r.subCall(callCtx.Ctx, callCtx, monitor, env, outputToolRef.ToolID, inputData, "", engine.OutputToolCategory)
8888
if err != nil {
8989
return nil, err
9090
}

pkg/tests/judge/judge.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -112,7 +112,7 @@ func (j *Judge[T]) Equal(ctx context.Context, expected, actual T, criteria strin
112112
},
113113
},
114114
}
115-
response, err := j.client.CreateChatCompletion(ctx, request)
115+
response, err := j.client.CreateChatCompletion(ctx, request, nil)
116116
if err != nil {
117117
return false, "", fmt.Errorf("failed to create chat completion request: %w", err)
118118
}

pkg/tests/tester/runner.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ func (c *Client) ProxyInfo() (string, string, error) {
3535
return "test-auth", "test-url", nil
3636
}
3737

38-
func (c *Client) Call(_ context.Context, messageRequest types.CompletionRequest, _ chan<- types.CompletionStatus) (resp *types.CompletionMessage, respErr error) {
38+
func (c *Client) Call(_ context.Context, messageRequest types.CompletionRequest, _ []string, _ chan<- types.CompletionStatus) (resp *types.CompletionMessage, respErr error) {
3939
msgData, err := json.MarshalIndent(messageRequest, "", " ")
4040
require.NoError(c.t, err)
4141

0 commit comments

Comments
 (0)