mirror of
https://github.com/coder/coder.git
synced 2026-06-02 20:48:20 +00:00
22109a54ad
## Description Cleans up how key pool errors are represented and how they get turned into HTTP responses. Consolidates two error types into a single type with a kind tag, and gives the response helpers in both providers consistent names. ## Changes - Replaced the keypool sentinel and transient error struct with one error type that carries a kind and a retry-after duration. - Updated `KeyFailoverConfig.BuildKeyPoolResponse` to take the typed key pool error, so each provider can shape the exhaustion response in its own format. - Removed the per-provider `MarkKey` callback from `KeyFailoverConfig` since providers can rely on the shared `MarkKeyOnStatus` helper. - Renamed the response-error helpers so OpenAI and Anthropic use the same naming. Related to: https://linear.app/codercom/issue/AIGOV-334/aibridge-follow-ups-from-key-failover-prs > [!NOTE] > Initially generated by Claude Opus 4.7, modified and reviewed by @ssncferreira
118 lines
3.3 KiB
Go
118 lines
3.3 KiB
Go
package keypool
|
|
|
|
import (
|
|
"bytes"
|
|
"io"
|
|
"net/http"
|
|
|
|
"cdr.dev/slog/v3"
|
|
"github.com/coder/coder/v2/aibridge/utils"
|
|
)
|
|
|
|
// KeyFailoverConfig is the per-provider configuration consumed by
|
|
// NewKeyFailoverTransport.
|
|
type KeyFailoverConfig struct {
|
|
// Pool is the key pool to walk. Nil disables key failover.
|
|
Pool *Pool
|
|
|
|
ProviderName string
|
|
Logger slog.Logger
|
|
|
|
// IsBYOK returns true when the request already carries
|
|
// user-supplied auth. BYOK requests skip key failover.
|
|
IsBYOK func(*http.Request) bool
|
|
|
|
// InjectAuthKey writes the key value into the outbound headers
|
|
// in the format the provider expects.
|
|
InjectAuthKey func(*http.Header, string)
|
|
|
|
// BuildKeyPoolResponse renders the response sent to the client
|
|
// when the walker has no more keys to try.
|
|
BuildKeyPoolResponse func(*Error) *http.Response
|
|
}
|
|
|
|
// keyFailoverTransport retries inner across the key pool on
|
|
// key-specific failures.
|
|
type keyFailoverTransport struct {
|
|
inner http.RoundTripper
|
|
config KeyFailoverConfig
|
|
}
|
|
|
|
// NewKeyFailoverTransport returns an http.RoundTripper backed by
|
|
// keyFailoverTransport. If config.Pool is nil, inner is returned
|
|
// unchanged.
|
|
func NewKeyFailoverTransport(inner http.RoundTripper, config KeyFailoverConfig) http.RoundTripper {
|
|
if config.Pool == nil {
|
|
return inner
|
|
}
|
|
return &keyFailoverTransport{
|
|
inner: inner,
|
|
config: config,
|
|
}
|
|
}
|
|
|
|
// RoundTrip is invoked by the proxy once per outer client request,
|
|
// after Rewrite has applied proxy headers.
|
|
//
|
|
// For centralized requests it walks the key pool, retrying on
|
|
// key-specific failures until one key succeeds or the pool is
|
|
// exhausted. BYOK requests skip the failover loop.
|
|
func (t *keyFailoverTransport) RoundTrip(req *http.Request) (*http.Response, error) {
|
|
if t.config.IsBYOK(req) {
|
|
return t.inner.RoundTrip(req)
|
|
}
|
|
|
|
// Buffer once so retries can replay the body.
|
|
body, err := bufferBody(req)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
// Fresh walker per request, independent of other inflight requests.
|
|
walker := t.config.Pool.Walker()
|
|
for {
|
|
key, keyPoolErr := walker.Next()
|
|
if keyPoolErr != nil {
|
|
resp := t.config.BuildKeyPoolResponse(keyPoolErr)
|
|
if resp == nil {
|
|
// Fallback if BuildKeyPoolResponse returns nil.
|
|
body := []byte(`{"error":"key pool unavailable"}`)
|
|
resp = utils.NewJSONErrorResponse(http.StatusBadGateway, 0, body)
|
|
}
|
|
return resp, nil
|
|
}
|
|
|
|
// Clone per attempt so the original request isn't mutated.
|
|
outReq := req.Clone(req.Context())
|
|
if body != nil {
|
|
outReq.Body = io.NopCloser(bytes.NewReader(body))
|
|
}
|
|
t.config.InjectAuthKey(&outReq.Header, key.Value())
|
|
|
|
resp, rtErr := t.inner.RoundTrip(outReq)
|
|
if rtErr != nil {
|
|
// Transport-level error, not a key issue.
|
|
return resp, rtErr
|
|
}
|
|
// MarkKeyOnStatus returns true on key-specific failures (e.g. 401/403/429).
|
|
if MarkKeyOnStatus(req.Context(), key, resp, t.config.Logger, t.config.ProviderName) {
|
|
// Drain and retry with the next key.
|
|
_, _ = io.Copy(io.Discard, resp.Body)
|
|
_ = resp.Body.Close()
|
|
continue
|
|
}
|
|
// Success or non-key error, forward as-is.
|
|
return resp, nil
|
|
}
|
|
}
|
|
|
|
// bufferBody reads the request body fully so it can be replayed
|
|
// across key-failover retries. Returns nil for a nil body.
|
|
func bufferBody(req *http.Request) ([]byte, error) {
|
|
if req.Body == nil {
|
|
return nil, nil
|
|
}
|
|
defer req.Body.Close()
|
|
return io.ReadAll(req.Body)
|
|
}
|