Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

changing schema naming #100

Merged
merged 23 commits into from
Jan 18, 2025
Merged
Show file tree
Hide file tree
Changes from 22 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@ out/
.terraform
.idea
*for_tests.yaml
.idea/
mathetake marked this conversation as resolved.
Show resolved Hide resolved
yuzisun marked this conversation as resolved.
Show resolved Hide resolved

# Files and directories to ignore in the site directory
# dependencies
Expand Down
12 changes: 6 additions & 6 deletions api/v1alpha1/api.go
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@ import (
// This serves as a way to define a "unified" AI API for a Gateway which allows downstream
// clients to use a single schema API to interact with multiple AI backends.
//
// The inputSchema field is used to determine the structure of the requests that the Gateway will
// The schema field is used to determine the structure of the requests that the Gateway will
// receive. And then the Gateway will route the traffic to the appropriate AIServiceBackend based
// on the output schema of the AIServiceBackend while doing the other necessary jobs like
// upstream authentication, rate limit, etc.
Expand Down Expand Up @@ -52,8 +52,8 @@ type AIGatewayRouteSpec struct {
// Currently, the only supported schema is OpenAI as the input schema.
//
// +kubebuilder:validation:Required
// +kubebuilder:validation:XValidation:rule="self.schema == 'OpenAI'"
APISchema VersionedAPISchema `json:"inputSchema"`
// +kubebuilder:validation:XValidation:rule="self.name == 'OpenAI'"
APISchema VersionedAPISchema `json:"schema"`
// Rules is the list of AIGatewayRouteRule that this AIGatewayRoute will match the traffic to.
// Each rule is a subset of the HTTPRoute in the Gateway API (https://gateway-api.sigs.k8s.io/api-types/httproute/).
//
Expand Down Expand Up @@ -215,7 +215,7 @@ type AIServiceBackendSpec struct {
// This is required to be set.
//
// +kubebuilder:validation:Required
APISchema VersionedAPISchema `json:"outputSchema"`
APISchema VersionedAPISchema `json:"schema"`
// BackendRef is the reference to the Backend resource that this AIServiceBackend corresponds to.
//
// A backend can be of either k8s Service or Backend resource of Envoy Gateway.
Expand All @@ -240,10 +240,10 @@ type AIServiceBackendSpec struct {
// Note that this is vendor specific, and the stability of the API schema is not guaranteed by
// the ai-gateway, but by the vendor via proper versioning.
type VersionedAPISchema struct {
// Schema is the API schema of the AIGatewayRoute or AIServiceBackend.
// Name is the name of the API schema of the AIGatewayRoute or AIServiceBackend.
//
// +kubebuilder:validation:Enum=OpenAI;AWSBedrock
Schema APISchema `json:"schema"`
Name APISchema `json:"name"`

// Version is the version of the API schema.
Version string `json:"version,omitempty"`
Expand Down
40 changes: 20 additions & 20 deletions filterconfig/filterconfig.go
Original file line number Diff line number Diff line change
Expand Up @@ -19,8 +19,8 @@ import (
// DefaultConfig is the default configuration that can be used as a
// fallback when the configuration is not explicitly provided.
const DefaultConfig = `
inputSchema:
schema: OpenAI
schema:
name: OpenAI
selectedBackendHeaderKey: x-envoy-ai-gateway-selected-backend
modelNameHeaderKey: x-envoy-ai-gateway-model
`
Expand All @@ -29,8 +29,8 @@ modelNameHeaderKey: x-envoy-ai-gateway-model
//
// # Example configuration:
//
// inputSchema:
// schema: OpenAI
// schema:
// name: OpenAI
// selectedBackendHeaderKey: x-envoy-ai-gateway-selected-backend
// modelNameHeaderKey: x-envoy-ai-gateway-model
// tokenUsageMetadata:
Expand All @@ -40,19 +40,19 @@ modelNameHeaderKey: x-envoy-ai-gateway-model
// - backends:
// - name: kserve
// weight: 1
// outputSchema:
// schema: OpenAI
// schema:
// name: OpenAI
// - name: awsbedrock
// weight: 10
// outputSchema:
// schema: AWSBedrock
// schema:
// name: AWSBedrock
// headers:
// - name: x-envoy-ai-gateway-model
// value: llama3.3333
// - backends:
// - name: openai
// outputSchema:
// schema: OpenAI
// schema:
// name: OpenAI
// headers:
// - name: x-envoy-ai-gateway-model
// value: gpt4.4444
Expand All @@ -70,8 +70,8 @@ type Config struct {
// If this is provided, the filter will populate the usage token in the filter metadata at the end of the
// response body processing.
TokenUsageMetadata *TokenUsageMetadata `yaml:"tokenUsageMetadata,omitempty"`
// InputSchema specifies the API schema of the input format of requests to the filter.
InputSchema VersionedAPISchema `yaml:"inputSchema"`
// Schema specifies the API schema of the input format of requests to the filter.
Schema VersionedAPISchema `yaml:"schema"`
// ModelNameHeaderKey is the header key to be populated with the model name by the filter.
ModelNameHeaderKey string `yaml:"modelNameHeaderKey"`
// SelectedBackendHeaderKey is the header key to be populated with the backend name by the filter
Expand All @@ -96,18 +96,18 @@ type TokenUsageMetadata struct {

// VersionedAPISchema corresponds to LLMAPISchema in api/v1alpha1/api.go.
type VersionedAPISchema struct {
// Schema is the API schema.
Schema APISchema `yaml:"schema"`
// Name is the name of the API schema.
Name APISchemaName `yaml:"name"`
// Version is the version of the API schema. Optional.
Version string `yaml:"version,omitempty"`
}

// APISchema corresponds to APISchema in api/v1alpha1/api.go.
type APISchema string
// APISchemaName corresponds to APISchemaName in api/v1alpha1/api.go.
type APISchemaName string
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Given that the values are provider names, wouldn't APISchemaProviderName be more suitable than APISchemaName?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I dont have a big preference, open for discussion on this


const (
APISchemaOpenAI APISchema = "OpenAI"
APISchemaAWSBedrock APISchema = "AWSBedrock"
APISchemaOpenAI APISchemaName = "OpenAI"
APISchemaAWSBedrock APISchemaName = "AWSBedrock"
)

// HeaderMatch is an alias for HTTPHeaderMatch of the Gateway API.
Expand All @@ -130,8 +130,8 @@ type Backend struct {
// Name of the backend, which is the value in the final routing decision
// matching the header key specified in the [Config.BackendRoutingHeaderKey].
Name string `yaml:"name"`
// OutputSchema specifies the API schema of the output format of requests from.
OutputSchema VersionedAPISchema `yaml:"outputSchema"`
// Schema specifies the API schema of the output format of requests from.
Schema VersionedAPISchema `yaml:"schema"`
// Weight is the weight of the backend in the routing decision.
Weight int `yaml:"weight"`
// Auth is the authn/z configuration for the backend. Optional.
Expand Down
22 changes: 11 additions & 11 deletions filterconfig/filterconfig_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -29,8 +29,8 @@ func TestDefaultConfig(t *testing.T) {
func TestUnmarshalConfigYaml(t *testing.T) {
configPath := path.Join(t.TempDir(), "config.yaml")
const config = `
inputSchema:
schema: OpenAI
schema:
name: OpenAI
selectedBackendHeaderKey: x-envoy-ai-gateway-selected-backend
modelNameHeaderKey: x-envoy-ai-gateway-model
tokenUsageMetadata:
Expand All @@ -40,19 +40,19 @@ rules:
- backends:
- name: kserve
weight: 1
outputSchema:
schema: OpenAI
schema:
name: OpenAI
- name: awsbedrock
weight: 10
outputSchema:
schema: AWSBedrock
schema:
name: AWSBedrock
headers:
- name: x-envoy-ai-gateway-model
value: llama3.3333
- backends:
- name: openai
outputSchema:
schema: OpenAI
schema:
name: OpenAI
headers:
- name: x-envoy-ai-gateway-model
value: gpt4.4444
Expand All @@ -62,15 +62,15 @@ rules:
require.NoError(t, err)
require.Equal(t, "ai_gateway_llm_ns", cfg.TokenUsageMetadata.Namespace)
require.Equal(t, "token_usage_key", cfg.TokenUsageMetadata.Key)
require.Equal(t, "OpenAI", string(cfg.InputSchema.Schema))
require.Equal(t, "OpenAI", string(cfg.Schema.Name))
require.Equal(t, "x-envoy-ai-gateway-selected-backend", cfg.SelectedBackendHeaderKey)
require.Equal(t, "x-envoy-ai-gateway-model", cfg.ModelNameHeaderKey)
require.Len(t, cfg.Rules, 2)
require.Equal(t, "llama3.3333", cfg.Rules[0].Headers[0].Value)
require.Equal(t, "gpt4.4444", cfg.Rules[1].Headers[0].Value)
require.Equal(t, "kserve", cfg.Rules[0].Backends[0].Name)
require.Equal(t, 10, cfg.Rules[0].Backends[1].Weight)
require.Equal(t, "AWSBedrock", string(cfg.Rules[0].Backends[1].OutputSchema.Schema))
require.Equal(t, "AWSBedrock", string(cfg.Rules[0].Backends[1].Schema.Name))
require.Equal(t, "openai", cfg.Rules[1].Backends[0].Name)
require.Equal(t, "OpenAI", string(cfg.Rules[1].Backends[0].OutputSchema.Schema))
require.Equal(t, "OpenAI", string(cfg.Rules[1].Backends[0].Schema.Name))
}
2 changes: 1 addition & 1 deletion internal/apischema/awsbedrock/awsbedrock.go
Original file line number Diff line number Diff line change
Expand Up @@ -458,7 +458,7 @@ type ToolSpecification struct {
// The description for the tool.
Description *string `json:"description,omitempty"`

// The input schema for the tool in JSON format.
// The schema for the tool in JSON format.
//
// InputSchema is a required field
InputSchema *ToolInputSchema `json:"inputSchema"`
Expand Down
8 changes: 4 additions & 4 deletions internal/controller/sink.go
Original file line number Diff line number Diff line change
Expand Up @@ -165,8 +165,8 @@ func (c *configSink) updateExtProcConfigMap(aiGatewayRoute *aigv1a1.AIGatewayRou
ec := &filterconfig.Config{}
spec := &aiGatewayRoute.Spec

ec.InputSchema.Schema = filterconfig.APISchema(spec.APISchema.Schema)
ec.InputSchema.Version = spec.APISchema.Version
ec.Schema.Name = filterconfig.APISchemaName(spec.APISchema.Name)
ec.Schema.Version = spec.APISchema.Version
ec.ModelNameHeaderKey = aigv1a1.AIModelHeaderKey
ec.SelectedBackendHeaderKey = selectedBackendHeaderKey
ec.Rules = make([]filterconfig.RouteRule, len(spec.Rules))
Expand All @@ -180,8 +180,8 @@ func (c *configSink) updateExtProcConfigMap(aiGatewayRoute *aigv1a1.AIGatewayRou
if err != nil {
return fmt.Errorf("failed to get AIServiceBackend %s: %w", key, err)
} else {
ec.Rules[i].Backends[j].OutputSchema.Schema = filterconfig.APISchema(backendObj.Spec.APISchema.Schema)
ec.Rules[i].Backends[j].OutputSchema.Version = backendObj.Spec.APISchema.Version
ec.Rules[i].Backends[j].Schema.Name = filterconfig.APISchemaName(backendObj.Spec.APISchema.Name)
ec.Rules[i].Backends[j].Schema.Version = backendObj.Spec.APISchema.Version
}
}
ec.Rules[i].Headers = make([]filterconfig.HeaderMatch, len(rule.Matches))
Expand Down
10 changes: 5 additions & 5 deletions internal/controller/sink_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -60,7 +60,7 @@ func TestConfigSink_syncAIGatewayRoute(t *testing.T) {
BackendRefs: []aigv1a1.AIGatewayRouteRuleBackendRef{{Name: "apple", Weight: 1}, {Name: "orange", Weight: 1}},
},
},
APISchema: aigv1a1.VersionedAPISchema{Schema: aigv1a1.APISchemaOpenAI, Version: "v123"},
APISchema: aigv1a1.VersionedAPISchema{Name: aigv1a1.APISchemaOpenAI, Version: "v123"},
},
}
err := fakeClient.Create(context.Background(), route, &client.CreateOptions{})
Expand Down Expand Up @@ -216,7 +216,7 @@ func Test_updateExtProcConfigMap(t *testing.T) {
ObjectMeta: metav1.ObjectMeta{Name: "apple", Namespace: "ns"},
Spec: aigv1a1.AIServiceBackendSpec{
APISchema: aigv1a1.VersionedAPISchema{
Schema: aigv1a1.APISchemaAWSBedrock,
Name: aigv1a1.APISchemaAWSBedrock,
},
BackendRef: gwapiv1.BackendObjectReference{Name: "some-backend1", Namespace: ptr.To[gwapiv1.Namespace]("ns")},
},
Expand Down Expand Up @@ -249,7 +249,7 @@ func Test_updateExtProcConfigMap(t *testing.T) {
route: &aigv1a1.AIGatewayRoute{
ObjectMeta: metav1.ObjectMeta{Name: "myroute", Namespace: "ns"},
Spec: aigv1a1.AIGatewayRouteSpec{
APISchema: aigv1a1.VersionedAPISchema{Schema: aigv1a1.APISchemaOpenAI, Version: "v123"},
APISchema: aigv1a1.VersionedAPISchema{Name: aigv1a1.APISchemaOpenAI, Version: "v123"},
Rules: []aigv1a1.AIGatewayRouteRule{
{
BackendRefs: []aigv1a1.AIGatewayRouteRuleBackendRef{
Expand All @@ -270,13 +270,13 @@ func Test_updateExtProcConfigMap(t *testing.T) {
},
},
exp: &filterconfig.Config{
InputSchema: filterconfig.VersionedAPISchema{Schema: filterconfig.APISchemaOpenAI, Version: "v123"},
Schema: filterconfig.VersionedAPISchema{Name: filterconfig.APISchemaOpenAI, Version: "v123"},
ModelNameHeaderKey: aigv1a1.AIModelHeaderKey,
SelectedBackendHeaderKey: selectedBackendHeaderKey,
Rules: []filterconfig.RouteRule{
{
Backends: []filterconfig.Backend{
{Name: "apple.ns", Weight: 1, OutputSchema: filterconfig.VersionedAPISchema{Schema: filterconfig.APISchemaAWSBedrock}}, {Name: "pineapple.ns", Weight: 2},
{Name: "apple.ns", Weight: 1, Schema: filterconfig.VersionedAPISchema{Name: filterconfig.APISchemaAWSBedrock}}, {Name: "pineapple.ns", Weight: 2},
},
Headers: []filterconfig.HeaderMatch{{Name: aigv1a1.AIModelHeaderKey, Value: "some-ai"}},
},
Expand Down
2 changes: 1 addition & 1 deletion internal/extproc/mocks_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -108,7 +108,7 @@ type mockRouter struct {
// Calculate implements [router.Router.Calculate].
func (m mockRouter) Calculate(headers map[string]string) (*filterconfig.Backend, error) {
require.Equal(m.t, m.expHeaders, headers)
b := &filterconfig.Backend{Name: m.retBackendName, OutputSchema: m.retVersionedAPISchema}
b := &filterconfig.Backend{Name: m.retBackendName, Schema: m.retVersionedAPISchema}
return b, m.retErr
}

Expand Down
4 changes: 2 additions & 2 deletions internal/extproc/processor.go
Original file line number Diff line number Diff line change
Expand Up @@ -83,9 +83,9 @@ func (p *Processor) ProcessRequestBody(_ context.Context, rawBody *extprocv3.Htt
}
p.logger.Info("Selected backend", "backend", b.Name)

factory, ok := p.config.factories[b.OutputSchema]
factory, ok := p.config.factories[b.Schema]
if !ok {
return nil, fmt.Errorf("failed to find factory for output schema %q", b.OutputSchema)
return nil, fmt.Errorf("failed to find factory for output schema %q", b.Schema)
}

t, err := factory(path)
Expand Down
14 changes: 7 additions & 7 deletions internal/extproc/processor_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -96,7 +96,7 @@ func TestProcessor_ProcessRequestBody(t *testing.T) {
rbp := mockRequestBodyParser{t: t, retModelName: "some-model", expPath: "/foo"}
rt := mockRouter{
t: t, expHeaders: headers, retBackendName: "some-backend",
retVersionedAPISchema: filterconfig.VersionedAPISchema{Schema: "some-schema", Version: "v10.0"},
retVersionedAPISchema: filterconfig.VersionedAPISchema{Name: "some-schema", Version: "v10.0"},
}
p := &Processor{config: &processorConfig{
bodyParser: rbp.impl, router: rt,
Expand All @@ -110,13 +110,13 @@ func TestProcessor_ProcessRequestBody(t *testing.T) {
rbp := mockRequestBodyParser{t: t, retModelName: "some-model", expPath: "/foo"}
rt := mockRouter{
t: t, expHeaders: headers, retBackendName: "some-backend",
retVersionedAPISchema: filterconfig.VersionedAPISchema{Schema: "some-schema", Version: "v10.0"},
retVersionedAPISchema: filterconfig.VersionedAPISchema{Name: "some-schema", Version: "v10.0"},
}
factory := mockTranslatorFactory{t: t, retErr: errors.New("test error"), expPath: "/foo"}
p := &Processor{config: &processorConfig{
bodyParser: rbp.impl, router: rt,
factories: map[filterconfig.VersionedAPISchema]translator.Factory{
{Schema: "some-schema", Version: "v10.0"}: factory.impl,
{Name: "some-schema", Version: "v10.0"}: factory.impl,
},
}, requestHeaders: headers, logger: slog.Default()}
_, err := p.ProcessRequestBody(context.Background(), &extprocv3.HttpBody{})
Expand All @@ -127,13 +127,13 @@ func TestProcessor_ProcessRequestBody(t *testing.T) {
rbp := mockRequestBodyParser{t: t, retModelName: "some-model", expPath: "/foo"}
rt := mockRouter{
t: t, expHeaders: headers, retBackendName: "some-backend",
retVersionedAPISchema: filterconfig.VersionedAPISchema{Schema: "some-schema", Version: "v10.0"},
retVersionedAPISchema: filterconfig.VersionedAPISchema{Name: "some-schema", Version: "v10.0"},
}
factory := mockTranslatorFactory{t: t, retTranslator: mockTranslator{t: t, retErr: errors.New("test error")}, expPath: "/foo"}
p := &Processor{config: &processorConfig{
bodyParser: rbp.impl, router: rt,
factories: map[filterconfig.VersionedAPISchema]translator.Factory{
{Schema: "some-schema", Version: "v10.0"}: factory.impl,
{Name: "some-schema", Version: "v10.0"}: factory.impl,
},
}, requestHeaders: headers, logger: slog.Default()}
_, err := p.ProcessRequestBody(context.Background(), &extprocv3.HttpBody{})
Expand All @@ -145,7 +145,7 @@ func TestProcessor_ProcessRequestBody(t *testing.T) {
rbp := mockRequestBodyParser{t: t, retModelName: "some-model", expPath: "/foo", retRb: someBody}
rt := mockRouter{
t: t, expHeaders: headers, retBackendName: "some-backend",
retVersionedAPISchema: filterconfig.VersionedAPISchema{Schema: "some-schema", Version: "v10.0"},
retVersionedAPISchema: filterconfig.VersionedAPISchema{Name: "some-schema", Version: "v10.0"},
}
headerMut := &extprocv3.HeaderMutation{}
bodyMut := &extprocv3.BodyMutation{}
Expand All @@ -154,7 +154,7 @@ func TestProcessor_ProcessRequestBody(t *testing.T) {
p := &Processor{config: &processorConfig{
bodyParser: rbp.impl, router: rt,
factories: map[filterconfig.VersionedAPISchema]translator.Factory{
{Schema: "some-schema", Version: "v10.0"}: factory.impl,
{Name: "some-schema", Version: "v10.0"}: factory.impl,
},
selectedBackendHeaderKey: "x-ai-gateway-backend-key",
ModelNameHeaderKey: "x-ai-gateway-model-key",
Expand Down
6 changes: 3 additions & 3 deletions internal/extproc/router/request_body.go
Original file line number Diff line number Diff line change
Expand Up @@ -14,11 +14,11 @@ import (
type RequestBodyParser func(path string, body *extprocv3.HttpBody) (modelName string, rb RequestBody, err error)

// NewRequestBodyParser creates a new RequestBodyParser based on the schema.
func NewRequestBodyParser(inputSchema filterconfig.VersionedAPISchema) (RequestBodyParser, error) {
if inputSchema.Schema == filterconfig.APISchemaOpenAI {
func NewRequestBodyParser(schema filterconfig.VersionedAPISchema) (RequestBodyParser, error) {
if schema.Name == filterconfig.APISchemaOpenAI {
return openAIParseBody, nil
}
return nil, fmt.Errorf("unsupported API schema: %s", inputSchema)
return nil, fmt.Errorf("unsupported API schema: %s", schema)
}

// RequestBody is the union of all request body types.
Expand Down
4 changes: 2 additions & 2 deletions internal/extproc/router/request_body_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -13,12 +13,12 @@ import (

func TestNewRequestBodyParser(t *testing.T) {
t.Run("ok", func(t *testing.T) {
res, err := NewRequestBodyParser(filterconfig.VersionedAPISchema{Schema: filterconfig.APISchemaOpenAI})
res, err := NewRequestBodyParser(filterconfig.VersionedAPISchema{Name: filterconfig.APISchemaOpenAI})
require.NotNil(t, res)
require.NoError(t, err)
})
t.Run("error", func(t *testing.T) {
res, err := NewRequestBodyParser(filterconfig.VersionedAPISchema{Schema: "foo"})
res, err := NewRequestBodyParser(filterconfig.VersionedAPISchema{Name: "foo"})
require.Nil(t, res)
require.Error(t, err)
})
Expand Down
Loading
Loading