kubernetes-sigs · k8s-ci-robot · Jan 20, 2026 · Jan 16, 2026 · Jan 16, 2026 · Jan 16, 2026
diff --git a/api/v1/inferencepool_types.go b/api/v1/inferencepool_types.go
@@ -76,6 +76,7 @@ type InferencePoolSpec struct {
 	// +kubebuilder:validation:MinItems=1
 	// +kubebuilder:validation:MaxItems=8
 	// +kubebuilder:validation:XValidation:message="port number must be unique",rule="self.all(p1, self.exists_one(p2, p1.number==p2.number))"
+	// +kubebuilder:validation:XValidation:message="all ports must have the same AppProtocol",rule="self.all(p, (has(p.appProtocol) ? p.appProtocol : 'Unset') == (has(self[0].appProtocol) ? self[0].appProtocol : 'Unset'))"
 	// +listType=atomic
 	// +required
 	TargetPorts []Port `json:"targetPorts,omitempty"`
@@ -94,8 +95,34 @@ type Port struct {
 	//
 	// +required
 	Number PortNumber `json:"number,omitempty"`
+
+	// AppProtocol describes the application protocol for this port.
+	//
+	// If unspecified, the protocol defaults to HTTP/1.1.
+	//
+	// Supported values include:
+	// * "http": HTTP/1.1. This is the default.
+	// * "kubernetes.io/h2c": HTTP/2 over cleartext.
+	//
+	// +kubebuilder:validation:Enum=http;"kubernetes.io/h2c"
+	// +optional
+	AppProtocol AppProtocol `json:"appProtocol,omitempty"`
 }
 
+// AppProtocol names the application protocol used on a Port; the values declared here are the AppProtocol* constants.
+type AppProtocol string
+
+const (
+	// AppProtocolHTTP represents the HTTP/1.1 protocol, which is also what an unset AppProtocol defaults to.
+	// NOTE: TargetPorts validation compares raw values, so a list mixing unset and explicit "http" is rejected.
+	AppProtocolHTTP AppProtocol = "http"
+
+	// AppProtocolH2C represents HTTP/2 over cleartext (h2c).
+	// This protocol is typically used for gRPC workloads where TLS is terminated
+	// at the Gateway or not used within the cluster.
+	AppProtocolH2C AppProtocol = "kubernetes.io/h2c"
+)
+
 // EndpointPickerRef specifies a reference to an Endpoint Picker extension and its
 // associated configuration.
 // +kubebuilder:validation:XValidation:rule="self.kind != 'Service' || has(self.port)",message="port is required when kind is 'Service' or unspecified (defaults to 'Service')"
@@ -136,7 +163,7 @@ type EndpointPickerRef struct {
 	// resource or this field.
 	//
 	// +optional
-	Port *Port `json:"port,omitempty"`
+	Port *EndpointPickerPort `json:"port,omitempty"`
 
 	// FailureMode configures how the parent handles the case when the Endpoint Picker extension
 	// is non-responsive. When unspecified, defaults to "FailClose".
@@ -146,6 +173,15 @@ type EndpointPickerRef struct {
 	FailureMode EndpointPickerFailureMode `json:"failureMode,omitempty"`
 }
 
+// EndpointPickerPort defines the network port for the Endpoint Picker extension; unlike Port, it has no AppProtocol.
+type EndpointPickerPort struct {
+	// Number defines the port number of the Endpoint Picker service.
+	// The number must be in the range 1 to 65535.
+	//
+	// +required
+	Number PortNumber `json:"number,omitempty"`
+}
+
 // EndpointPickerFailureMode defines the options for how the parent handles the case when the
 // Endpoint Picker extension is non-responsive.
 //

diff --git a/api/v1/zz_generated.deepcopy.go b/api/v1/zz_generated.deepcopy.go
diff --git a/apix/v1alpha2/inferencepool_conversion.go b/apix/v1alpha2/inferencepool_conversion.go
@@ -254,7 +254,7 @@ func convertExtensionRefToV1(src *Extension) (v1.EndpointPickerRef, error) {
 	}
 	endpointPickerRef.Name = v1.ObjectName(src.Name)
 	if src.PortNumber != nil {
-		endpointPickerRef.Port = ptr.To(v1.Port{Number: v1.PortNumber(*src.PortNumber)})
+		endpointPickerRef.Port = ptr.To(v1.EndpointPickerPort{Number: v1.PortNumber(*src.PortNumber)})
 	}
 	if src.FailureMode != nil {
 		endpointPickerRef.FailureMode = v1.EndpointPickerFailureMode(*src.FailureMode)

diff --git a/apix/v1alpha2/inferencepool_conversion_test.go b/apix/v1alpha2/inferencepool_conversion_test.go
@@ -35,7 +35,7 @@ var (
 	v1Group       = v1.Group("my-group")
 	v1Kind        = v1.Kind("MyKind")
 	v1FailureMode = v1.EndpointPickerFailureMode("Deny")
-	v1Port        = v1.Port{Number: 9000}
+	v1Port        = v1.EndpointPickerPort{Number: 9000}
 )
 
 func TestInferencePoolConvertTo(t *testing.T) {

diff --git a/client-go/applyconfiguration/api/v1/endpointpickerport.go b/client-go/applyconfiguration/api/v1/endpointpickerport.go
diff --git a/client-go/applyconfiguration/api/v1/endpointpickerref.go b/client-go/applyconfiguration/api/v1/endpointpickerref.go
diff --git a/client-go/applyconfiguration/api/v1/port.go b/client-go/applyconfiguration/api/v1/port.go
diff --git a/client-go/applyconfiguration/utils.go b/client-go/applyconfiguration/utils.go
diff --git a/config/crd/bases/inference.networking.k8s.io_inferencepools.yaml b/config/crd/bases/inference.networking.k8s.io_inferencepools.yaml
@@ -99,7 +99,7 @@ spec:
                     properties:
                       number:
                         description: |-
-                          Number defines the port number to access the selected model server Pods.
+                          Number defines the port number of the Endpoint Picker service.
                           The number must be in the range 1 to 65535.
                         format: int32
                         maximum: 65535
@@ -162,6 +162,19 @@ spec:
                   description: Port defines the network port that will be exposed
                     by this InferencePool.
                   properties:
+                    appProtocol:
+                      description: |-
+                        AppProtocol describes the application protocol for this port.
+
+                        If unspecified, the protocol defaults to HTTP/1.1.
+
+                        Supported values include:
+                        * "http": HTTP/1.1. This is the default.
+                        * "kubernetes.io/h2c": HTTP/2 over cleartext.
+                      enum:
+                      - http
+                      - kubernetes.io/h2c
+                      type: string
                     number:
                       description: |-
                         Number defines the port number to access the selected model server Pods.
@@ -180,6 +193,9 @@ spec:
                 x-kubernetes-validations:
                 - message: port number must be unique
                   rule: self.all(p1, self.exists_one(p2, p1.number==p2.number))
+                - message: all ports must have the same AppProtocol
+                  rule: 'self.all(p, (has(p.appProtocol) ? p.appProtocol : ''Unset'')
+                    == (has(self[0].appProtocol) ? self[0].appProtocol : ''Unset''))'
             required:
             - endpointPickerRef
             - selector