kgateway-dev
diff --git a/‎.github/actions/setup-kind-cluster/action.yaml‎
Lines changed: 5 additions & 0 deletions b/‎.github/actions/setup-kind-cluster/action.yaml‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎.github/workflows/e2e.yaml‎
Lines changed: 0 additions & 1 deletion b/‎.github/workflows/e2e.yaml‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎.github/workflows/nightly-tests.yaml‎
Lines changed: 51 additions & 0 deletions b/‎.github/workflows/nightly-tests.yaml‎
Lines changed: 51 additions & 0 deletions
diff --git a/‎design/12721.md‎
Lines changed: 145 additions & 0 deletions b/‎design/12721.md‎
Lines changed: 145 additions & 0 deletions
diff --git a/‎devel/testing/nightly-tests.md‎
Lines changed: 5 additions & 0 deletions b/‎devel/testing/nightly-tests.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎go.mod‎
Lines changed: 1 addition & 1 deletion b/‎go.mod‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎hack/utils/oss_compliance/osa_provided.md‎
Lines changed: 1 addition & 0 deletions b/‎hack/utils/oss_compliance/osa_provided.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎pkg/utils/cmdutils/local.go‎
Lines changed: 1 addition & 0 deletions b/‎pkg/utils/cmdutils/local.go‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎pkg/utils/helmutils/client.go‎
Lines changed: 4 additions & 1 deletion b/‎pkg/utils/helmutils/client.go‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎pkg/utils/kubeutils/kubectl/cli.go‎
Lines changed: 8 additions & 7 deletions b/‎pkg/utils/kubeutils/kubectl/cli.go‎
Lines changed: 8 additions & 7 deletions
@@ -19,6 +19,10 @@ inputs:
     required: false
     default: "" # If this is undefined the setup-kind script has its own default value
     description: The version of the gateway-api to use
+  gateway-api-channel:
+    required: false
+    default: "" # If this is undefined the setup-kind script has its own default value
+    description: The channel of the gateway-api to use
   localstack:
     required: false
     default: "false"
@@ -38,6 +42,7 @@ runs:
         CLUSTER_NODE_VERSION: ${{ inputs.kind-node-version }}
         ISTIO_VERSION: ${{ inputs.istio-version }}
         CONFORMANCE_VERSION: ${{ inputs.gateway-api-version }}
+        CONFORMANCE_CHANNEL: ${{ inputs.gateway-api-channel }}
         LOCALSTACK: ${{ inputs.localstack }}
         CONFORMANCE: true
       run: |
 
@@ -75,7 +75,6 @@ jobs:
         - cluster-name: 'agent-gateway-cluster'
           go-test-args: '-v -timeout=25m'
           go-test-run-regex: '^TestAgentgatewayIntegration'
-          agentgateway: 'true'
         # August 29, 2025: ~3 minutes
         - cluster-name: 'api-validation'
           go-test-args: '-v -timeout=10m'
 
@@ -22,6 +22,10 @@ on:
         description: "Run load testing suite"
         type: boolean
         default: false
+      run-e2e-tests:
+        description: "Run e2e tests"
+        type: boolean
+        default: false
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.ref_name }}
@@ -59,3 +63,50 @@ jobs:
       with:
         ref: main
     - uses: ./.github/actions/kube-gateway-api-load-tests
+
+  kgateway_e2e_tests_for_gateway_api_versions:
+    name: GwApi E2E
+    if: ${{ (github.event_name == 'workflow_dispatch' && inputs.run-e2e-tests) || github.event.schedule == '0 5 * * *' }}
+    runs-on: ubuntu-22.04
+    timeout-minutes: 120
+    strategy:
+      fail-fast: false
+      matrix:
+        gateway-api-version: [ { version: 'v1.4.0', channel: 'experimental' },
+                              { version: 'v1.4.0', channel: 'standard' },
+                              { version: 'v1.3.0', channel: 'experimental' },
+                              { version: 'v1.3.0', channel: 'standard' },
+                              { version: 'v1.2.1', channel: 'experimental' },
+                              { version: 'v1.2.1', channel: 'standard' }]
+    steps:
+    - uses: actions/checkout@v4
+    - name: Prep Go Runner
+      uses: ./.github/actions/prep-go-runner
+    - name: Dotenv Action
+      uses: falti/[email protected]
+      id: dotenv
+      with:
+        path: "./.github/workflows/.env/nightly-tests/max_versions.env"
+        log-variables: true
+    - name: Setup KinD Cluster
+      uses: ./.github/actions/setup-kind-cluster
+      with:
+        gateway-api-version: ${{ matrix.gateway-api-version.version }}
+        gateway-api-channel: ${{ matrix.gateway-api-version.channel }}
+        cluster-name: "kgw-api-e2e-${{ matrix.gateway-api-version.version }}-${{ matrix.gateway-api-version.channel }}"
+        kubectl-version: ${{ steps.dotenv.outputs.kubectl_version }}
+        istio-version: ${{ steps.dotenv.outputs.istio_version }}
+        kind-node-version: ${{ steps.dotenv.outputs.node_version }}
+    - id: run-tests
+      uses: ./.github/actions/kubernetes-e2e-tests
+      env:
+        VERSION: '1.0.0-ci1'
+        GITHUB_TOKEN: ${{ github.token }}
+        GO_TEST_RETRIES: '3' # Use a higher number of retries because there are so many tests and we don't want to rerun
+        GOTESTSUM_ARGS: '--format=standard-verbose --rerun-fails-max-failures 60' # High value for "rerun-fails-max-failures" because 3 failed tests can result in gotestsum thinking there's 40+ failures
+      with:
+        cluster-name: "kgw-api-e2e-${{ matrix.gateway-api-version.version }}-${{ matrix.gateway-api-version.channel }}"
+        test-args: '-v -timeout=120m'
+        run-regex: "^Test"
+        istio-version: ${{ steps.dotenv.outputs.istio_version }}
+        matrix-label: "nightly-kgw-api-${{ matrix.gateway-api-version.version }}-${{ matrix.gateway-api-version.channel }}"
@@ -0,0 +1,145 @@
+# EP-12721: E2e testing with Gateway API Versions
+
+
+* Issue: [12721](https://github.com/kgateway-dev/kgateway/issues/12721)
+
+
+## Background
+The current e2e tests assume the latest supported experimental version of the `gateway.networking.k8s.io` APIs is installed. This will not always be the case in the environments in which kgateway is deployed. In order to validate functionality across a wider range of environments, we will allow testing with different versions of the Gateway API.
+
+In addition to different semver designated versions of the API, there are two channels, `standard` and `experimental`.
+
+
+### Differences in API versions
+* v0.3.0
+  * TCPRoute, TLSRoute, and the unused UDPRoute added to experimental (not available in standard as of v1.4.0)
+* v1.1.0
+  * SessionPersistence for HTTPRoute rules added to experimental (not available in standard as of v1.4.0)
+* v1.2.0
+  * HTTPRoutes.spec.rules[].name added in experimental (promoted to standard in v1.4.0)
+* v1.3.0
+  * XListenerSets added to experimental (not available in standard as of v1.4.0, planned for v1.5.0)
+  * CORS filters added to experimental (not available in standard as of v1.4.0)
+* v1.4.0
+  * BackendTLSPolicy promoted to v1 in standard and experimental. Previous v1alpha3 version is not supported.
+  * HTTPRoutes.spec.rules[].name added to standard
+
+There are a substantial number of tests that need to be modified to account for these differences.
+
+
+## Motivation
+Better test coverage and understanding of how kgateway works with different Gateway API versions
+
+## Goals
+* E2E tests can be run locally or in CI with different versions (semver and channel) of the Gateway API
+* Consistent approach to managing resources for different versions of the API
+
+## Non-Goals
+* Mass update of existing tests to use the BaseTestingSuite
+  * Suites that don't use the BaseTestingSuite will continue to run all tests for any GatewayAPI version
+  * Tests that need to implement version-dependent behavior will be migrated to BaseTestingSuite as needed
+* Running tests in CRC/Openshift
+* Updating application code to support earlier versions
+
+
+## Implementation Details
+### Determining the Gateway API version
+The Gateway API CRDs contain two relevant annotations:
+* `gateway.networking.k8s.io/bundle-version` - the API version, for example `gateway.networking.k8s.io/bundle-version: v1.2.0`
+* `gateway.networking.k8s.io/channel` - the API channel, standard or experimental, for example `gateway.networking.k8s.io/channel: standard`
+
+These annotations can be examined to determine the version. If the annotations are not present, this should be considered a fatal error.
+
+### Test cases
+The e2e tests are built up of [TestCases](https://github.com/kgateway-dev/kgateway/blob/2b04f3d1465257d0c449687922ea6e92603b822c/test/kubernetes/e2e/tests/base/base_suite.go#L33) that define the resources used for the tests.
+
+In order to allow test cases to run conditionally based on the API version, we will add new fields, `MinGwApiVersion` and `MaxGwApiVersion` to the TestCase struct:
+
+```
+	// MinGwApiVersion specifies the minimum Gateway API version required per channel.
+	// Map key is the channel (GwApiChannelStandard or GwApiChannelExperimental), value is the minimum version.
+	// If the map is empty/nil, the test runs on any channel/version.
+	// The test will only run if the Gateway API version is >= the specified minimum version.
+	// For minimum requirements, if only experimental constraints exist, the test is considered experimental-only and will skip on standard channel.
+	// Matching logic based on installed channel:
+	//   - experimental: If experimental key exists, check version; otherwise run
+	//   - standard: If standard key exists, check version; if only experimental exists, skip; otherwise runs on any standard version.
+	MinGwApiVersion map[GwApiChannel]*GwApiVersion
+
+	// MaxGwApiVersion specifies the maximum Gateway API version required per channel.
+	// Map key is the channel (GwApiChannelStandard or GwApiChannelExperimental), value is the maximum version.
+	// If the map is empty/nil, the test runs on any channel/version.
+	// The test will only run if the Gateway API version is < the specified maximum version.
+	// Maximum constraints are channel-specific - experimental constraints don't affect standard channel execution.
+	// If the maximum version is less than the minimum version, the test will be skipped.
+	MaxGwApiVersion map[GwApiChannel]*GwApiVersion
+```
+
+`GwApiChannel` is a typed string with the value of `experimental` or `standard`, and `MinGwApiVersion` maps each channel to the minimum version of the API needed to run the test on that channel. If the current installation is not greater than or equal to the required version, the test will be skipped. If no `MinGwApiVersion` value is defined, the test will run on any version of the API. The exception to this logic is if the standard channel is installed and the `MinGwApiVersion` for the TestCase only defines an experimental minimum version, for example:
+
+```
+    MinGwApiVersion: map[base.GwApiChannel]*semver.Version{
+        base.GwApiChannelExperimental: base.GwApiV1_3_0,
+    },
+```
+
+This will be interpreted as "the test needs to use features available in experimental API v1.3.0 or later; these features are not yet available in the standard channel". In this case, the test will be skipped for all standard channel versions.
+
+`GwApiVersion` is a wrapper around the underlying semver packages used, and was created in order to allow test suites to use semver types without having to know about the underlying implementation.
+
+
+### Test Suites
+
+
+#### SetupByVersion
+A common pattern used in our e2e tests is to set up a Gateway and possibly other resources during suite setup and use them for every test. This pattern allows the tests to run faster, as time is not spent deploying and removing Gateways. In the [BaseTestingSuite](https://github.com/kgateway-dev/kgateway/blob/2b04f3d1465257d0c449687922ea6e92603b822c/test/kubernetes/e2e/tests/base/base_suite.go#L49C1-L66C2), these resources are defined by the [Setup](https://github.com/kgateway-dev/kgateway/blob/2b04f3d1465257d0c449687922ea6e92603b822c/test/kubernetes/e2e/tests/base/base_suite.go#L53) field.
+
+However, once we allow tests to run for different versions of the API, we are no longer in a "one configuration fits all" situation. For example, using ListenerSets requires `allowedListeners` to be defined on the Gateway, but this field will cause the resource to be rejected when using older versions of the API.
+
+To accommodate this, we will add a new field `SetupByVersion` to the BaseTestingSuite:
+```
+	// SetupByVersion allows defining different setup configurations for different GW API versions and channels.
+	// The outer map key is the channel (standard or experimental).
+	// The inner map key is the minimum version, and the value is the TestCase to use.
+	// The system will select the setup with the highest matching version for the current channel.
+	// If no setups match, falls back to the Setup field for backward compatibility.
+	// Example:
+	//   SetupByVersion: map[GwApiChannel]map[*semver.Version]*TestCase{
+	//     GwApiChannelExperimental: {
+	//       GwApiV1_3_0: &setupExperimentalV1_3,
+	//     },
+	//     GwApiChannelStandard: {
+	//       GwApiV1_3_0: &setupStandardV1_4,
+	//     },
+	//   }
+	SetupByVersion map[GwApiChannel]map[*semver.Version]*TestCase
+```
+
+When choosing which setup to use, the suite will use the highest defined semver for the channel that is less than or equal to the current version, falling back to the existing `Setup` if there is no such version.
+
+There are other data structures that could be used to store the setup information, but this approach was chosen because by making channel and version keys for the map, we guarantee that it will be unambiguous which setup to use.
+
+#### MinGwApiVersion
+
+`MinGwApiVersion` has also been added at the suite level to allow entire suites to be skipped.
+
+This is used for the cases where all the tests in a suite require configuration not available in all Gw API versions, and it was introduced because test suites apply their setup before running (or skipping) the individual test cases. In these cases, the suite may run its setup with resources incompatible with the installed version of the Gw API, and we would not want to restore those resources.
+
+### DevX
+* This approach requires no changes for tests and suites that aren't version sensitive
+* If a test needs to be skipped on certain versions, it can be configured on the test case
+* If a suite requires different setups/gateways based on version, once the setup is configured, additional test cases just need to be configured with the versions they run on.
+
+
+### Test Plan
+Successful runs of a GitHub job across versions v1.2-1.4 in both channels.
+
+Tests and suites will be adapted to older versions in 2 ways:
+* If a test requires a feature (like XListenerSets or rule names in HTTPRoutes) that is not available in the installed Gw API version, that test will be skipped.
+* Some tests will fail because the suite setup or test resources have invalid config for a Gw API version, even though the test itself does not depend on that config. For example, a Gateway for the suite may be configured with `allowedListeners`, but only some tests use ListenerSets. In this case we will split the resources and use a combination of SetupByVersion and MinGwApiVersion to apply the appropriate config and run the appropriate tests for the Gw API version.
+
+## Alternatives
+Do not test other versions of the API.
+
+## Open Questions
+* Should we be able to set the minimum version at the suite level? For example, for the ListenerSet suite, where we know that no tests in the suite will run on older versions.
@@ -5,3 +5,8 @@ The following are run on a schedule via a [GitHub action](/.github/workflows/nig
 ## Gateway API conformance tests
 Kubernetes Gateway API conformance tests are run using the earliest and latest supported k8s versions.
 
+## Gateway Load Tests
+Kubernetes Gateway load tests are run using the earliest and latest supported k8s versions.
+
+## E2E tests with different Gateway API versions
+The entire e2e suite is run against a variety of Gateway API Versions and Channels.
@@ -183,7 +183,7 @@ require (
 	github.com/GoogleCloudPlatform/opentelemetry-operations-go/internal/resourcemapping v0.51.0 // indirect
 	github.com/MakeNowJust/heredoc v1.0.0 // indirect
 	github.com/Masterminds/goutils v1.1.1 // indirect
-	github.com/Masterminds/semver/v3 v3.4.0 // indirect
+	github.com/Masterminds/semver/v3 v3.4.0
 	github.com/Masterminds/sprig/v3 v3.3.0 // indirect
 	github.com/Masterminds/squirrel v1.5.4 // indirect
 	github.com/Microsoft/go-winio v0.6.2 // indirect
 
@@ -1,6 +1,7 @@
 Name|Version|License
 ---|---|---
 [cel.dev/expr](https://cel.dev/expr)|v0.24.0|Apache License 2.0
+[semver/v3](https://github.com/Masterminds/semver)|v3.4.0|MIT License
 [agentgateway/agentgateway](https://github.com/agentgateway/agentgateway)|v0.10.6-0.20251103234311-2f71d0e845d0|Apache License 2.0
 [anthropics/anthropic-sdk-go](https://github.com/anthropics/anthropic-sdk-go)|v1.13.0|MIT License
 [retry-go/v4](https://github.com/avast/retry-go)|v4.3.3|MIT License
 
@@ -81,6 +81,7 @@ func (cmd *LocalCmd) WithStderr(w io.Writer) Cmd {
 // Run runs the command
 // If the returned error is non-nil, it should be of type *RunError
 func (cmd *LocalCmd) Run() *RunError {
+	// Combined output is used to capture the stdout and stderr of the command for logging
 	var combinedOutput threadsafe.Buffer
 
 	if printCommands {
 
@@ -5,6 +5,7 @@ import (
 	"io"
 
 	"github.com/kgateway-dev/kgateway/v2/pkg/utils/cmdutils"
+	"github.com/kgateway-dev/kgateway/v2/pkg/utils/threadsafe"
 )
 
 // Client is a utility for executing `helm` commands
@@ -26,8 +27,10 @@ func NewClient() *Client {
 
 // WithReceiver sets the io.Writer that will be used by default for the stdout and stderr
 // of cmdutils.Cmd created by the Client
+// This modifies the value in place, so affects shared references to the Client and future commands run by the Client.
+// Wrap this in a threadsafe struct to avoid data races when wrapped in io.MultiWriter in cmdutils.
 func (c *Client) WithReceiver(receiver io.Writer) *Client {
-	c.receiver = receiver
+	c.receiver = &threadsafe.WriterWrapper{W: receiver}
 	return c
 }
 
 
@@ -16,6 +16,7 @@ import (
 	"github.com/kgateway-dev/kgateway/v2/pkg/utils/cmdutils"
 	"github.com/kgateway-dev/kgateway/v2/pkg/utils/kubeutils/portforward"
 	"github.com/kgateway-dev/kgateway/v2/pkg/utils/requestutils/curl"
+	"github.com/kgateway-dev/kgateway/v2/pkg/utils/threadsafe"
 )
 
 // Cli is a utility for executing `kubectl` commands
@@ -52,8 +53,10 @@ type CurlResponse struct {
 
 // WithReceiver sets the io.Writer that will be used by default for the stdout and stderr
 // of cmdutils.Cmd created by the Cli
+// This modifies the value in place, so affects shared references to the Cli and future commands run by the Cli.
+// Wrap this in a threadsafe struct to avoid data races when wrapped in io.MultiWriter in cmdutils.
 func (c *Cli) WithReceiver(receiver io.Writer) *Cli {
-	c.receiver = receiver
+	c.receiver = &threadsafe.WriterWrapper{W: receiver}
 	return c
 }
 
@@ -355,14 +358,12 @@ func (c *Cli) Execute(ctx context.Context, args ...string) (string, string, erro
 		}
 	}
 
-	stdout := new(strings.Builder)
-	stderr := new(strings.Builder)
+	stdout := threadsafe.Buffer{}
+	stderr := threadsafe.Buffer{}
 
 	err := cmdutils.Command(ctx, "kubectl", args...).
-		// For convenience, we set the stdout and stderr to the receiver
-		// This can still be overwritten by consumers who use the commands
-		WithStdout(stdout).
-		WithStderr(stderr).Run().Cause()
+		WithStdout(&stdout).
+		WithStderr(&stderr).Run().Cause()
 
 	return stdout.String(), stderr.String(), err
 }