diff --git a/.github/workflows/cluster_endtoend_vtgate_foreignkey_stress.yml b/.github/workflows/cluster_endtoend_vtgate_foreignkey_stress.yml new file mode 100644 index 00000000000..d44389d1497 --- /dev/null +++ b/.github/workflows/cluster_endtoend_vtgate_foreignkey_stress.yml @@ -0,0 +1,148 @@ +# DO NOT MODIFY: THIS FILE IS GENERATED USING "make generate_ci_workflows" + +name: Cluster (vtgate_foreignkey_stress) +on: [push, pull_request] +concurrency: + group: format('{0}-{1}', ${{ github.ref }}, 'Cluster (vtgate_foreignkey_stress)') + cancel-in-progress: true + +permissions: read-all + +env: + LAUNCHABLE_ORGANIZATION: "vitess" + LAUNCHABLE_WORKSPACE: "vitess-app" + GITHUB_PR_HEAD_SHA: "${{ github.event.pull_request.head.sha }}" + +jobs: + build: + name: Run endtoend tests on Cluster (vtgate_foreignkey_stress) + runs-on: gh-hosted-runners-4cores-1 + + steps: + - name: Skip CI + run: | + if [[ "${{contains( github.event.pull_request.labels.*.name, 'Skip CI')}}" == "true" ]]; then + echo "skipping CI due to the 'Skip CI' label" + exit 1 + fi + + - name: Check if workflow needs to be skipped + id: skip-workflow + run: | + skip='false' + if [[ "${{github.event.pull_request}}" == "" ]] && [[ "${{github.ref}}" != "refs/heads/main" ]] && [[ ! "${{github.ref}}" =~ ^refs/heads/release-[0-9]+\.[0-9]$ ]] && [[ ! 
"${{github.ref}}" =~ "refs/tags/.*" ]]; then + skip='true' + fi + echo Skip ${skip} + echo "skip-workflow=${skip}" >> $GITHUB_OUTPUT + + PR_DATA=$(curl \ + -H "Authorization: token ${{ secrets.GITHUB_TOKEN }}" \ + -H "Accept: application/vnd.github.v3+json" \ + "https://api.github.com/repos/${{ github.repository }}/pulls/${{ github.event.pull_request.number }}") + draft=$(echo "$PR_DATA" | jq .draft -r) + echo "is_draft=${draft}" >> $GITHUB_OUTPUT + + - name: Check out code + if: steps.skip-workflow.outputs.skip-workflow == 'false' + uses: actions/checkout@v3 + + - name: Check for changes in relevant files + if: steps.skip-workflow.outputs.skip-workflow == 'false' + uses: frouioui/paths-filter@main + id: changes + with: + token: '' + filters: | + end_to_end: + - 'go/**/*.go' + - 'test.go' + - 'Makefile' + - 'build.env' + - 'go.sum' + - 'go.mod' + - 'proto/*.proto' + - 'tools/**' + - 'config/**' + - 'bootstrap.sh' + - '.github/workflows/cluster_endtoend_vtgate_foreignkey_stress.yml' + + - name: Set up Go + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' + uses: actions/setup-go@v4 + with: + go-version: 1.21.0 + + - name: Set up python + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' + uses: actions/setup-python@v4 + + - name: Tune the OS + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' + run: | + # Limit local port range to not use ports that overlap with server side + # ports that we listen on. + sudo sysctl -w net.ipv4.ip_local_port_range="22768 65535" + # Increase the asynchronous non-blocking I/O. 
More information at https://dev.mysql.com/doc/refman/5.7/en/innodb-parameters.html#sysvar_innodb_use_native_aio + echo "fs.aio-max-nr = 1048576" | sudo tee -a /etc/sysctl.conf + sudo sysctl -p /etc/sysctl.conf + + - name: Get dependencies + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' + run: | + + # Get key to latest MySQL repo + sudo apt-key adv --keyserver keyserver.ubuntu.com --recv-keys 467B942D3A79BD29 + # Setup MySQL 8.0 + wget -c https://dev.mysql.com/get/mysql-apt-config_0.8.24-1_all.deb + echo mysql-apt-config mysql-apt-config/select-server select mysql-8.0 | sudo debconf-set-selections + sudo DEBIAN_FRONTEND="noninteractive" dpkg -i mysql-apt-config* + sudo apt-get update + # Install everything else we need, and configure + sudo apt-get install -y mysql-server mysql-client make unzip g++ etcd curl git wget eatmydata xz-utils libncurses5 + + sudo service mysql stop + sudo service etcd stop + sudo ln -s /etc/apparmor.d/usr.sbin.mysqld /etc/apparmor.d/disable/ + sudo apparmor_parser -R /etc/apparmor.d/usr.sbin.mysqld + go mod download + + # install JUnit report formatter + go install github.com/vitessio/go-junit-report@HEAD + + - name: Setup launchable dependencies + if: steps.skip-workflow.outputs.is_draft == 'false' && steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' && github.base_ref == 'main' + run: | + # Get Launchable CLI installed. If you can, make it a part of the builder image to speed things up + pip3 install --user launchable~=1.0 > /dev/null + + # verify that launchable setup is all correct. + launchable verify || true + + # Tell Launchable about the build you are producing and testing + launchable record build --name "$GITHUB_RUN_ID" --no-commit-collection --source . 
+ + - name: Run cluster endtoend test + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' + timeout-minutes: 45 + run: | + # We set the VTDATAROOT to the /tmp folder to reduce the file path of mysql.sock file + # which mustn't be more than 107 characters long. + export VTDATAROOT="/tmp/" + source build.env + + set -exo pipefail + + # run the tests however you normally do, then produce a JUnit XML file + eatmydata -- go run test.go -docker=false -follow -shard vtgate_foreignkey_stress | tee -a output.txt | go-junit-report -set-exit-code > report.xml + + - name: Print test output and Record test result in launchable if PR is not a draft + if: steps.skip-workflow.outputs.skip-workflow == 'false' && steps.changes.outputs.end_to_end == 'true' && always() + run: | + if [[ "${{steps.skip-workflow.outputs.is_draft}}" == "false" ]]; then + # send recorded tests to launchable + launchable record tests --build "$GITHUB_RUN_ID" go-test . || true + fi + + # print test output + cat output.txt diff --git a/go.mod b/go.mod index 639a22edc6b..88e09e70d22 100644 --- a/go.mod +++ b/go.mod @@ -107,6 +107,7 @@ require ( github.com/spf13/jwalterweatherman v1.1.0 github.com/xlab/treeprint v1.2.0 go.uber.org/goleak v1.2.1 + golang.org/x/exp v0.0.0-20230817173708-d852ddb80c63 golang.org/x/sync v0.3.0 modernc.org/sqlite v1.20.3 ) diff --git a/go.sum b/go.sum index ffadd6498b9..cb54903b2e9 100644 --- a/go.sum +++ b/go.sum @@ -677,6 +677,8 @@ golang.org/x/exp v0.0.0-20191227195350-da58074b4299/go.mod h1:2RIsYlXP63K8oxa1u0 golang.org/x/exp v0.0.0-20200119233911-0405dc783f0a/go.mod h1:2RIsYlXP63K8oxa1u096TMicItID8zy7Y6sNkU49FU4= golang.org/x/exp v0.0.0-20200207192155-f17229e696bd/go.mod h1:J/WKrq2StrnmMY6+EHIKF9dgMWnmCNThgcyBT1FY9mM= golang.org/x/exp v0.0.0-20200224162631-6cc2880d07d6/go.mod h1:3jZMyOhIsHpP37uCMkUooju7aAi5cS1Q23tOzKc+0MU= +golang.org/x/exp v0.0.0-20230817173708-d852ddb80c63 
h1:m64FZMko/V45gv0bNmrNYoDEq8U5YUhetc9cBWKS1TQ= +golang.org/x/exp v0.0.0-20230817173708-d852ddb80c63/go.mod h1:0v4NqG35kSWCMzLaMeX+IQrlSnVE/bqGSyC2cz/9Le8= golang.org/x/image v0.0.0-20190227222117-0694c2d4d067/go.mod h1:kZ7UVZpmo3dzQBMxlp+ypCbDeSB+sBbTgSJuh5dn5js= golang.org/x/image v0.0.0-20190802002840-cff245a6509b/go.mod h1:FeLwcggjj3mMvU+oOTbSwawSJRM1uh48EjtB4UJZlP0= golang.org/x/lint v0.0.0-20181026193005-c67002cb31c3/go.mod h1:UVdnD1Gm6xHRNCYTkRU2/jEulfH38KcIWyp/GAMgvoE= diff --git a/go/test/endtoend/cluster/cluster_util.go b/go/test/endtoend/cluster/cluster_util.go index 0e3cc2d0c95..1af9504389b 100644 --- a/go/test/endtoend/cluster/cluster_util.go +++ b/go/test/endtoend/cluster/cluster_util.go @@ -223,26 +223,53 @@ func filterResultWhenRunsForCoverage(input string) string { return result } +func ValidateReplicationIsHealthy(t *testing.T, tablet *Vttablet) bool { + query := "show replica status" + rs, err := tablet.VttabletProcess.QueryTablet(query, "", true) + assert.NoError(t, err) + row := rs.Named().Row() + require.NotNil(t, row) + + ioRunning := row.AsString("Replica_IO_Running", "") + require.NotEmpty(t, ioRunning) + ioHealthy := assert.Equalf(t, "Yes", ioRunning, "Replication is broken. Replication status: %v", row) + sqlRunning := row.AsString("Replica_SQL_Running", "") + require.NotEmpty(t, sqlRunning) + sqlHealthy := assert.Equalf(t, "Yes", sqlRunning, "Replication is broken. 
Replication status: %v", row) + + return ioHealthy && sqlHealthy +} + // WaitForReplicationPos will wait for replication position to catch-up -func WaitForReplicationPos(t *testing.T, tabletA *Vttablet, tabletB *Vttablet, hostname string, timeout float64) { +func WaitForReplicationPos(t *testing.T, tabletA *Vttablet, tabletB *Vttablet, validateReplication bool, timeout time.Duration) { + hostname := "localhost" + ctx, cancel := context.WithTimeout(context.Background(), timeout) + defer cancel() + ticker := time.NewTicker(10 * time.Millisecond) + defer ticker.Stop() + replicationPosA, _ := GetPrimaryPosition(t, *tabletA, hostname) for { + if validateReplication { + if !ValidateReplicationIsHealthy(t, tabletB) { + assert.FailNowf(t, "Replication broken on tablet %v. Will not wait for position", tabletB.Alias) + } + if t.Failed() { + return + } + } replicationPosB, _ := GetPrimaryPosition(t, *tabletB, hostname) if positionAtLeast(t, tabletA, replicationPosB, replicationPosA) { - break + return } msg := fmt.Sprintf("%s's replication position to catch up to %s's;currently at: %s, waiting to catch up to: %s", tabletB.Alias, tabletA.Alias, replicationPosB, replicationPosA) - waitStep(t, msg, timeout, 0.01) - } -} - -func waitStep(t *testing.T, msg string, timeout float64, sleepTime float64) float64 { - timeout = timeout - sleepTime - if timeout < 0.0 { - t.Errorf("timeout waiting for condition '%s'", msg) + select { + case <-ctx.Done(): + assert.FailNowf(t, "Timeout waiting for condition '%s'", msg) + return + case <-ticker.C: + } } - time.Sleep(time.Duration(sleepTime) * time.Second) - return timeout } func positionAtLeast(t *testing.T, tablet *Vttablet, a string, b string) bool { diff --git a/go/test/endtoend/onlineddl/vtgate_util.go b/go/test/endtoend/onlineddl/vtgate_util.go index ae214a644b6..3d99a2cef92 100644 --- a/go/test/endtoend/onlineddl/vtgate_util.go +++ b/go/test/endtoend/onlineddl/vtgate_util.go @@ -207,7 +207,7 @@ func CheckLaunchAllMigrations(t 
*testing.T, vtParams *mysql.ConnParams, expectCo } // CheckMigrationStatus verifies that the migration indicated by given UUID has the given expected status -func CheckMigrationStatus(t *testing.T, vtParams *mysql.ConnParams, shards []cluster.Shard, uuid string, expectStatuses ...schema.OnlineDDLStatus) { +func CheckMigrationStatus(t *testing.T, vtParams *mysql.ConnParams, shards []cluster.Shard, uuid string, expectStatuses ...schema.OnlineDDLStatus) bool { query, err := sqlparser.ParseAndBind("show vitess_migrations like %a", sqltypes.StringBindVariable(uuid), ) @@ -229,7 +229,7 @@ func CheckMigrationStatus(t *testing.T, vtParams *mysql.ConnParams, shards []clu } } } - assert.Equal(t, len(shards), count) + return assert.Equal(t, len(shards), count) } // WaitForMigrationStatus waits for a migration to reach either provided statuses (returns immediately), or eventually time out diff --git a/go/test/endtoend/tabletgateway/buffer/reparent/failover_buffer_test.go b/go/test/endtoend/tabletgateway/buffer/reparent/failover_buffer_test.go index ace652fc1d2..d3828eb8166 100644 --- a/go/test/endtoend/tabletgateway/buffer/reparent/failover_buffer_test.go +++ b/go/test/endtoend/tabletgateway/buffer/reparent/failover_buffer_test.go @@ -51,7 +51,7 @@ func failoverExternalReparenting(t *testing.T, clusterInstance *cluster.LocalPro primary.VttabletProcess.QueryTablet(demoteQuery, keyspaceUnshardedName, true) // Wait for replica to catch up to primary. - cluster.WaitForReplicationPos(t, primary, replica, "localhost", 60.0) + cluster.WaitForReplicationPos(t, primary, replica, false, time.Minute) duration := time.Since(start) minUnavailabilityInS := 1.0 diff --git a/go/test/endtoend/vtgate/foreignkey/stress/fk_stress_test.go b/go/test/endtoend/vtgate/foreignkey/stress/fk_stress_test.go new file mode 100644 index 00000000000..600961e6f0c --- /dev/null +++ b/go/test/endtoend/vtgate/foreignkey/stress/fk_stress_test.go @@ -0,0 +1,1131 @@ +/* +Copyright 2023 The Vitess Authors. 
+ +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +*/ + +package fkstress + +import ( + "context" + "flag" + "fmt" + "math/rand" + "os" + "path" + "strings" + "sync" + "sync/atomic" + "testing" + "time" + + "github.com/stretchr/testify/assert" + "github.com/stretchr/testify/require" + "golang.org/x/exp/slices" + + "vitess.io/vitess/go/mysql" + "vitess.io/vitess/go/mysql/sqlerror" + "vitess.io/vitess/go/sqltypes" + "vitess.io/vitess/go/test/endtoend/cluster" + "vitess.io/vitess/go/test/endtoend/onlineddl" + "vitess.io/vitess/go/test/endtoend/utils" + "vitess.io/vitess/go/textutil" + "vitess.io/vitess/go/vt/log" + "vitess.io/vitess/go/vt/schema" + "vitess.io/vitess/go/vt/sqlparser" +) + +// This endtoend test is designed to validate VTGate's FOREIGN KEY implementation for unsharded/single-sharded/shard-scope, meaning +// we expect foreign key constraints to be limited to a shard (related rows can never be on different shards). +// +// This test validates NO ACTION, CASCADE and SET NULL reference actions. +// VTGate's support for foreign keys includes: +// - Analyzing the foreign key constraints in a keyspace. +// - Rejecting INSERT statements for child table when there's no matching row on a parent table. +// - Handling DELETE and UPDATE statements on a parent table according to the reference action on all children. +// Specifically, this means for example that VTGate will handle an ON DELETE CASCADE in the Vitess plane. 
It will first delete rows +// from the child (recursive operation) before deleting the row on the parent. As a result, the underlying MySQL server will have +// nothing to cascade. +// +// The design of this test is as follows: +// - Create a cluster with PRIMARY and REPLICA tablets +// - Given this structure of tables with foreign key constraints: +// stress_parent +// +- stress_child +// +- stress_grandchild +// +- stress_child2 +// - Create these tables. Then, on the MySQL replica, remove the foreign key constraints. +// - Static test: +// - Randomly populate all tables via highly-contentious INSERT/UPDATE/DELETE statements +// - Validate collected metrics match actual table data +// - Validate foreign key constraints integrity +// - Workload test: +// - Initially populate tables as above +// - Run a high contention workload where multiple connections issue random INSERT/UPDATE/DELETE on all related tables +// - Validate collected metrics match actual table data +// - Validate foreign key constraints integrity on MySQL primary +// - Validate foreign key constraints integrity on MySQL replica +// - Compare data on primary & replica +// +// We of course know that foreign key integrity is maintained on the MySQL primary. However, the replica does not have the matching +// constraints. Since cascaded (SET NULL, CASCADE) writes are handled internally by InnoDB and not written to the binary log, +// any cascaded writes on the primary are lost, and the replica is unaware of those writes. Without VTGate intervention, we expect +// the replica to quickly diverge from the primary, and in fact in all likelihood replication will break very quickly. +// However, if VTGate implements the cascading rules correctly, the primary MySQL server will never have any actual cascades, and +// so cascaded writes are all accounted for in the binary logs, which means we can expect the replica to be compliant with the +// primary. 
+ +type WriteMetrics struct { + mu sync.Mutex + insertsAttempts, insertsFailures, insertsNoops, inserts int64 + updatesAttempts, updatesFailures, updatesNoops, updates int64 + deletesAttempts, deletesFailures, deletesNoops, deletes int64 + + insertsFKErrors, updatesFKErrors, deletesFKErrors int64 + sampleInsertFKError, sampleUpdateFKError, sampleDeleteFKError error +} + +func (w *WriteMetrics) Clear() { + w.mu.Lock() + defer w.mu.Unlock() + + w.inserts = 0 + w.updates = 0 + w.deletes = 0 + + w.insertsAttempts = 0 + w.insertsFailures = 0 + w.insertsNoops = 0 + + w.updatesAttempts = 0 + w.updatesFailures = 0 + w.updatesNoops = 0 + + w.deletesAttempts = 0 + w.deletesFailures = 0 + w.deletesNoops = 0 + + w.insertsFKErrors = 0 + w.updatesFKErrors = 0 + w.deletesFKErrors = 0 +} + +func (w *WriteMetrics) String() string { + return fmt.Sprintf(`WriteMetrics: inserts-deletes=%d, updates-deletes=%d, +insertsAttempts=%d, insertsFailures=%d, insertsNoops=%d, inserts=%d, +updatesAttempts=%d, updatesFailures=%d, updatesNoops=%d, updates=%d, +deletesAttempts=%d, deletesFailures=%d, deletesNoops=%d, deletes=%d, +`, + w.inserts-w.deletes, w.updates-w.deletes, + w.insertsAttempts, w.insertsFailures, w.insertsNoops, w.inserts, + w.updatesAttempts, w.updatesFailures, w.updatesNoops, w.updates, + w.deletesAttempts, w.deletesFailures, w.deletesNoops, w.deletes, + ) +} + +var ( + clusterInstance *cluster.LocalProcessCluster + shards []cluster.Shard + primary *cluster.Vttablet + replica *cluster.Vttablet + vtParams mysql.ConnParams + + onlineDDLStrategy = "vitess --unsafe-allow-foreign-keys --cut-over-threshold=15s" + hostname = "localhost" + keyspaceName = "ks" + cell = "zone1" + schemaChangeDirectory = "" + parentTableName = "stress_parent" + childTableName = "stress_child" + child2TableName = "stress_child2" + grandchildTableName = "stress_grandchild" + tableNames = []string{parentTableName, childTableName, child2TableName, grandchildTableName} + reverseTableNames []string + + seedOnce 
sync.Once + + referenceActionMap = map[sqlparser.ReferenceAction]string{ + sqlparser.NoAction: "NO ACTION", + sqlparser.Cascade: "CASCADE", + sqlparser.SetNull: "SET NULL", + } + referenceActions = []sqlparser.ReferenceAction{sqlparser.NoAction, sqlparser.SetNull, sqlparser.Cascade} + createStatements = []string{ + ` + CREATE TABLE stress_parent ( + id bigint not null, + parent_id bigint, + rand_val varchar(32) null default '', + hint_col varchar(64) not null default '', + created_timestamp timestamp not null default current_timestamp, + updates int unsigned not null default 0, + PRIMARY KEY (id), + key parent_id_idx(parent_id), + key created_idx(created_timestamp), + key updates_idx(updates) + ) ENGINE=InnoDB + `, + ` + CREATE TABLE stress_child ( + id bigint not null, + parent_id bigint, + rand_val varchar(32) null default '', + hint_col varchar(64) not null default '', + created_timestamp timestamp not null default current_timestamp, + updates int unsigned not null default 0, + PRIMARY KEY (id), + key parent_id_idx(parent_id), + key created_idx(created_timestamp), + key updates_idx(updates), + CONSTRAINT child_parent_fk FOREIGN KEY (parent_id) REFERENCES stress_parent (id) ON DELETE %s ON UPDATE %s + ) ENGINE=InnoDB + `, + ` + CREATE TABLE stress_child2 ( + id bigint not null, + parent_id bigint, + rand_val varchar(32) null default '', + hint_col varchar(64) not null default '', + created_timestamp timestamp not null default current_timestamp, + updates int unsigned not null default 0, + PRIMARY KEY (id), + key parent_id_idx(parent_id), + key created_idx(created_timestamp), + key updates_idx(updates), + CONSTRAINT child2_parent_fk FOREIGN KEY (parent_id) REFERENCES stress_parent (id) ON DELETE %s ON UPDATE %s + ) ENGINE=InnoDB + `, + ` + CREATE TABLE stress_grandchild ( + id bigint not null, + parent_id bigint, + rand_val varchar(32) null default '', + hint_col varchar(64) not null default '', + created_timestamp timestamp not null default current_timestamp, + 
updates int unsigned not null default 0, + PRIMARY KEY (id), + key parent_id_idx(parent_id), + key created_idx(created_timestamp), + key updates_idx(updates), + CONSTRAINT grandchild_child_fk FOREIGN KEY (parent_id) REFERENCES stress_child (id) ON DELETE %s ON UPDATE %s + ) ENGINE=InnoDB + `, + } + dropConstraintsStatements = []string{ + `ALTER TABLE stress_child DROP CONSTRAINT child_parent_fk`, + `ALTER TABLE stress_child2 DROP CONSTRAINT child2_parent_fk`, + `ALTER TABLE stress_grandchild DROP CONSTRAINT grandchild_child_fk`, + } + alterHintStatement = ` + ALTER TABLE %s modify hint_col varchar(64) not null default '%s' + ` + insertRowStatement = ` + INSERT IGNORE INTO %s (id, parent_id, rand_val) VALUES (%d, %d, left(md5(rand()), 8)) + ` + updateRowStatement = ` + UPDATE %s SET rand_val=left(md5(rand()), 8), updates=updates+1 WHERE id=%d + ` + updateRowIdStatement = ` + UPDATE %s SET id=%v, rand_val=left(md5(rand()), 8), updates=updates+1 WHERE id=%d + ` + deleteRowStatement = ` + DELETE FROM %s WHERE id=%d AND updates=1 + ` + // We use CAST(SUM(updates) AS SIGNED) because SUM() returns a DECIMAL datatype, and we want to read a SIGNED INTEGER type + selectCountRowsStatement = ` + SELECT COUNT(*) AS num_rows, CAST(SUM(updates) AS SIGNED) AS sum_updates FROM %s + ` + selectMatchingRowsChild = ` + select stress_child.id from stress_child join stress_parent on (stress_parent.id = stress_child.parent_id) + ` + selectMatchingRowsChild2 = ` + select stress_child2.id from stress_child2 join stress_parent on (stress_parent.id = stress_child2.parent_id) + ` + selectMatchingRowsGrandchild = ` + select stress_grandchild.id from stress_grandchild join stress_child on (stress_child.id = stress_grandchild.parent_id) + ` + selectOrphanedRowsChild = ` + select stress_child.id from stress_child left join stress_parent on (stress_parent.id = stress_child.parent_id) where stress_parent.id is null + ` + selectOrphanedRowsChild2 = ` + select stress_child2.id from stress_child2 left 
join stress_parent on (stress_parent.id = stress_child2.parent_id) where stress_parent.id is null + ` + selectOrphanedRowsGrandchild = ` + select stress_grandchild.id from stress_grandchild left join stress_child on (stress_child.id = stress_grandchild.parent_id) where stress_child.id is null + ` + deleteAllStatement = ` + DELETE FROM %s + ` + writeMetrics = map[string]*WriteMetrics{} +) + +const ( + maxTableRows = 4096 + workloadDuration = 5 * time.Second + migrationWaitTimeout = 60 * time.Second +) + +// The following variables are fit for a local, strong developer box. +// The test overrides these into more relaxed values if running on GITHUB_ACTIONS, +// seeing that GitHub CI is much weaker. +var ( + maxConcurrency = 10 + singleConnectionSleepInterval = 10 * time.Millisecond + countIterations = 3 +) + +func TestMain(m *testing.M) { + defer cluster.PanicHandler(nil) + flag.Parse() + + exitcode, err := func() (int, error) { + clusterInstance = cluster.NewCluster(cell, hostname) + schemaChangeDirectory = path.Join("/tmp", fmt.Sprintf("schema_change_dir_%d", clusterInstance.GetAndReserveTabletUID())) + defer os.RemoveAll(schemaChangeDirectory) + defer clusterInstance.Teardown() + + if _, err := os.Stat(schemaChangeDirectory); os.IsNotExist(err) { + _ = os.Mkdir(schemaChangeDirectory, 0700) + } + + clusterInstance.VtctldExtraArgs = []string{ + "--schema_change_dir", schemaChangeDirectory, + "--schema_change_controller", "local", + "--schema_change_check_interval", "1s", + } + + clusterInstance.VtTabletExtraArgs = []string{ + "--heartbeat_enable", + "--heartbeat_interval", "250ms", + "--heartbeat_on_demand_duration", "5s", + "--watch_replication_stream", + "--vreplication_tablet_type", "primary", + } + clusterInstance.VtGateExtraArgs = []string{} + + if err := clusterInstance.StartTopo(); err != nil { + return 1, err + } + + // Start keyspace + keyspace := &cluster.Keyspace{ + Name: keyspaceName, + VSchema: `{ + "sharded": false, + "foreignKeyMode": "FK_MANAGED" + 
}`, + } + + // We will use a replica to confirm that vtgate's cascading works correctly. + if err := clusterInstance.StartKeyspace(*keyspace, []string{"1"}, 1, false); err != nil { + return 1, err + } + + vtgateInstance := clusterInstance.NewVtgateInstance() + // Start vtgate + if err := vtgateInstance.Setup(); err != nil { + return 1, err + } + // ensure it is torn down during cluster TearDown + clusterInstance.VtgateProcess = *vtgateInstance + vtParams = mysql.ConnParams{ + Host: clusterInstance.Hostname, + Port: clusterInstance.VtgateMySQLPort, + } + + return m.Run(), nil + }() + if err != nil { + fmt.Printf("%v\n", err) + os.Exit(1) + } else { + os.Exit(exitcode) + } + +} + +func queryTablet(t *testing.T, tablet *cluster.Vttablet, query string, expectError string) *sqltypes.Result { + rs, err := tablet.VttabletProcess.QueryTablet(query, keyspaceName, true) + if expectError == "" { + assert.NoError(t, err) + } else { + assert.ErrorContains(t, err, expectError) + } + return rs +} + +func tabletTestName(t *testing.T, tablet *cluster.Vttablet) string { + switch tablet { + case primary: + return "primary" + case replica: + return "replica" + default: + assert.FailNowf(t, "unknown tablet", "%v, type=%v", tablet.Alias, tablet.Type) + } + return "" +} + +func waitForReplicaCatchup(t *testing.T) { + cluster.WaitForReplicationPos(t, primary, replica, true, time.Minute) +} + +func validateMetrics(t *testing.T, tcase *testCase) { + for _, workloadTable := range []string{parentTableName, childTableName, child2TableName, grandchildTableName} { + t.Run(workloadTable, func(t *testing.T) { + t.Run("fk errors", func(t *testing.T) { + testSelectTableFKErrors(t, workloadTable, tcase) + }) + var primaryRows, replicaRows int64 + t.Run(tabletTestName(t, primary), func(t *testing.T) { + primaryRows = testSelectTableMetrics(t, primary, workloadTable, tcase) + }) + t.Run(tabletTestName(t, replica), func(t *testing.T) { + replicaRows = testSelectTableMetrics(t, replica, workloadTable, 
tcase) + }) + t.Run("compare primary and replica", func(t *testing.T) { + assert.Equal(t, primaryRows, replicaRows) + }) + }) + } +} + +func TestInitialSetup(t *testing.T) { + shards = clusterInstance.Keyspaces[0].Shards + require.Equal(t, 1, len(shards)) + require.Equal(t, 2, len(shards[0].Vttablets)) + primary = shards[0].Vttablets[0] + require.NotNil(t, primary) + replica = shards[0].Vttablets[1] + require.NotNil(t, replica) + require.NotEqual(t, primary.Alias, replica.Alias) + + tableNames = []string{parentTableName, childTableName, child2TableName, grandchildTableName} + reverseTableNames = slices.Clone(tableNames) + slices.Reverse(reverseTableNames) + require.ElementsMatch(t, tableNames, reverseTableNames) + + for _, tableName := range tableNames { + writeMetrics[tableName] = &WriteMetrics{} + } + + if val, present := os.LookupEnv("GITHUB_ACTIONS"); present && val != "" { + // This is the place to fine tune the stress parameters if GitHub actions are too slow + maxConcurrency = maxConcurrency * 1 + singleConnectionSleepInterval = singleConnectionSleepInterval * 1 + } + t.Logf("==== test setup: maxConcurrency=%v, singleConnectionSleepInterval=%v", maxConcurrency, singleConnectionSleepInterval) +} + +type testCase struct { + onDeleteAction sqlparser.ReferenceAction + onUpdateAction sqlparser.ReferenceAction + workload bool + onlineDDLTable string +} + +// ExecuteFKTest runs a single test case, which can be: +// - With/out workload +// - Either one of ON DELETE actions +// - Either one of ON UPDATE actions +// - Potentially running an Online DDL on an indicated table (this will not work in Vanilla MySQL, see https://vitess.io/blog/2021-06-15-online-ddl-why-no-fk/) +func ExecuteFKTest(t *testing.T, tcase *testCase) { + workloadName := "static data" + if tcase.workload { + workloadName = "workload" + } + testName := fmt.Sprintf("%s/del=%s/upd=%s", workloadName, referenceActionMap[tcase.onDeleteAction], referenceActionMap[tcase.onUpdateAction]) + if 
tcase.onlineDDLTable != "" { + testName = fmt.Sprintf("%s/ddl=%s", testName, tcase.onlineDDLTable) + } + t.Run(testName, func(t *testing.T) { + ctx, cancel := context.WithCancel(context.Background()) + defer cancel() + + t.Run("create schema", func(t *testing.T) { + createInitialSchema(t, tcase) + }) + t.Run("init tables", func(t *testing.T) { + populateTables(t) + }) + if tcase.workload { + t.Run("workload", func(t *testing.T) { + var wg sync.WaitGroup + for _, workloadTable := range []string{parentTableName, childTableName, child2TableName, grandchildTableName} { + wg.Add(1) + go func(tbl string) { + defer wg.Done() + runMultipleConnections(ctx, t, tbl) + }(workloadTable) + } + timer := time.NewTimer(workloadDuration) + + if tcase.onlineDDLTable != "" { + t.Run("migrating", func(t *testing.T) { + // This cannot work with Vanilla MySQL. We put the code for testing, but we're not actually going to use it + // for now. The test cases all have empty tcase.onlineDDLTable + hint := "hint-alter" + uuid := testOnlineDDLStatement(t, fmt.Sprintf(alterHintStatement, tcase.onlineDDLTable, hint), onlineDDLStrategy, "vtgate", hint) + ok := onlineddl.CheckMigrationStatus(t, &vtParams, shards, uuid, schema.OnlineDDLStatusComplete) + require.True(t, ok) // or else don't attempt to cleanup artifacts + t.Run("cleanup artifacts", func(t *testing.T) { + rs := onlineddl.ReadMigrations(t, &vtParams, uuid) + require.NotNil(t, rs) + row := rs.Named().Row() + require.NotNil(t, row) + + artifacts := textutil.SplitDelimitedList(row.AsString("artifacts", "")) + for _, artifact := range artifacts { + t.Run(artifact, func(t *testing.T) { + err := clusterInstance.VtctlclientProcess.ApplySchema(keyspaceName, "drop table if exists "+artifact) + require.NoError(t, err) + }) + } + }) + }) + } + + <-timer.C + cancel() // will cause runMultipleConnections() to terminate + wg.Wait() + }) + } + t.Run("wait for replica", func(t *testing.T) { + waitForReplicaCatchup(t) + }) + t.Run("validate metrics", 
func(t *testing.T) { + validateMetrics(t, tcase) + }) + t.Run("validate replication health", func(t *testing.T) { + cluster.ValidateReplicationIsHealthy(t, replica) + }) + t.Run("validate fk", func(t *testing.T) { + testFKIntegrity(t, primary, tcase) + testFKIntegrity(t, replica, tcase) + }) + }) +} + +func TestStressFK(t *testing.T) { + defer cluster.PanicHandler(t) + + t.Run("validate replication health", func(t *testing.T) { + cluster.ValidateReplicationIsHealthy(t, replica) + }) + + runOnlineDDL := false + + // Without workload ; with workload + for _, workload := range []bool{false, true} { + // For any type of ON DELETE action + for _, actionDelete := range referenceActions { + // For any type of ON UPDATE action + for _, actionUpdate := range referenceActions { + tcase := &testCase{ + workload: workload, + onDeleteAction: actionDelete, + onUpdateAction: actionUpdate, + } + ExecuteFKTest(t, tcase) + } + } + } + + if runOnlineDDL { + // Running Online DDL on all test tables. We don't use all of the combinations + // presented above; we will run with workload, and suffice with same ON DELETE - ON UPDATE actions. + for _, action := range referenceActions { + for _, table := range tableNames { + tcase := &testCase{ + workload: true, + onDeleteAction: action, + onUpdateAction: action, + onlineDDLTable: table, + } + ExecuteFKTest(t, tcase) + } + } + } +} + +// createInitialSchema creates the tables from scratch, and drops the foreign key constraints on the replica. 
func createInitialSchema(t *testing.T, tcase *testCase) {
	ctx := context.Background()
	conn, err := mysql.Connect(ctx, &vtParams)
	require.Nil(t, err)
	defer conn.Close()

	// Drop in reverse dependency order so children go before parents.
	t.Run("dropping tables", func(t *testing.T) {
		for _, tableName := range reverseTableNames {
			err := clusterInstance.VtctlclientProcess.ApplySchema(keyspaceName, "drop table if exists "+tableName)
			require.NoError(t, err)
		}
	})
	t.Run("creating tables", func(t *testing.T) {
		// Create the stress tables
		var b strings.Builder
		for i, sql := range createStatements {
			if i == 0 {
				// parent table, no foreign keys
				b.WriteString(sql)
			} else {
				// Child tables: the CREATE statement is a format template that
				// takes the ON DELETE and ON UPDATE reference actions for this test case.
				b.WriteString(fmt.Sprintf(sql, referenceActionMap[tcase.onDeleteAction], referenceActionMap[tcase.onUpdateAction]))
			}
			b.WriteString(";")
		}
		err := clusterInstance.VtctlclientProcess.ApplySchema(keyspaceName, b.String())
		require.NoError(t, err)
	})
	t.Run("wait for replica", func(t *testing.T) {
		waitForReplicaCatchup(t)
	})
	t.Run("validating tables: vttablet", func(t *testing.T) {
		// Check if table is created. Checked on tablets.
		checkTable(t, parentTableName, "hint_col")
		checkTable(t, childTableName, "hint_col")
		checkTable(t, child2TableName, "hint_col")
		checkTable(t, grandchildTableName, "hint_col")
	})
	t.Run("validating tables: vtgate", func(t *testing.T) {
		// Wait for tables to appear on VTGate
		waitForTable(t, parentTableName, conn)
		waitForTable(t, childTableName, conn)
		waitForTable(t, child2TableName, conn)
		waitForTable(t, grandchildTableName, conn)
	})
	t.Run("waiting for vschema definition to apply", func(t *testing.T) {
		for _, tableName := range []string{parentTableName, childTableName, child2TableName, grandchildTableName} {
			err := utils.WaitForColumn(t, clusterInstance.VtgateProcess, keyspaceName, tableName, "id")
			require.NoError(t, err)
		}
	})

	t.Run("dropping foreign keys on replica", func(t *testing.T) {
		// The replica intentionally has no FK constraints: super_read_only is
		// temporarily lifted for each DROP, then restored.
		for _, statement := range dropConstraintsStatements {
			_ = queryTablet(t, replica, "set global super_read_only=0", "")
			_ = queryTablet(t, replica, statement, "")
			_ = queryTablet(t, replica, "set global super_read_only=1", "")
		}
	})
	t.Run("validate definitions", func(t *testing.T) {
		// Primary must still show CONSTRAINT clauses; replica must not.
		for _, tableName := range []string{childTableName, child2TableName, grandchildTableName} {
			t.Run(tableName, func(t *testing.T) {
				t.Run(tabletTestName(t, primary), func(t *testing.T) {
					stmt := getCreateTableStatement(t, primary, tableName)
					assert.Contains(t, stmt, "CONSTRAINT")
				})
				t.Run(tabletTestName(t, replica), func(t *testing.T) {
					stmt := getCreateTableStatement(t, replica, tableName)
					assert.NotContains(t, stmt, "CONSTRAINT")
				})
			})
		}
	})
}

// testOnlineDDLStatement runs an online DDL, ALTER statement.
// executeStrategy selects the submission path ("vtgate" uses VtgateExecDDL,
// anything else goes through vtctlclient ApplySchemaWithOutput).
// If the strategy is not direct, it waits for the migration to complete or fail.
// If expectHint is non-empty, the altered table is checked to contain that hint.
// Returns the migration UUID (may be empty for direct strategies).
func testOnlineDDLStatement(t *testing.T, alterStatement string, ddlStrategy string, executeStrategy string, expectHint string) (uuid string) {
	if executeStrategy == "vtgate" {
		row := onlineddl.VtgateExecDDL(t, &vtParams, ddlStrategy, alterStatement, "").Named().Row()
		if row != nil {
			uuid = row.AsString("uuid", "")
		}
	} else {
		var err error
		uuid, err = clusterInstance.VtctlclientProcess.ApplySchemaWithOutput(keyspaceName, alterStatement, cluster.VtctlClientParams{DDLStrategy: ddlStrategy})
		assert.NoError(t, err)
	}
	uuid = strings.TrimSpace(uuid)
	fmt.Println("# Generated UUID (for debug purposes):")
	fmt.Printf("<%s>\n", uuid)

	strategySetting, err := schema.ParseDDLStrategy(ddlStrategy)
	assert.NoError(t, err)

	if !strategySetting.Strategy.IsDirect() {
		t.Logf("===== waiting for migration %v to conclude", uuid)
		status := onlineddl.WaitForMigrationStatus(t, &vtParams, shards, uuid, migrationWaitTimeout, schema.OnlineDDLStatusComplete, schema.OnlineDDLStatusFailed)
		fmt.Printf("# Migration status (for debug purposes): <%s>\n", status)
	}

	if expectHint != "" {
		stmt, err := sqlparser.Parse(alterStatement)
		require.NoError(t, err)
		ddlStmt, ok := stmt.(sqlparser.DDLStatement)
		require.True(t, ok)
		tableName := ddlStmt.GetTable().Name.String()
		checkTable(t, tableName, expectHint)
	}

	if !strategySetting.Strategy.IsDirect() {
		// let's see what FK tables have been renamed to
		rs := onlineddl.ReadMigrations(t, &vtParams, uuid)
		require.NotNil(t, rs)
		row := rs.Named().Row()
		require.NotNil(t, row)

		artifacts := textutil.SplitDelimitedList(row.AsString("artifacts", ""))
		for _, artifact := range artifacts {
			checkTable(t, artifact, "")
		}
	}

	return uuid
}

// waitForTable waits until table is seen in VTGate.
// It retries a trivial SELECT once per second and fails the test if the
// table has not become queryable within 10 seconds.
func waitForTable(t *testing.T, tableName string, conn *mysql.Conn) {
	ctx, cancel := context.WithTimeout(context.Background(), time.Second*10)
	defer cancel()
	ticker := time.NewTicker(time.Second)
	defer ticker.Stop()

	query := fmt.Sprintf("select count(*) from %s", tableName)
	for {
		if _, err := conn.ExecuteFetch(query, 1, false); err == nil {
			return // good
		}
		select {
		case <-ticker.C:
		case <-ctx.Done():
			t.Fail()
			return
		}
	}
}

// checkTable checks that the given table exists on all tablets
+func checkTable(t *testing.T, showTableName string, expectHint string) { + for _, tablet := range shards[0].Vttablets { + checkTablesCount(t, tablet, showTableName, 1) + if expectHint != "" { + createStatement := getCreateTableStatement(t, tablet, showTableName) + assert.Contains(t, createStatement, expectHint) + } + } +} + +// checkTablesCount checks the number of tables in the given tablet +func checkTablesCount(t *testing.T, tablet *cluster.Vttablet, showTableName string, expectCount int) { + query := fmt.Sprintf(`show tables like '%s';`, showTableName) + ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second) + defer cancel() + rowcount := 0 + for { + queryResult, err := tablet.VttabletProcess.QueryTablet(query, keyspaceName, true) + require.Nil(t, err) + rowcount = len(queryResult.Rows) + if rowcount > 0 { + break + } + + select { + case <-time.After(time.Second): + case <-ctx.Done(): + break + } + } + assert.Equal(t, expectCount, rowcount) +} + +// getCreateTableStatement returns the CREATE TABLE statement for a given table +func getCreateTableStatement(t *testing.T, tablet *cluster.Vttablet, tableName string) (statement string) { + queryResult := queryTablet(t, tablet, fmt.Sprintf("show create table %s", tableName), "") + + require.Equal(t, len(queryResult.Rows), 1) + row := queryResult.Rows[0] + assert.Equal(t, len(row), 2) // table name, create statement + statement = row[1].ToString() + return statement +} + +func isFKError(err error) bool { + if err == nil { + return false + } + sqlErr, ok := err.(*sqlerror.SQLError) + if !ok { + return false + } + + // Let's try and account for all known errors: + switch sqlErr.Number() { + case sqlerror.ERDupEntry: // happens since we hammer the tables randomly + return false + case sqlerror.ERTooManyUserConnections: // can happen in Online DDL cut-over + return false + case sqlerror.ERUnknownError: // happens when query buffering times out + return false + case sqlerror.ERQueryInterrupted: // 
cancelled due to context expiration + return false + case sqlerror.ERLockDeadlock: + return false // bummer, but deadlocks can happen, it's a legit error. + case sqlerror.ERNoReferencedRow, + sqlerror.ERRowIsReferenced, + sqlerror.ERRowIsReferenced2, + sqlerror.ErNoReferencedRow2: + return true + case sqlerror.ERNotSupportedYet: + return true + } + // Unknown error + fmt.Printf("Unexpected error detected in isFKError: %v\n", err) + // Treat it as if it's a FK error + return true +} + +func generateInsert(t *testing.T, tableName string, conn *mysql.Conn) error { + id := rand.Int31n(int32(maxTableRows)) + parentId := rand.Int31n(int32(maxTableRows)) + query := fmt.Sprintf(insertRowStatement, tableName, id, parentId) + qr, err := conn.ExecuteFetch(query, 1000, true) + + func() { + writeMetrics[tableName].mu.Lock() + defer writeMetrics[tableName].mu.Unlock() + + writeMetrics[tableName].insertsAttempts++ + if err != nil { + writeMetrics[tableName].insertsFailures++ + if isFKError(err) { + writeMetrics[tableName].insertsFKErrors++ + writeMetrics[tableName].sampleInsertFKError = err + } + return + } + assert.Less(t, qr.RowsAffected, uint64(2)) + if qr.RowsAffected == 0 { + writeMetrics[tableName].insertsNoops++ + return + } + writeMetrics[tableName].inserts++ + }() + return err +} + +func generateUpdate(t *testing.T, tableName string, conn *mysql.Conn) error { + // Most of the UPDATEs we run are "normal" updates, but the minority will actually change the + // `id` column itself, which is the FOREIGN KEY parent column for some of the tables. 
+ id := rand.Int31n(int32(maxTableRows)) + query := fmt.Sprintf(updateRowStatement, tableName, id) + if tableName == parentTableName || tableName == childTableName { + if rand.Intn(4) == 0 { + updatedId := rand.Int31n(int32(maxTableRows)) + query = fmt.Sprintf(updateRowIdStatement, tableName, updatedId, id) + } + } + qr, err := conn.ExecuteFetch(query, 1000, true) + + func() { + writeMetrics[tableName].mu.Lock() + defer writeMetrics[tableName].mu.Unlock() + + writeMetrics[tableName].updatesAttempts++ + if err != nil { + writeMetrics[tableName].updatesFailures++ + if isFKError(err) { + writeMetrics[tableName].updatesFKErrors++ + writeMetrics[tableName].sampleUpdateFKError = err + } + return + } + assert.Less(t, qr.RowsAffected, uint64(2)) + if qr.RowsAffected == 0 { + writeMetrics[tableName].updatesNoops++ + return + } + writeMetrics[tableName].updates++ + }() + return err +} + +func generateDelete(t *testing.T, tableName string, conn *mysql.Conn) error { + id := rand.Int31n(int32(maxTableRows)) + query := fmt.Sprintf(deleteRowStatement, tableName, id) + qr, err := conn.ExecuteFetch(query, 1000, true) + + func() { + writeMetrics[tableName].mu.Lock() + defer writeMetrics[tableName].mu.Unlock() + + writeMetrics[tableName].deletesAttempts++ + if err != nil { + writeMetrics[tableName].deletesFailures++ + if isFKError(err) { + writeMetrics[tableName].deletesFKErrors++ + writeMetrics[tableName].sampleDeleteFKError = err + } + return + } + assert.Less(t, qr.RowsAffected, uint64(2)) + if qr.RowsAffected == 0 { + writeMetrics[tableName].deletesNoops++ + return + } + writeMetrics[tableName].deletes++ + }() + return err +} + +func runSingleConnection(ctx context.Context, t *testing.T, tableName string, done *int64) { + log.Infof("Running single connection on %s", tableName) + conn, err := mysql.Connect(ctx, &vtParams) + require.Nil(t, err) + defer conn.Close() + + _, err = conn.ExecuteFetch("set autocommit=1", 1000, true) + require.Nil(t, err) + _, err = conn.ExecuteFetch("set 
transaction isolation level read committed", 1000, true) + require.Nil(t, err) + + for { + if atomic.LoadInt64(done) == 1 { + log.Infof("Terminating single connection") + return + } + switch rand.Int31n(3) { + case 0: + _ = generateInsert(t, tableName, conn) + case 1: + _ = generateUpdate(t, tableName, conn) + case 2: + _ = generateDelete(t, tableName, conn) + } + time.Sleep(singleConnectionSleepInterval) + } +} + +func runMultipleConnections(ctx context.Context, t *testing.T, tableName string) { + log.Infof("Running multiple connections") + var done int64 + var wg sync.WaitGroup + for i := 0; i < maxConcurrency; i++ { + wg.Add(1) + go func() { + defer wg.Done() + runSingleConnection(ctx, t, tableName, &done) + }() + } + <-ctx.Done() + atomic.StoreInt64(&done, 1) + log.Infof("Running multiple connections: done") + wg.Wait() + log.Infof("All connections cancelled") +} + +func wrapWithNoFKChecks(sql string) string { + return fmt.Sprintf("set foreign_key_checks=0; %s; set foreign_key_checks=1;", sql) +} + +// populateTables randomly populates all test tables. This is done sequentially. +func populateTables(t *testing.T) { + log.Infof("initTable begin") + defer log.Infof("initTable complete") + + ctx := context.Background() + conn, err := mysql.Connect(ctx, &vtParams) + require.Nil(t, err) + defer conn.Close() + + t.Logf("===== clearing tables") + for _, tableName := range reverseTableNames { + writeMetrics[tableName].Clear() + deleteQuery := fmt.Sprintf(deleteAllStatement, tableName) + _, err = conn.ExecuteFetch(deleteQuery, 1000, true) + require.Nil(t, err) + } + // In an ideal world we would randomly re-seed the tables in each and every instance of the test. + // In reality, that takes a lot of time, and while the seeding is important, it's not the heart of + // the test. To that effect, the seeding works as follows: + // - First ever time, we randomly seed the tables (running thousands of queries). 
We then create *_seed + // tables and clone the data in those seed tables. + // - 2nd test and forward: we just copy over the rows from the *_seed tables. + tablesSeeded := false + seedOnce.Do(func() { + for _, tableName := range tableNames { + t.Run(tableName, func(t *testing.T) { + t.Run("populating", func(t *testing.T) { + // populate parent, then child, child2, then grandchild + for i := 0; i < maxTableRows/2; i++ { + generateInsert(t, tableName, conn) + } + for i := 0; i < maxTableRows/4; i++ { + generateUpdate(t, tableName, conn) + } + for i := 0; i < maxTableRows/4; i++ { + generateDelete(t, tableName, conn) + } + }) + t.Run("creating seed", func(t *testing.T) { + // We create the seed table in the likeness of stress_parent, because that's the only table + // that doesn't have FK constraints. + { + createSeedQuery := fmt.Sprintf("create table %s_seed like %s", tableName, parentTableName) + _, err := conn.ExecuteFetch(createSeedQuery, 1000, true) + require.NoError(t, err) + } + { + seedQuery := fmt.Sprintf("insert into %s_seed select * from %s", tableName, tableName) + _, err := conn.ExecuteFetch(seedQuery, 1000, true) + require.NoError(t, err) + } + { + validationQuery := fmt.Sprintf("select count(*) as c from %s_seed", tableName) + rs, err := conn.ExecuteFetch(validationQuery, 1000, true) + require.NoError(t, err) + row := rs.Named().Row() + require.NotNil(t, row) + require.NotZero(t, row.AsInt64("c", 0)) + } + }) + }) + } + tablesSeeded = true + }) + if !tablesSeeded { + t.Run("reseeding", func(t *testing.T) { + for _, tableName := range tableNames { + seedQuery := fmt.Sprintf("insert into %s select * from %s_seed", tableName, tableName) + _, err := conn.ExecuteFetch(seedQuery, 1000, true) + require.NoError(t, err) + } + }) + } + + t.Run("validating table rows", func(t *testing.T) { + for _, tableName := range tableNames { + validationQuery := fmt.Sprintf(selectCountRowsStatement, tableName) + rs, err := conn.ExecuteFetch(validationQuery, 1000, true) + 
require.NoError(t, err) + row := rs.Named().Row() + require.NotNil(t, row) + numRows := row.AsInt64("num_rows", 0) + sumUpdates := row.AsInt64("sum_updates", 0) + require.NotZero(t, numRows) + if !tablesSeeded { + // We cloned the data from *_seed tables. This means we didn't populate writeMetrics. Now, + // this function only takes care of the base seed. We will later on run a stress workload on + // these tables, at the end of which we will examine the writeMetrics. We thus have to have those + // metrics consistent with the cloned data. It's a bit ugly, but we inject fake writeMetrics. + writeMetrics[tableName].deletes = 1 + writeMetrics[tableName].inserts = numRows + writeMetrics[tableName].deletes + writeMetrics[tableName].updates = sumUpdates + writeMetrics[tableName].deletes + } + } + }) +} + +// testSelectTableMetrics cross references the known metrics (number of successful insert/delete/updates) on each table, with the +// actual number of rows and with the row values on those tables. +// With CASCADE/SET NULL rules we can't do the comparison, because child tables are implicitly affected by the cascading rules, +// and the values do not match what reported to us when we UPDATE/DELETE on the parent tables. +func testSelectTableMetrics( + t *testing.T, + tablet *cluster.Vttablet, + tableName string, + tcase *testCase, +) int64 { + switch tcase.onDeleteAction { + case sqlparser.Cascade, sqlparser.SetNull: + if tableName != parentTableName { + // We can't validate those tables because they will have been affected by cascading rules. + return 0 + } + } + // metrics are unaffected by value of onUpdateAction. 
+ + writeMetrics[tableName].mu.Lock() + defer writeMetrics[tableName].mu.Unlock() + + log.Infof("%s %s", tableName, writeMetrics[tableName].String()) + + rs := queryTablet(t, tablet, fmt.Sprintf(selectCountRowsStatement, tableName), "") + + row := rs.Named().Row() + require.NotNil(t, row) + log.Infof("testSelectTableMetrics, row: %v", row) + numRows := row.AsInt64("num_rows", 0) + sumUpdates := row.AsInt64("sum_updates", 0) + assert.NotZero(t, numRows) + assert.NotZero(t, sumUpdates) + assert.NotZero(t, writeMetrics[tableName].inserts) + assert.NotZero(t, writeMetrics[tableName].deletes) + assert.NotZero(t, writeMetrics[tableName].updates) + assert.Equal(t, writeMetrics[tableName].inserts-writeMetrics[tableName].deletes, numRows) + assert.Equal(t, writeMetrics[tableName].updates-writeMetrics[tableName].deletes, sumUpdates) // because we DELETE WHERE updates=1 + + return numRows +} + +// testSelectTableFKErrors +func testSelectTableFKErrors( + t *testing.T, + tableName string, + tcase *testCase, +) { + writeMetrics[tableName].mu.Lock() + defer writeMetrics[tableName].mu.Unlock() + + if tcase.onDeleteAction == sqlparser.Cascade { + assert.Zerof(t, writeMetrics[tableName].deletesFKErrors, "unexpected foreign key errors for DELETEs in ON DELETE CASCADE. Sample error: %v", writeMetrics[tableName].sampleDeleteFKError) + } + if tcase.onUpdateAction == sqlparser.Cascade { + assert.Zerof(t, writeMetrics[tableName].updatesFKErrors, "unexpected foreign key errors for UPDATEs in ON UPDATE CASCADE. Sample error: %v", writeMetrics[tableName].sampleUpdateFKError) + } +} + +// testFKIntegrity validates that foreign key consitency is maintained on the given tablet. We cross reference all +// parent-child relationships. +// There are two test types: +// 1. Do a JOIN on parent-child associated rows, expect non-empty +// 2. Check that there are no orphaned child rows. 
Notes: +// - This applies to NO ACTION and CASCADE, but not to SET NULL, because SET NULL by design creates orphaned rows. +// - On the primary database, this test trivially passes because of course MySQL maintains this integrity. But remember +// that we remove the foreign key constraints on the replica. Also remember that cascaded writes are not written to +// the binary log. And so, if VTGate does not do a proper job, then a parent and child will drift apart in CASCADE writes. +func testFKIntegrity( + t *testing.T, + tablet *cluster.Vttablet, + tcase *testCase, +) { + testName := tabletTestName(t, tablet) + t.Run(testName, func(t *testing.T) { + t.Run("matching parent-child rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectMatchingRowsChild, "") + assert.NotZero(t, len(rs.Rows)) + }) + t.Run("matching parent-child2 rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectMatchingRowsChild2, "") + assert.NotZero(t, len(rs.Rows)) + }) + t.Run("matching child-grandchild rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectMatchingRowsGrandchild, "") + assert.NotZero(t, len(rs.Rows)) + }) + if tcase.onDeleteAction != sqlparser.SetNull && tcase.onUpdateAction != sqlparser.SetNull { + // Because with SET NULL there _are_ orphaned rows + t.Run("parent-child orphaned rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectOrphanedRowsChild, "") + assert.Zero(t, len(rs.Rows)) + }) + t.Run("parent-child2 orphaned rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectOrphanedRowsChild2, "") + assert.Zero(t, len(rs.Rows)) + }) + t.Run("child-grandchild orphaned rows", func(t *testing.T) { + rs := queryTablet(t, tablet, selectOrphanedRowsGrandchild, "") + assert.Zero(t, len(rs.Rows)) + }) + } + }) +} diff --git a/test/ci_workflow_gen.go b/test/ci_workflow_gen.go index 43e874ec182..5a3031d7307 100644 --- a/test/ci_workflow_gen.go +++ b/test/ci_workflow_gen.go @@ -111,6 +111,7 @@ var ( "vtgate_vschema", "vtgate_queries", 
"vtgate_schema_tracker", + "vtgate_foreignkey_stress", "vtorc", "xb_recovery", "mysql80", diff --git a/test/config.json b/test/config.json index c28de9bb385..cab160288df 100644 --- a/test/config.json +++ b/test/config.json @@ -851,6 +851,15 @@ "RetryMax": 2, "Tags": [] }, + "vtgate_foreignkey_stress": { + "File": "unused.go", + "Args": ["vitess.io/vitess/go/test/endtoend/vtgate/foreignkey/stress"], + "Command": [], + "Manual": false, + "Shard": "vtgate_foreignkey_stress", + "RetryMax": 1, + "Tags": [] + }, "vtgate_gen4": { "File": "unused.go", "Args": ["vitess.io/vitess/go/test/endtoend/vtgate/gen4"],