diff --git a/scripts/run.sh b/scripts/run.sh index bf38028..e2f225a 100755 --- a/scripts/run.sh +++ b/scripts/run.sh @@ -15,7 +15,10 @@ # POD_IP_TYPE = Address type of POD_IP (one of IPV4, IPv6) # PRIMARY_TYPE = defines single/multi primary + + env | sort | grep "POD\|HOST\|NAME" +echo "running">/scripts/setup.txt RECOVERY_DONE_FILE="/tmp/recovery.done" if [[ "$PITR_RESTORE" == "true" ]]; then while true; do @@ -138,6 +141,7 @@ log_bin = binlog loose-group_replication_bootstrap_group = OFF loose-group_replication_start_on_boot = OFF loose_group_replication_unreachable_majority_timeout = 20 +loose_group_replication_exit_state_action = OFFLINE_MODE # default tls configuration for the group # group_replication_recovery_use_ssl will be overwritten from DB arguments @@ -179,23 +183,32 @@ fi # wait for mysql daemon be running (alive) function wait_for_mysqld_running() { local mysql="$mysql_header --host=$localhost" + local max_restarts=60 + local restarts=0 + + while true; do + if ! kill -0 "$pid" 2>/dev/null; then + if (( restarts >= max_restarts )); then + log "ERROR" "mysqld (pid=$pid) died and exceeded $max_restarts restart attempts. Aborting." + exit 1 + fi + restarts=$((restarts + 1)) + log "ERROR" "mysqld (pid=$pid) is no longer running. Restart attempt $restarts/$max_restarts..." + start_mysqld_in_background + sleep 10 + continue + fi - for i in {900..0}; do out=$(${mysql} -N -e "select 1;" 2>/dev/null) - log "INFO" "Attempt $i: Pinging '$report_host' has returned: '$out'...................................." if [[ "$out" == "1" ]]; then + log "INFO" "mysqld is ready (pid=$pid, restarts=$restarts)" break fi - + log "INFO" "Pinging '$report_host' has returned: '$out' (pid=$pid alive, restarts=$restarts)" echo -n . sleep 1 done - if [[ "$i" == "0" ]]; then - echo "" - log "ERROR" "Server ${report_host} failed to start in 900 seconds............." - exit 1 - fi log "INFO" "mysql daemon is ready to use......." 
# Set read-only immediately after MySQL starts to prevent any external @@ -594,6 +607,8 @@ install_group_replication_plugin install_clone_plugin while true; do + log "INFO" "creating setup.txt file" + echo "running">/scripts/setup.txt kill -0 $pid exit="$?" if [[ "$exit" == "0" ]]; then @@ -629,6 +644,9 @@ while true; do join_by_clone fi joining_for_first_time=0 + + log "INFO" "removing setup.txt file" + rm -rf /scripts/setup.txt log "INFO" "waiting for mysql process id = $pid" wait $pid done diff --git a/scripts/run_innodb.sh b/scripts/run_innodb.sh index 1de07bf..f8dac6f 100755 --- a/scripts/run_innodb.sh +++ b/scripts/run_innodb.sh @@ -1,5 +1,33 @@ #!/usr/bin/env bash #set -x +# run_innodb.sh — MySQL InnoDB Cluster init script +# +# Compatibility: MySQL 8.4.x with appscode images (ghcr.io/appscode-images/mysql) +# +# Key differences from MySQL 8.0 (mysql-server Oracle image): +# 1. Entrypoint is at /usr/local/bin/docker-entrypoint.sh (not /entrypoint.sh) +# 2. docker-entrypoint.sh already creates root@% (CREATE USER fails without IF NOT EXISTS) +# 3. mysqlsh 8.4 defaults to SQL mode (need --js for JavaScript API calls) +# 4. dba.configureInstance() removed 'password' and 'interactive' options +# 5. REQUIRE SSL is strictly enforced on socket connections (repl can't connect locally) + +env | sort | grep "POD\|HOST\|NAME" +echo "running">/scripts/setup.txt +RECOVERY_DONE_FILE="/tmp/recovery.done" +if [[ "$PITR_RESTORE" == "true" ]]; then + while true; do + sleep 2 + echo "Point In Time Recovery In Progress. Waiting for $RECOVERY_DONE_FILE file" + if [[ -e "$RECOVERY_DONE_FILE" ]]; then + echo "$RECOVERY_DONE_FILE found." 
+ break + fi + done +fi + +if [[ -e "$RECOVERY_DONE_FILE" ]]; then + rm $RECOVERY_DONE_FILE +fi function timestamp() { date +"%Y/%m/%d %T" @@ -11,10 +39,10 @@ function log() { echo "$(timestamp) [$script_name] [$type] $msg" } -#stores all the arguments that are passed from statefulSet args=$@ -report_host="$HOSTNAME.$GOV_SVC.$POD_NAMESPACE.svc" +report_host="$HOSTNAME.$GOV_SVC.$POD_NAMESPACE" log "INFO" "report_host = $report_host" + # wait for the peer-list file created by coordinator while [ ! -f "/scripts/peer-list" ]; do log "WARNING" "peer-list is not created yet" @@ -26,24 +54,40 @@ IFS=', ' read -r -a peers <<<"$hosts" echo "${peers[@]}" log "INFO" "hosts are ${peers[@]}" -whitelist="$MYSQL_GROUP_REPLICATION_IP_WHITELIST" -if [ -z "$whitelist" ]; then - if [[ "$POD_IP_TYPE" == "IPv6" ]]; then - whitelist="$POD_IP"/64 - else - whitelist="$POD_IP"/16 - fi +# Create a writable dir for mysqlsh's configureInstance() output. +# Copy user's custom config (read-only Secret mount in conf.d/) into this writable dir. +# Only include the writable dir in my.cnf — mysqlsh will write its config here too. +INNODB_CONF_DIR="/etc/mysql/innodb-conf.d" +mkdir -p "$INNODB_CONF_DIR" +# Copy custom config files from read-only conf.d/ to writable dir +if [ -d /etc/mysql/conf.d ] && ls /etc/mysql/conf.d/*.cnf >/dev/null 2>&1; then + cp /etc/mysql/conf.d/*.cnf "$INNODB_CONF_DIR/" 2>/dev/null + log "INFO" "Copied custom config from conf.d/ to writable $INNODB_CONF_DIR/" fi -mkdir -p /etc/mysql/conf.d/ cat >>/etc/mysql/my.cnf <>/etc/mysql/my.cnf </dev/null; then + if (( restarts >= max_restarts )); then + log "ERROR" "mysqld (pid=$pid) died and exceeded $max_restarts restart attempts. Aborting." + exit 1 + fi + restarts=$((restarts + 1)) + log "ERROR" "mysqld (pid=$pid) is no longer running. Restart attempt $restarts/$max_restarts..." 
+ start_mysqld_in_background + sleep 10 + continue + fi + out=$(mysql -u$1 -h$2 -p$3 --port=3306 -e "select 1;" | head -n1 | awk '{print$1}') + log "INFO" "Pinging '$report_host' has returned: '$out'...................................." + if [[ "$out" == "1" ]]; then + break + fi + log "INFO" "Pinging '$report_host' has returned: '$out' (pid=$pid alive, restarts=$restarts)" + echo -n . + sleep 1 + done - local mysqlshell="mysql -u$1 -h$2 -p$3" # "mysql -uroot -ppass -hmysql-server-0.mysql-server.default.svc" - retry 900 ${mysqlshell} -e "select 1;" | awk '{print$1}' - out=$(${mysqlshell} -e "select 1;" | head -n1 | awk '{print$1}') - if [[ "$out" == "1" ]]; then - log "INFO" "host $2 is online" - else - log "INFO" "server failed to comes online within 900 seconds" - fi + log "INFO" "mysql daemon is ready to use......." + # Set read-only immediately after MySQL starts to prevent any external + # process (e.g. KubeDB health checker) from writing local GTIDs before + # the node joins the cluster. Cannot be set in my.cnf because it blocks --initialize. + # (match run.sh) + local mysql_ro="mysql -u${MYSQL_ROOT_USERNAME} -hlocalhost -p${MYSQL_ROOT_PASSWORD} --port=3306" + ${mysql_ro} -N -e "SET GLOBAL read_only=ON; SET GLOBAL super_read_only=ON;" 2>/dev/null + log "INFO" "Set super_read_only=ON to prevent errant GTIDs" +} + +# mysql client shorthand — always use root for local operations +mysql_local="mysql -u${MYSQL_ROOT_USERNAME} -hlocalhost -p${MYSQL_ROOT_PASSWORD} --port=3306" +# mysqlsh shorthand — root for local, --js for JavaScript API +mysqlsh_local="mysqlsh --js -u${MYSQL_ROOT_USERNAME} -p${MYSQL_ROOT_PASSWORD}" +replication_user=repl + +# Kill any stale mysqlsh AdminAPI session holding the cluster-wide EXCLUSIVE lock +# on $1 (usually the primary). A session holding AdminAPI_lock while in Sleep +# state means a previous mysqlsh call died without releasing — rescan/addInstance/ +# rejoinInstance will hang with MYSQLSH 51500.
Legitimate in-flight AdminAPI ops +# are always in Query state, never Sleep. Kill Sleep>5s holders to auto-recover. +function clear_stale_cluster_lock() { + local target_host=$1 + local mysql_root="mysql -u${MYSQL_ROOT_USERNAME} -h${target_host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N" + local stuck_ids + stuck_ids=$(${mysql_root} -e " + SELECT t.PROCESSLIST_ID + FROM performance_schema.metadata_locks m + JOIN performance_schema.threads t ON m.OWNER_THREAD_ID = t.THREAD_ID + WHERE m.OBJECT_SCHEMA='AdminAPI_cluster' + AND m.OBJECT_NAME='AdminAPI_lock' + AND m.LOCK_TYPE='EXCLUSIVE' + AND t.PROCESSLIST_COMMAND='Sleep' + AND t.PROCESSLIST_TIME > 5;" 2>/dev/null | awk 'NF') + if [[ -n "$stuck_ids" ]]; then + for stuck_id in $stuck_ids; do + log "WARNING" "Killing stale AdminAPI_lock holder on ${target_host} (conn=${stuck_id}, Sleep>5s)" + ${mysql_root} -e "KILL ${stuck_id};" 2>/dev/null + done + sleep 2 + fi } function create_replication_user() { - # MySql server's need a replication user to communicate with each other - # 01. official doc (section from 17.2.1.3 to 17.2.1.5): https://dev.mysql.com/doc/refman/5.7/en/group-replication-user-credentials.html - # 02. https://dev.mysql.com/doc/refman/8.0/en/group-replication-secure-user.html - # 03. repl user permissions: https://www.sqlshack.com/deploy-mysql-innodb-clusters-for-high-availability/ - # 04. digitalocean doc: https://www.digitalocean.com/community/tutorials/how-to-configure-mysql-group-replication-on-ubuntu-16-04 log "INFO" "Checking whether replication user exist or not..." - local mysql="mysql -u ${MYSQL_ROOT_USERNAME} -hlocalhost -p${MYSQL_ROOT_PASSWORD} --port=3306" - # At first, ensure that the command executes without any error. Then, run the command again and extract the output. 
- retry 120 ${mysql} -N -e "select count(host) from mysql.user where mysql.user.user='repl';" - out=$(${mysql} -N -e "select count(host) from mysql.user where mysql.user.user='repl';" | awk '{print$1}') - # if the user doesn't exist, crete new one. + retry 60 ${mysql_local} -N -e "select count(host) from mysql.user where mysql.user.user='${replication_user}';" + out=$(${mysql_local} -N -e "select count(host) from mysql.user where mysql.user.user='${replication_user}';" | awk '{print$1}') + + # All operations in a SINGLE session with SQL_LOG_BIN=0 to prevent errant GTIDs. + # Uses IF NOT EXISTS because appscode images already create root@% via entrypoint. + # (match run.sh single-session pattern) if [[ "$out" -eq "0" ]]; then log "INFO" "Replication user not found. Creating new replication user..." - retry 120 ${mysql} -N -e "SET SQL_LOG_BIN=0;" - retry 120 ${mysql} -N -e "CREATE USER 'repl'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}' REQUIRE SSL;" - retry 120 ${mysql} -N -e "GRANT CREATE USER, FILE, PROCESS, RELOAD, REPLICATION CLIENT, REPLICATION SLAVE, SELECT, SHUTDOWN, SUPER ON *.* TO 'repl'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "GRANT DELETE, INSERT, UPDATE ON mysql.* TO 'repl'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata.* TO 'repl'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata_bkp.* TO 'repl'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, 
SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata_previous.* TO 'repl'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "GRANT CLONE_ADMIN, BACKUP_ADMIN, CONNECTION_ADMIN, EXECUTE, GROUP_REPLICATION_ADMIN, PERSIST_RO_VARIABLES_ADMIN, REPLICATION_APPLIER, REPLICATION_SLAVE_ADMIN, ROLE_ADMIN, SYSTEM_VARIABLES_ADMIN ON *.* TO 'repl'@'%' WITH GRANT OPTION;" - #mysql-server docker image doesn't has the user root that can connect from any host - retry 120 ${mysql} -N -e "CREATE USER 'root'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}';" - retry 120 ${mysql} -N -e "GRANT ALL ON *.* TO 'root'@'%' WITH GRANT OPTION;" - retry 120 ${mysql} -N -e "FLUSH PRIVILEGES;" - retry 120 ${mysql} -N -e "SET SQL_LOG_BIN=1;" + retry 60 ${mysql_local} -N -e " + SET SQL_LOG_BIN=0; + SET GLOBAL super_read_only=OFF; + SET GLOBAL read_only=OFF; + CREATE USER IF NOT EXISTS '${replication_user}'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}' REQUIRE SSL; + GRANT CREATE USER, FILE, PROCESS, RELOAD, REPLICATION CLIENT, REPLICATION SLAVE, SELECT, SHUTDOWN, SUPER ON *.* TO '${replication_user}'@'%' WITH GRANT OPTION; + GRANT DELETE, INSERT, UPDATE ON mysql.* TO '${replication_user}'@'%' WITH GRANT OPTION; + GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata.* TO '${replication_user}'@'%' WITH GRANT OPTION; + GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata_bkp.* TO '${replication_user}'@'%' WITH GRANT OPTION; + GRANT ALTER, ALTER ROUTINE, CREATE, CREATE ROUTINE, CREATE TEMPORARY TABLES, CREATE VIEW, DELETE, DROP, EVENT, EXECUTE, INDEX, INSERT, LOCK TABLES, REFERENCES, SHOW VIEW, TRIGGER, UPDATE ON mysql_innodb_cluster_metadata_previous.* TO 
'${replication_user}'@'%' WITH GRANT OPTION; + GRANT CLONE_ADMIN, BACKUP_ADMIN, CONNECTION_ADMIN, EXECUTE, GROUP_REPLICATION_ADMIN, PERSIST_RO_VARIABLES_ADMIN, REPLICATION_APPLIER, REPLICATION_SLAVE_ADMIN, ROLE_ADMIN, SYSTEM_VARIABLES_ADMIN ON *.* TO '${replication_user}'@'%' WITH GRANT OPTION; + CREATE USER IF NOT EXISTS 'root'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}'; + GRANT ALL ON *.* TO 'root'@'%' WITH GRANT OPTION; + FLUSH PRIVILEGES; + SET GLOBAL read_only=ON; + SET GLOBAL super_read_only=ON; + SET SQL_LOG_BIN=1; + " + else + log "INFO" "Replication user exists. Updating password if changed..." + # Update password in case it was rotated via RotateAuth (match run.sh) + retry 60 ${mysql_local} -N -e " + SET SQL_LOG_BIN=0; + SET GLOBAL super_read_only=OFF; + SET GLOBAL read_only=OFF; + ALTER USER '${replication_user}'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}'; + ALTER USER IF EXISTS 'root'@'%' IDENTIFIED BY '${MYSQL_ROOT_PASSWORD}'; + FLUSH PRIVILEGES; + SET GLOBAL read_only=ON; + SET GLOBAL super_read_only=ON; + SET SQL_LOG_BIN=1; + " fi - # retry 120 ${mysql} -N -e "CHANGE MASTER TO MASTER_USER='repl', MASTER_PASSWORD='$MYSQL_ROOT_PASSWORD' FOR CHANNEL 'group_replication_recovery';" touch /scripts/ready.txt } @@ -115,45 +235,120 @@ already_configured=0 function configure_instance() { log "INFO" "configuring instance $report_host." - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD}" - retry 120 ${mysqlshell} --sql -e "select @@gtid_mode;" - gtid=($($mysqlshell --sql -e "select @@gtid_mode;")) + # Check if already configured (gtid_mode=ON means it was configured before) + retry 60 ${mysqlsh_local} --sql -e "select @@gtid_mode;" + gtid=($(${mysqlsh_local} --sql -e "select @@gtid_mode;")) if [[ "${gtid[1]}" == "ON" ]]; then log "INFO" "$report_host is already_configured." 
already_configured=1 return fi - retry 30 ${mysqlshell} -e "dba.configureInstance('${replication_user}@${report_host}',{password:'${MYSQL_ROOT_PASSWORD}',interactive:false,restart:true});" - #instance need to restart after configuration - # Prevent creation of new process until this one is finished - #https://serverfault.com/questions/477448/mysql-keeps-crashing-innodb-unable-to-lock-ibdata1-error-11 - #The most common cause of this problem is trying to start MySQL when it is already running. + # In MySQL Shell 8.4: + # - Pass credentials via URI (not via 'password' option — removed) + # - mycnfPath required so Shell writes config instead of prompting + # - restart:false — we handle restart ourselves (container environment) + # - Pipe 'yes' to auto-confirm any remaining prompts + yes | ${mysqlsh_local} -e "dba.configureInstance('${MYSQL_ROOT_USERNAME}:${MYSQL_ROOT_PASSWORD}@${report_host}:3306',{mycnfPath:'/etc/mysql/my.cnf',restart:false});" + + # Manually restart mysqld after configuration (match run.sh pattern: + # restart:false + manual shutdown, because mysqlsh can't restart a process it didn't start) + log "INFO" "Shutting down mysqld for restart after configure..." + mysqladmin -u${MYSQL_ROOT_USERNAME} -hlocalhost -p${MYSQL_ROOT_PASSWORD} --port=3306 shutdown wait $pid restart_required=1 } function create_cluster() { - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${report_host}" + local mysqlsh_remote="mysqlsh --js -u${MYSQL_ROOT_USERNAME} -p${MYSQL_ROOT_PASSWORD} -h${report_host}" clusterName=$(echo -n $BASE_NAME | sed 's/-/_/g') - retry 5 $mysqlshell -e "cluster=dba.createCluster('$clusterName',{consistency:'BEFORE_ON_PRIMARY_FAILOVER',manualStartOnBoot:'true'});" + # Temporarily disable read-only for cluster bootstrap (match run.sh) + ${mysql_local} -N -e "SET GLOBAL super_read_only=OFF; SET GLOBAL read_only=OFF;" 2>/dev/null + # communicationStack:'MYSQL' — uses MySQL protocol on port 3306 instead of XCom on 33061. 
+ # consistency defaults to BEFORE_ON_PRIMARY_FAILOVER on 8.4+. + if [[ "$PRIMARY_TYPE" == "Multi-Primary" ]]; then + log "INFO" "Creating InnoDB Cluster in Multi-Primary mode" + retry 5 $mysqlsh_remote -e "cluster=dba.createCluster('$clusterName',{communicationStack:'MYSQL',manualStartOnBoot:true,multiPrimary:true,force:true});" + else + retry 5 $mysqlsh_remote -e "cluster=dba.createCluster('$clusterName',{communicationStack:'MYSQL',manualStartOnBoot:true});" + fi +} + +function fix_metadata_uuids() { + # After a pod restart with data loss (PVC deleted), or after a logical + # restore from a different cluster's backup, MySQL initialises a fresh + # data directory and generates a new server_uuid. The InnoDB Cluster + # metadata still has the old server_uuid for that address, so AdminAPI + # calls (dba.getCluster, cluster.rejoinInstance, + # dba.rebootClusterFromCompleteOutage) fail with errors like + # "Metadata for instance not found" or "unmanaged replication group". + # + # Strategy: find any peer whose stored UUID matches its actual server_uuid + # — that peer can serve as a working entry point for dba.getCluster(). For + # any peer with a stale entry, removeInstance(force:true) followed by + # addInstance(recoveryMethod:'clone') so the rejoining node ends up + # consistent with the live cluster. The current host is left out of the + # re-add loop because join_in_cluster will handle it once metadata is + # consistent. + log "INFO" "Checking for stale server_uuid in InnoDB Cluster metadata..." 
+ + local good_host="" + for host in "${peers[@]}"; do + actual_uuid=$(mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e "SELECT @@server_uuid;" 2>/dev/null) + if [[ -z "$actual_uuid" ]]; then + continue + fi + stored_uuid=$(mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e \ + "SELECT mysql_server_uuid FROM mysql_innodb_cluster_metadata.instances WHERE address='${host}:3306';" 2>/dev/null) + if [[ -n "$stored_uuid" && "$stored_uuid" == "$actual_uuid" ]]; then + good_host="$host" + break + fi + done + + if [[ -z "$good_host" ]]; then + log "WARNING" "No peer with matching UUID found in metadata. Cannot fix metadata — may need full cluster reboot." + return + fi + + for host in "${peers[@]}"; do + actual_uuid=$(mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e "SELECT @@server_uuid;" 2>/dev/null) + if [[ -z "$actual_uuid" ]]; then + continue + fi + stored_uuid=$(mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e \ + "SELECT mysql_server_uuid FROM mysql_innodb_cluster_metadata.instances WHERE address='${host}:3306';" 2>/dev/null) + + if [[ -n "$stored_uuid" && "$stored_uuid" != "$actual_uuid" ]]; then + log "INFO" "UUID mismatch for $host: metadata=$stored_uuid actual=$actual_uuid" + log "INFO" "Removing stale instance from cluster and re-adding with fresh data..." + local mysqlsh_good="mysqlsh --js -u${MYSQL_ROOT_USERNAME} -p${MYSQL_ROOT_PASSWORD} -h${good_host}" + clear_stale_cluster_lock "${good_host}" + ${mysqlsh_good} -e "cluster = dba.getCluster(); cluster.removeInstance('${host}:3306',{force:true});" 2>/dev/null + if [[ "$host" != "$report_host" ]]; then + # Only re-add remote peers here; the current host will be + # added by join_in_cluster after metadata is consistent. 
+ clear_stale_cluster_lock "${good_host}" + ${mysqlsh_good} -e "cluster = dba.getCluster(); cluster.addInstance('${replication_user}:${MYSQL_ROOT_PASSWORD}@${host}:3306',{recoveryMethod:'clone'});" 2>/dev/null + fi + fi + done } export primary="" function select_primary() { for i in {900..0}; do for host in "${peers[@]}"; do - local mysqlshell="mysqlsh -u${replication_user} -h${host} -p${MYSQL_ROOT_PASSWORD}" - #result of the query output "member_host host_name" in this format - # $mysqlshell --sql -e "SELECT member_host FROM performance_schema.replication_group_members where member_role = 'PRIMARY' ;" - selected_primary=($($mysqlshell --sql -e "SELECT member_host FROM performance_schema.replication_group_members where member_role = 'PRIMARY' ;")) - if [[ "${#selected_primary[@]}" -ge "1" ]]; then + local mysqlsh_peer="mysqlsh --js -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD}" + selected_primary=($(${mysqlsh_peer} --sql -e "SELECT member_host FROM performance_schema.replication_group_members where member_role = 'PRIMARY' ;" 2>/dev/null)) + if [[ "${#selected_primary[@]}" -ge "2" ]]; then primary=${selected_primary[1]} log "INFO" "Primary found $primary." return fi done + sleep 1 done log "INFO" "Primary not found." } @@ -161,9 +356,13 @@ function select_primary() { already_in_cluster=0 function is_already_in_cluster() { - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" - ${mysqlshell} -e "cluster = dba.getCluster(); cluster.rescan({addInstances:['${report_host}:3306'],interactive:false})" - out=($(${mysqlshell} --sql -e "SELECT member_host FROM performance_schema.replication_group_members where member_state='ONLINE';")) + local mysqlsh_primary="mysqlsh --js -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" + # Refresh stale server_uuid entries in metadata before dba.getCluster() + # so it doesn't reject the call with "Metadata for instance not found". 
+ fix_metadata_uuids + clear_stale_cluster_lock "${primary}" + ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.rescan()" + out=($(${mysqlsh_primary} --sql -e "SELECT member_host FROM performance_schema.replication_group_members where member_state='ONLINE';")) for host in ${out[@]}; do if [[ "$host" == "$report_host" ]]; then @@ -175,48 +374,60 @@ function is_already_in_cluster() { } function join_in_cluster() { - log "INFO " "$report_host joining in cluster" - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" - retry 10 ${mysqlshell} -e "cluster = dba.getCluster();cluster.addInstance('${replication_user}@${report_host}',{recoveryMethod:'incremental'});" + log "INFO" "$report_host joining in cluster" + local mysqlsh_primary="mysqlsh --js -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" + # Temporarily disable read-only for join operations (match run.sh) + ${mysql_local} -N -e "SET GLOBAL super_read_only=OFF; SET GLOBAL read_only=OFF;" 2>/dev/null + clear_stale_cluster_lock "${primary}" + retry 10 ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.addInstance('${replication_user}:${MYSQL_ROOT_PASSWORD}@${report_host}:3306',{recoveryMethod:'incremental'});" } function join_by_clone() { - log "INFO " "$report_host joining in cluster" - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" - retry 10 ${mysqlshell} -e "cluster = dba.getCluster();cluster.removeInstance('$report_host',{force:'true'});" - retry 10 ${mysqlshell} -e "cluster = dba.getCluster(); cluster.addInstance('${replication_user}@${report_host}',{recoveryMethod:'clone'});" - - #this is required for clone method - # Prevent creation of new process until this one is finished - #https://serverfault.com/questions/477448/mysql-keeps-crashing-innodb-unable-to-lock-ibdata1-error-11 + log "INFO" "$report_host joining in cluster by clone" + local mysqlsh_primary="mysqlsh --js -u${replication_user} 
-p${MYSQL_ROOT_PASSWORD} -h${primary}" + # Temporarily disable read-only for clone operations (match run.sh) + ${mysql_local} -N -e "SET GLOBAL super_read_only=OFF; SET GLOBAL read_only=OFF;" 2>/dev/null + clear_stale_cluster_lock "${primary}" + retry 10 ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.removeInstance('${report_host}:3306',{force:true});" + clear_stale_cluster_lock "${primary}" + retry 10 ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.addInstance('${replication_user}:${MYSQL_ROOT_PASSWORD}@${report_host}:3306',{recoveryMethod:'clone'});" + # Clone restarts mysqld — wait for the old process to finish wait $pid } + joined_in_cluster=0 -check_instance_joined_in_cluster() { - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" - out=($(${mysqlshell} --sql -e "SELECT member_host FROM performance_schema.replication_group_members;")) +function check_instance_joined_in_cluster() { + local mysqlsh_primary="mysqlsh --js -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" + out=($(${mysqlsh_primary} --sql -e "SELECT member_host FROM performance_schema.replication_group_members;")) for host in "${out[@]}"; do if [[ "$host" == "$report_host" ]]; then - join_in_cluster=1 - echo "$report_host successfully join_in_cluster" + joined_in_cluster=1 + echo "$report_host successfully joined_in_cluster" fi done } function make_sure_instance_join_in_cluster() { - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" - retry 10 ${mysqlshell} -e "cluster = dba.getCluster(); cluster.rescan({addInstances:['${report_host}:3306'],interactive:false})" + local mysqlsh_primary="mysqlsh --js -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" + clear_stale_cluster_lock "${primary}" + retry 10 ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.rescan()" } function rejoin_in_cluster() { - local mysqlshell="mysqlsh -u${replication_user} -p${MYSQL_ROOT_PASSWORD} 
-h${primary}" - ${mysqlshell} -e "cluster=dba.getCluster(); cluster.rejoinInstance('${replication_user}@${report_host}')" - out=($(${mysqlshell} --sql -e "SELECT member_host FROM performance_schema.replication_group_members;")) + local mysqlsh_primary="mysqlsh --js -u${replication_user} -p${MYSQL_ROOT_PASSWORD} -h${primary}" + # Refresh stale server_uuid entries in metadata before dba.getCluster() / + # cluster.rejoinInstance() so they don't reject this host as "unknown". + fix_metadata_uuids + # Temporarily disable read-only for rejoin (match run.sh) + ${mysql_local} -N -e "SET GLOBAL super_read_only=OFF; SET GLOBAL read_only=OFF;" 2>/dev/null + clear_stale_cluster_lock "${primary}" + ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.rejoinInstance('${replication_user}:${MYSQL_ROOT_PASSWORD}@${report_host}:3306')" + out=($(${mysqlsh_primary} --sql -e "SELECT member_host FROM performance_schema.replication_group_members;")) for host in "${out[@]}"; do if [[ "$host" == "$report_host" ]]; then - echo "$report_host successfully join_in_cluster" + echo "$report_host successfully joined_in_cluster" fi done check_instance_joined_in_cluster @@ -225,40 +436,128 @@ function rejoin_in_cluster() { fi check_instance_joined_in_cluster if [[ "$joined_in_cluster" == "0" ]]; then - retry 1 ${mysqlshell} -e "cluster = dba.getCluster();cluster.removeInstance('$report_host',{force:'true'});" + clear_stale_cluster_lock "${primary}" + retry 1 ${mysqlsh_primary} -e "cluster = dba.getCluster(); cluster.removeInstance('${report_host}:3306',{force:true});" join_in_cluster fi - } export pid function reboot_from_completeOutage() { - local mysqlshell="mysqlsh -u${replication_user} -h${report_host} -p${MYSQL_ROOT_PASSWORD}" - #https://dev.mysql.com/doc/dev/mysqlsh-api-javascript/8.0/classmysqlsh_1_1dba_1_1_dba.html#ac68556e9a8e909423baa47dc3b42aadb - #mysql wait for user interaction to remove the unavailable seed from the cluster.. 
+ local mysqlsh_self="mysqlsh --js -u${MYSQL_ROOT_USERNAME} -h${report_host} -p${MYSQL_ROOT_PASSWORD}" clusterName=$(echo -n $BASE_NAME | sed 's/-/_/g') - yes | $mysqlshell -e "dba.rebootClusterFromCompleteOutage('$clusterName',{force:'true'})" - yes | $mysqlshell -e "cluster = dba.getCluster(); cluster.rescan()" + + # Refresh stale server_uuid entries in metadata before + # dba.rebootClusterFromCompleteOutage(), which otherwise treats this + # node as a standalone instance (MYSQLSH 51300). + fix_metadata_uuids + + # Before rebooting, stop GR on any peer stuck in ERROR state. + # dba.rebootClusterFromCompleteOutage() refuses to proceed if any peer has GR + # in ERROR state ("belongs to a GR group that is not managed as an InnoDB Cluster"). + # All peers must be in OFFLINE state for the reboot to work. + for host in "${peers[@]}"; do + peer_state=$(mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e \ + "SELECT MEMBER_STATE FROM performance_schema.replication_group_members LIMIT 1;" 2>/dev/null) + if [[ "$peer_state" == "ERROR" ]]; then + log "INFO" "Stopping GR on $host (stuck in ERROR state) before cluster reboot..." + mysql -u${MYSQL_ROOT_USERNAME} -h${host} -p${MYSQL_ROOT_PASSWORD} --port=3306 -N -e "STOP GROUP_REPLICATION;" 2>/dev/null + fi + done + + # Temporarily disable read-only for reboot (match run.sh) + ${mysql_local} -N -e "SET GLOBAL super_read_only=OFF; SET GLOBAL read_only=OFF;" 2>/dev/null + + # Determine whether the InnoDB Cluster metadata schema exists AND recognizes + # this instance's server_uuid. dba.rebootClusterFromCompleteOutage() requires + # both — without them mysqlsh fails with MYSQLSH 51300 ("function not + # available through a session to a standalone instance"), and the coordinator + # ends up looping the reboot signal forever. 
This happens after: + # - the metadata schema was dropped (manually or by an upstream cleanup); + # - a logical restore where the source's metadata referenced a different + # cluster's pod hostnames / server_uuids (so this server_uuid is unknown + # to the metadata that came along with the restore); + # - any cluster recreation where IDC metadata was wiped. + local has_metadata known_instance my_uuid + has_metadata=$(${mysql_local} -N -e \ + "SELECT COUNT(*) FROM information_schema.schemata WHERE schema_name='mysql_innodb_cluster_metadata';" \ + 2>/dev/null || echo 0) + my_uuid=$(${mysql_local} -N -e "SELECT @@server_uuid;" 2>/dev/null) + known_instance=0 + if [[ "$has_metadata" == "1" && -n "$my_uuid" ]]; then + known_instance=$(${mysql_local} -N -e \ + "SELECT COUNT(*) FROM mysql_innodb_cluster_metadata.instances WHERE mysql_server_uuid='$my_uuid';" \ + 2>/dev/null || echo 0) + fi + + if [[ "$has_metadata" == "1" && "$known_instance" == "1" ]]; then + # Normal path — metadata is present and recognises this instance. + log "INFO" "InnoDB Cluster metadata present; running rebootClusterFromCompleteOutage" + yes | $mysqlsh_self -e "dba.rebootClusterFromCompleteOutage('$clusterName',{force:true})" + else + # Fallback path — metadata is missing or stale. Recreate it so this + # node is recognised and the cluster can come back ONLINE without + # operator intervention. + log "WARN" "InnoDB Cluster metadata missing or does not recognise this server_uuid (has_metadata=$has_metadata, known_instance=$known_instance); falling back to createCluster" + + # Drop any stale metadata schemas so createCluster starts clean. + # SQL_LOG_BIN=0 keeps these DDLs out of the binlog so peers don't + # replay them during the next round of recovery. 
+ ${mysql_local} -N -e " + SET SQL_LOG_BIN=0; + DROP DATABASE IF EXISTS mysql_innodb_cluster_metadata; + DROP DATABASE IF EXISTS mysql_innodb_cluster_metadata_bkp; + DROP DATABASE IF EXISTS mysql_innodb_cluster_metadata_previous; + SET SQL_LOG_BIN=1; + " 2>/dev/null + + # If GR is already running on at least one member, adopt the live + # group instead of bootstrapping a new one (preserves any post-outage + # writes already in flight). Otherwise plain createCluster will + # configure + bootstrap GR locally and seed metadata. + local gr_online + gr_online=$(${mysql_local} -N -e \ + "SELECT COUNT(*) FROM performance_schema.replication_group_members WHERE MEMBER_STATE='ONLINE';" \ + 2>/dev/null || echo 0) + + local create_opts="multiPrimary:false,force:true" + if [[ "$PRIMARY_TYPE" == "Multi-Primary" ]]; then + create_opts="multiPrimary:true,force:true" + fi + + if [[ "${gr_online}" -ge "1" ]]; then + log "INFO" "GR already ONLINE on some member; createCluster with adoptFromGR:true" + # adoptFromGR derives the topology from the running group; mysqlsh rejects + # multiPrimary/force combined with adoptFromGR, so pass adoptFromGR alone. + yes | $mysqlsh_self -e "dba.createCluster('$clusterName',{adoptFromGR:true});" + else + log "INFO" "GR is OFFLINE everywhere; createCluster will bootstrap GR locally" + yes | $mysqlsh_self -e "dba.createCluster('$clusterName',{${create_opts}});" + fi + fi + + clear_stale_cluster_lock "${report_host}" + yes | $mysqlsh_self -e "cluster = dba.getCluster(); cluster.rescan()" wait $pid } function start_mysqld_in_background() { log "INFO" "Starting mysql server with 'docker-entrypoint.sh mysqld $args'..." - /entrypoint.sh mysqld --user=root --report-host=$report_host --bind-address=* $args & + # Use docker-entrypoint.sh (in PATH at /usr/local/bin/) — works on both + # Oracle mysql-server images and appscode images. + docker-entrypoint.sh mysqld --user=root --report-host=$report_host --bind-address='*' $args & + pid=$!
log "INFO" "The process id of mysqld is '$pid'" } -replication_user=repl +# ── Main flow ──────────────────────────────────────────────────────────────── start_mysqld_in_background -wait_for_host_online "root" "localhost" "$MYSQL_ROOT_PASSWORD" +wait_for_host_online "${MYSQL_ROOT_USERNAME}" "localhost" "$MYSQL_ROOT_PASSWORD" create_replication_user configure_instance if [[ "$restart_required" == "1" ]]; then start_mysqld_in_background - wait_for_host_online "repl" "$report_host" "$MYSQL_ROOT_PASSWORD" + wait_for_host_online "${MYSQL_ROOT_USERNAME}" "$report_host" "$MYSQL_ROOT_PASSWORD" fi mysqld_alive=0 @@ -272,56 +571,77 @@ function check_mysqld_alive() { fi } +# ── Signal loop ────────────────────────────────────────────────────────────── + while true; do + echo "running">/scripts/setup.txt + log "INFO" "creating setup.txt file" check_mysqld_alive if [[ "$mysqld_alive" == "1" ]]; then echo "mysqld process is running" else echo "need start mysqld and wait_for_mysqld_running" start_mysqld_in_background - wait_for_host_online "repl" "$report_host" "$MYSQL_ROOT_PASSWORD" + wait_for_host_online "${MYSQL_ROOT_USERNAME}" "$report_host" "$MYSQL_ROOT_PASSWORD" fi - # wait for the script copied by coordinator + # wait for the signal file from coordinator + # Also check if this node is already ONLINE in GR — this happens when + # another pod's coordinator called rebootClusterFromCompleteOutage() which + # rejoins all members remotely via mysqlsh AdminAPI, bypassing this script. while [ ! -f "/scripts/signal.txt" ]; do + member_state=$(mysql -u${MYSQL_ROOT_USERNAME} -hlocalhost -p${MYSQL_ROOT_PASSWORD} -N -e \ + "SELECT MEMBER_STATE FROM performance_schema.replication_group_members WHERE MEMBER_HOST='${report_host}' LIMIT 1;" 2>/dev/null) + if [[ "$member_state" == "ONLINE" ]]; then + log "INFO" "Already ONLINE in GR group (joined by another node's reboot) — skipping signal wait" + break + fi log "WARNING" "signal is not present yet!" 
sleep 1 done - desired_func=$(cat /scripts/signal.txt) - rm -rf /scripts/signal.txt - log "INFO" "going to execute $desired_func" + # If we broke out because GR is already ONLINE (no signal file), skip to wait. + if [ ! -f "/scripts/signal.txt" ]; then + log "INFO" "No signal to execute — node already joined via external reboot" + else + desired_func=$(cat /scripts/signal.txt) + rm -rf /scripts/signal.txt + log "INFO" "going to execute $desired_func" - if [[ $desired_func == "create_cluster" ]]; then - create_cluster - fi + if [[ $desired_func == "create_cluster" ]]; then + create_cluster + fi - if [[ $desired_func == "join_in_cluster" ]]; then - select_primary - join_in_cluster - check_instance_joined_in_cluster - if [[ "$joined_in_cluster" == "0" ]]; then - make_sure_instance_join_in_cluster + if [[ $desired_func == "join_in_cluster" ]]; then + select_primary + join_in_cluster + check_instance_joined_in_cluster + if [[ "$joined_in_cluster" == "0" ]]; then + make_sure_instance_join_in_cluster + fi fi - fi - if [[ $desired_func == "rejoin_in_cluster" ]]; then - select_primary - rejoin_in_cluster - fi - if [[ $desired_func == "join_by_clone" ]]; then - select_primary - join_by_clone - start_mysqld_in_background - wait_for_host_online "repl" "$report_host" "$MYSQL_ROOT_PASSWORD" - join_in_cluster - fi + if [[ $desired_func == "rejoin_in_cluster" ]]; then + select_primary + rejoin_in_cluster + fi + + if [[ $desired_func == "join_by_clone" ]]; then + select_primary + join_by_clone + start_mysqld_in_background + wait_for_host_online "${MYSQL_ROOT_USERNAME}" "$report_host" "$MYSQL_ROOT_PASSWORD" + join_in_cluster + fi - if [[ $desired_func == "reboot_from_complete_outage" ]]; then - reboot_from_completeOutage + if [[ $desired_func == "reboot_from_complete_outage" ]]; then + reboot_from_completeOutage + fi fi - log "INFO" "waiting for mysql process id = $pid" - wait $pid - rm -rf /scripts/signal.txt + log "INFO" "removing setup.txt file" + rm -rf /scripts/signal.txt + rm 
+  rm -rf /scripts/setup.txt
+  log "INFO" "waiting for mysql process id = $pid"
+  wait $pid
 done