
Commit 5c73861

fixes
1 parent 03f3a40 commit 5c73861

File tree

3 files changed: +154 -131 lines changed

e2e-tests/functions
e2e-tests/tests/async-upgrade/02-upgrade-operator.yaml
e2e-tests/tests/gr-upgrade/02-upgrade-operator.yaml

e2e-tests/functions

Lines changed: 150 additions & 131 deletions
@@ -54,34 +54,46 @@ wait_for_delete() {
 	done
 }
 
+apply_crd() {
+	kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply --server-side --force-conflicts -f "${DEPLOY_DIR}/crd.yaml"
+}
+
+apply_rbac() {
+	local rbac_file
+
+	if [ -n "$OPERATOR_NS" ]; then
+		rbac_file="${DEPLOY_DIR}/cw-rbac.yaml"
+	else
+		rbac_file="${DEPLOY_DIR}/rbac.yaml"
+	fi
+
+	kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f "${rbac_file}"
+}
+
 deploy_operator() {
 	destroy_operator
 
 	if [[ $OPERATOR_NS ]]; then
 		create_namespace "${OPERATOR_NS}"
 	fi
 
-	kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply --server-side --force-conflicts -f "${DEPLOY_DIR}/crd.yaml"
+	apply_crd
+	apply_rbac
+
+	local operator_file
 
 	if [ -n "$OPERATOR_NS" ]; then
-		kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f "${DEPLOY_DIR}/cw-rbac.yaml"
-
-		yq eval \
-			"$(printf 'select(documentIndex==1).spec.template.spec.containers[0].image="%s"' "${IMAGE}")" \
-			"${DEPLOY_DIR}/cw-operator.yaml" \
-			| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="DISABLE_TELEMETRY").value) = "true"' \
-			| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="LOG_LEVEL").value) = "DEBUG"' \
-			| kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f -
+		operator_file="${DEPLOY_DIR}/cw-operator.yaml"
 	else
-		kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f "${DEPLOY_DIR}/rbac.yaml"
-
-		yq eval \
-			"$(printf 'select(documentIndex==1).spec.template.spec.containers[0].image="%s"' "${IMAGE}")" \
-			"${DEPLOY_DIR}/operator.yaml" \
-			| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="DISABLE_TELEMETRY").value) = "true"' \
-			| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="LOG_LEVEL").value) = "DEBUG"' \
-			| kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f -
+		operator_file="${DEPLOY_DIR}/operator.yaml"
 	fi
+
+	yq eval \
+		"$(printf 'select(documentIndex==1).spec.template.spec.containers[0].image="%s"' "${IMAGE}")" \
+		"${operator_file}" \
+		| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="DISABLE_TELEMETRY").value) = "true"' \
+		| yq eval '(select(documentIndex==1).spec.template.spec.containers[] | select(.name=="manager").env[] | select(.name=="LOG_LEVEL").value) = "DEBUG"' \
+		| kubectl -n "${OPERATOR_NS:-$NAMESPACE}" apply -f -
 }
 
 upgrade_operator_image() {
@@ -136,8 +148,8 @@ deploy_tls_cluster_secrets() {
 }
 
 deploy_client() {
-	yq eval "$(printf '.spec.containers[0].image="%s"' "${IMAGE_MYSQL}")" "${TESTS_CONFIG_DIR}/client.yaml" | \
-		kubectl -n "${NAMESPACE}" apply -f -
+	yq eval "$(printf '.spec.containers[0].image="%s"' "${IMAGE_MYSQL}")" "${TESTS_CONFIG_DIR}/client.yaml" \
+		| kubectl -n "${NAMESPACE}" apply -f -
 }
 
 apply_s3_storage_secrets() {
@@ -383,8 +395,9 @@ get_cr() {
 	local image_toolkit=${6:-${IMAGE_TOOLKIT}}
 	local image_haproxy=${7:-${IMAGE_HAPROXY}}
 	local image_pmm_client=${8:-${IMAGE_PMM_CLIENT}}
+	local cr_file=${9:-${DEPLOY_DIR}/cr.yaml}
 
-	yq eval "$(printf '.metadata.name="%s"' "${test_name}${name_suffix:+-$name_suffix}")" "${DEPLOY_DIR}/cr.yaml" \
+	yq eval "$(printf '.metadata.name="%s"' "${test_name}${name_suffix:+-$name_suffix}")" "${cr_file}" \
 		| yq eval "$(printf '.spec.initImage="%s"' "${IMAGE}")" - \
 		| yq eval '.spec.secretsName="test-secrets"' - \
 		| yq eval '.spec.sslSecretName="test-ssl"' - \
@@ -461,11 +474,11 @@ get_innodb_cluster_status() {
 wait_until_innodb_ok() {
 	local uri="$1"
 
-    local retry=0
-    until [[ $(get_innodb_cluster_status ${uri} | jq -r .defaultReplicaSet.status) == "OK" ]]; do
-        sleep 5
-        retry=$((retry + 1))
-    done
+	local retry=0
+	until [[ $(get_innodb_cluster_status ${uri} | jq -r .defaultReplicaSet.status) == "OK" ]]; do
+		sleep 5
+		retry=$((retry + 1))
+	done
 }
 
 run_curl() {
@@ -477,8 +490,7 @@ get_innodb_cluster_name() {
 }
 
 get_mysqlsh_uri_for_pod() {
-    local pod=$1
-
+	local pod=$1
 
 	echo "root:root_password@${pod}.$(get_cluster_name)-mysql.${NAMESPACE}"
 }
@@ -673,7 +685,7 @@ wait_cluster_consistency_gr() {
 
 wait_pod() {
 	local pod=$1
-    local ns=${2:-${NAMESPACE}}
+	local ns=${2:-${NAMESPACE}}
 
 	set +o xtrace
 	retry=0
@@ -952,120 +964,120 @@ network_loss() {
 }
 
 wait_until_chaos_applied() {
-    local chaos_type=$1
-    local chaos_name=$2
-
-    local resource
-    case ${chaos_type} in
-        "kill"|"failure"|"full-cluster-crash")
-            resource=podchaos/${chaos_name}
-            ;;
-        "network")
-            resource=networkchaos/${chaos_name}
-            ;;
-    esac
-
-    local retry=0
-    until [[ ${retry} == 30 ]]; do
-        sleep 10
-        retry=$((retry + 1))
-
-        succeeded=$(kubectl -n ${NAMESPACE} get ${resource} -o yaml \
-            | yq '.status.experiment.containerRecords[].events[]
+	local chaos_type=$1
+	local chaos_name=$2
+
+	local resource
+	case ${chaos_type} in
+		"kill" | "failure" | "full-cluster-crash")
+			resource=podchaos/${chaos_name}
+			;;
+		"network")
+			resource=networkchaos/${chaos_name}
+			;;
+	esac
+
+	local retry=0
+	until [[ ${retry} == 30 ]]; do
+		sleep 10
+		retry=$((retry + 1))
+
+		succeeded=$(kubectl -n ${NAMESPACE} get ${resource} -o yaml \
+			| yq '.status.experiment.containerRecords[].events[]
 			| select(.operation == "Apply" and .type == "Succeeded")')
 
-        if [[ -n ${succeeded} ]]; then
-            return
-        fi
-    done
+		if [[ -n ${succeeded} ]]; then
+			return
+		fi
+	done
 
-    echo "Timeout (300s) exceeded while waiting for chaos to be applied"
-    exit 1
+	echo "Timeout (300s) exceeded while waiting for chaos to be applied"
+	exit 1
 }
 
 wait_until_chaos_recovered() {
-    local chaos_type=$1
-    local chaos_name=$2
-
-    local resource
-    case ${chaos_type} in
-        "kill"|"failure")
-            resource=podchaos/${chaos_name}
-            ;;
-        "network")
-            resource=networkchaos/${chaos_name}
-            ;;
-    esac
-
-    local retry=0
-    until [[ ${retry} == 30 ]]; do
-        sleep 10
-        retry=$((retry + 1))
-
-        succeeded=$(kubectl -n ${NAMESPACE} get ${resource} -o yaml \
-            | yq '.status.experiment.containerRecords[].events[]
+	local chaos_type=$1
+	local chaos_name=$2
+
+	local resource
+	case ${chaos_type} in
+		"kill" | "failure")
+			resource=podchaos/${chaos_name}
+			;;
+		"network")
+			resource=networkchaos/${chaos_name}
+			;;
+	esac
+
+	local retry=0
+	until [[ ${retry} == 30 ]]; do
+		sleep 10
+		retry=$((retry + 1))
+
+		succeeded=$(kubectl -n ${NAMESPACE} get ${resource} -o yaml \
+			| yq '.status.experiment.containerRecords[].events[]
 			| select(.operation == "Recover" and .type == "Succeeded")')
 
-        if [[ -n ${succeeded} ]]; then
-            return
-        fi
-    done
+		if [[ -n ${succeeded} ]]; then
+			return
+		fi
+	done
 
-    echo "Timeout (300s) exceeded while waiting for chaos to be recovered"
-    exit 1
+	echo "Timeout (300s) exceeded while waiting for chaos to be recovered"
+	exit 1
 }
 
 check_primary_chaos() {
-    local chaos_type=$1
-    local ns=$2
-    local primary_before_failure=$3
-
-    local chaos_name
-    case ${chaos_type} in
-        "kill")
-            chaos_name="chaos-pod-kill-primary"
-            kill_pods "${ns}" "pod" "${primary_before_failure}" "" "${chaos_name}"
-            ;;
-        "full-cluster-crash")
-            chaos_name="chaos-kill-label-cluster-crash"
-            kill_pods "${ns}" "label" "app.kubernetes.io/instance" "gr-self-healing" "${chaos_name}"
-            ;;
-        "failure")
-            chaos_name="chaos-pod-failure-primary"
-            failure_pod "${ns}" "${primary_before_failure}" "${chaos_name}"
-            ;;
-        "network")
-            chaos_name="chaos-pod-network-loss-primary"
-            network_loss "${ns}" "${primary_before_failure}" "${chaos_name}"
-            ;;
-    esac
-
-    wait_until_chaos_applied ${chaos_type} ${chaos_name}
-    if [[ ${chaos_type} == "failure" || ${chaos_type} == "network" ]]; then
-        wait_until_chaos_recovered ${chaos_type} ${chaos_name}
-    fi
-
-    wait_cluster_consistency_gr "$(get_cluster_name)" 3 3
-
-    primary_after_failure=$(get_primary_from_group_replication)
-    uri=$(get_mysqlsh_uri_for_pod ${primary_after_failure})
-    wait_until_innodb_ok ${uri}
-
-    if [[ "${primary_before_failure}" == "${primary_after_failure}" ]]; then
-        echo "primary pod was not killed! something went wrong."
-        exit 1
-    fi
-
-    uri=$(get_mysqlsh_uri_for_pod $(get_primary_from_group_replication))
-    online_members=$(get_innodb_cluster_status ${uri} \
-        | jq .defaultReplicaSet.topology[].status \
-        | grep ONLINE \
-        | wc -l)
-
-    if [[ ${online_members} != 3 ]]; then
-        echo "expected 3 online members, got ${online_members}"
-        exit 1
-    fi
+	local chaos_type=$1
+	local ns=$2
+	local primary_before_failure=$3
+
+	local chaos_name
+	case ${chaos_type} in
+		"kill")
+			chaos_name="chaos-pod-kill-primary"
+			kill_pods "${ns}" "pod" "${primary_before_failure}" "" "${chaos_name}"
+			;;
+		"full-cluster-crash")
+			chaos_name="chaos-kill-label-cluster-crash"
+			kill_pods "${ns}" "label" "app.kubernetes.io/instance" "gr-self-healing" "${chaos_name}"
+			;;
+		"failure")
+			chaos_name="chaos-pod-failure-primary"
+			failure_pod "${ns}" "${primary_before_failure}" "${chaos_name}"
+			;;
+		"network")
+			chaos_name="chaos-pod-network-loss-primary"
+			network_loss "${ns}" "${primary_before_failure}" "${chaos_name}"
+			;;
+	esac
+
+	wait_until_chaos_applied ${chaos_type} ${chaos_name}
+	if [[ ${chaos_type} == "failure" || ${chaos_type} == "network" ]]; then
+		wait_until_chaos_recovered ${chaos_type} ${chaos_name}
+	fi
+
+	wait_cluster_consistency_gr "$(get_cluster_name)" 3 3
+
+	primary_after_failure=$(get_primary_from_group_replication)
+	uri=$(get_mysqlsh_uri_for_pod ${primary_after_failure})
+	wait_until_innodb_ok ${uri}
+
+	if [[ ${primary_before_failure} == "${primary_after_failure}" ]]; then
+		echo "primary pod was not killed! something went wrong."
+		exit 1
+	fi
+
+	uri=$(get_mysqlsh_uri_for_pod $(get_primary_from_group_replication))
+	online_members=$(get_innodb_cluster_status ${uri} \
+		| jq .defaultReplicaSet.topology[].status \
+		| grep ONLINE \
+		| wc -l)
+
+	if [[ ${online_members} != 3 ]]; then
+		echo "expected 3 online members, got ${online_members}"
+		exit 1
+	fi
 }
 
 renew_certificate() {
@@ -1204,6 +1216,7 @@ check_scheduled_backup_labels() {
 		echo "Label percona.com/backup-ancestor is missing"
 		exit 1
 	fi
+}
 
 latest_operator_version_in_vs() {
 	local latest=$(curl -s https://check.percona.com/versions/v1/ps-operator | jq -r '.versions[].operator' | sort -V | tail -n1)
@@ -1235,12 +1248,18 @@ get_cr_with_latest_versions_in_vs() {
 	local image_haproxy=$(echo ${latest_versions} | jq -r '.versions[].matrix.haproxy[].imagePath')
 	local image_pmm_client=$(echo ${latest_versions} | jq -r '.versions[].matrix.pmm[].imagePath')
 
+	local git_tag="v${version}"
+
+	curl "https://raw.githubusercontent.com/percona/percona-server-mysql-operator/${git_tag}/deploy/cr.yaml" \
+		-o ${TEMP_DIR}/cr.yaml
+
 	get_cr "" \
 		${image_mysql} \
 		${image_backup} \
 		${image_orchestrator} \
 		${image_router} \
 		${image_toolkit} \
 		${image_haproxy} \
-		${image_pmm_client}
+		${image_pmm_client} \
+		${TEMP_DIR}/cr.yaml
 }
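
The new ninth get_cr parameter lets a caller render a CR manifest other than ${DEPLOY_DIR}/cr.yaml, which is what get_cr_with_latest_versions_in_vs does with the file it downloads into ${TEMP_DIR}. A minimal usage sketch for a test step, assuming get_cr prints the rendered CR to stdout; the IMAGE_BACKUP, IMAGE_ORCHESTRATOR and IMAGE_ROUTER variable names for positions 3-5 are assumptions (only IMAGE_MYSQL, IMAGE_TOOLKIT, IMAGE_HAPROXY and IMAGE_PMM_CLIENT appear in this diff):

	# Hypothetical snippet: all eight image arguments are passed positionally
	# so that the ninth argument (the alternate CR file) is reached.
	get_cr "" \
		"${IMAGE_MYSQL}" \
		"${IMAGE_BACKUP}" \
		"${IMAGE_ORCHESTRATOR}" \
		"${IMAGE_ROUTER}" \
		"${IMAGE_TOOLKIT}" \
		"${IMAGE_HAPROXY}" \
		"${IMAGE_PMM_CLIENT}" \
		"${TEMP_DIR}/cr.yaml" \
		| kubectl -n "${NAMESPACE}" apply -f -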

e2e-tests/tests/async-upgrade/02-upgrade-operator.yaml

Lines changed: 2 additions & 0 deletions
@@ -8,5 +8,7 @@ commands:
 
       source ../../functions
 
+      apply_crd
+      apply_rbac
       upgrade_operator_image ${IMAGE}
       wait_deployment percona-server-mysql-operator ${OPERATOR_NS:-$NAMESPACE}

e2e-tests/tests/gr-upgrade/02-upgrade-operator.yaml

Lines changed: 2 additions & 0 deletions
@@ -8,5 +8,7 @@ commands:
 
       source ../../functions
 
+      apply_crd
+      apply_rbac
       upgrade_operator_image ${IMAGE}
      wait_deployment percona-server-mysql-operator ${OPERATOR_NS:-$NAMESPACE}
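
Both upgrade steps now re-apply the CRDs and RBAC before swapping the operator image and rely on wait_deployment for readiness. If an explicit rollout check is ever wanted in addition, a standard kubectl form (a sketch, using only the deployment name already referenced above) would be:

	kubectl -n "${OPERATOR_NS:-$NAMESPACE}" rollout status deployment/percona-server-mysql-operator --timeout=300s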
