123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357 |
// Jenkins declarative pipeline: deploys a Milvus release with Helm, runs
// smoke tests, runs the selected chaos test against it, re-runs the smoke
// tests, then collects logs and (unless keep_env is set) uninstalls the release.

// Returns the cluster IP of this run's "<RELEASE_NAME>-milvus" service.
// The namespace is passed explicitly so the lookup targets the same namespace
// the `kubectl wait` calls use, independent of kubectl's default context.
def milvusHost() {
    return sh(
        returnStdout: true,
        script: "kubectl get svc/${env.RELEASE_NAME}-milvus -n ${env.NAMESPACE} -o jsonpath=\"{.spec.clusterIP}\""
    ).trim()
}

// Prints the pods of this run's release (fails when grep matches nothing).
def listReleasePods() {
    sh "kubectl get pods -n ${env.NAMESPACE} -o wide|grep ${env.RELEASE_NAME}"
}

// Blocks until every pod of the release reports Ready, then lists the pods.
// Two label selectors are waited on because the release's pods are labelled
// either with `app.kubernetes.io/instance` or with `release`.
def waitForPodsReady() {
    sh "kubectl wait --for=condition=Ready pod -l app.kubernetes.io/instance=${env.RELEASE_NAME} -n ${env.NAMESPACE} --timeout=360s"
    sh "kubectl wait --for=condition=Ready pod -l release=${env.RELEASE_NAME} -n ${env.NAMESPACE} --timeout=360s"
    listReleasePods()
}

pipeline {
    options {
        timestamps()
        // Upper bound for the WHOLE pipeline run; individual stages below
        // declare their own, tighter limits.
        // NOTE(review): the per-stage limits add up to more than 30 minutes,
        // so this global limit is the one that applies on slow runs - confirm
        // that is intended.
        timeout(time: 30, unit: 'MINUTES')
    }
    agent {
        kubernetes {
            label "milvus-test"
            defaultContainer 'main'
            yamlFile "build/ci/jenkins/pod/chaos-test.yaml"
            customWorkspace '/home/jenkins/agent/workspace'
            // idle 5 minutes to wait clean up tasks
            idleMinutes 5
        }
    }
    parameters {
        choice(
            description: 'Chaos Test Type',
            name: 'chaos_type',
            choices: ['pod-kill', 'pod-failure', 'mem-stress', 'network-latency', 'network-partition', 'io-latency']
        )
        // The continuation lines of this description are kept at column 0 so
        // that no indentation leaks into the displayed text.
        choice(
            description: 'Chaos Test Target: \
mem-stress: datanode, etcd, indexnode, minio, proxy, kafka, querynode, standalone \
io-fault & io-latency: minio, kafka, etcd ',
            name: 'pod_name',
            choices: ["allstandalone", "allcluster", "standalone", "datacoord", "datanode", "indexcoord", "indexnode", "proxy", "kafka", "querycoord", "querynode", "rootcoord", "etcd", "minio"]
        )
        choice(
            description: 'Chaos Test Task',
            name: 'chaos_task',
            choices: ['chaos-test', 'data-consist-test']
        )
        string(
            description: 'Image Repository',
            name: 'image_repository',
            defaultValue: 'harbor.milvus.io/dockerhub/milvusdb/milvus'
        )
        string(
            description: 'Image Tag',
            name: 'image_tag',
            defaultValue: 'master-latest'
        )
        // The parameter name keeps its historical spelling ("idel") because
        // existing job configurations and triggers refer to it by that name.
        string(
            description: 'Wait Time after chaos test',
            name: 'idel_time',
            defaultValue: '1'
        )
        string(
            description: 'Etcd Image Repository',
            name: 'etcd_image_repository',
            defaultValue: "milvusdb/etcd"
        )
        string(
            description: 'Etcd Image Tag',
            name: 'etcd_image_tag',
            defaultValue: "3.5.0-r6"
        )
        string(
            description: 'QueryNode Nums',
            name: 'querynode_nums',
            defaultValue: '3'
        )
        string(
            description: 'DataNode Nums',
            name: 'datanode_nums',
            defaultValue: '2'
        )
        string(
            description: 'IndexNode Nums',
            name: 'indexnode_nums',
            defaultValue: '1'
        )
        string(
            description: 'Proxy Nums',
            name: 'proxy_nums',
            defaultValue: '1'
        )
        // A boolean parameter takes a boolean default, not the string 'false'.
        booleanParam(
            description: 'Keep Env',
            name: 'keep_env',
            defaultValue: false
        )
    }

    environment {
        ARTIFACTS = "${env.WORKSPACE}/_artifacts"
        // Helm release name; unique per build through BUILD_ID.
        RELEASE_NAME = "${params.pod_name}-${params.chaos_type}-${env.BUILD_ID}"
        NAMESPACE = "chaos-testing"
    }

    stages {
        stage ('Install Dependency') {
            steps {
                container('main') {
                    dir ('tests/python_client') {
                        script {
                            // --trusted-host takes a host[:port], not a URL.
                            sh "pip install -r requirements.txt --trusted-host test.pypi.org"
                        }
                    }
                }
            }
        }
        stage ('Modify Milvus chart values') {
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            // Enable kafka in both values files, apply the requested
                            // replica counts to the cluster values, and pin the etcd
                            // image in both.
                            sh """
                            yq -i '.kafka.enabled = true' standalone-values.yaml
                            yq -i '.kafka.enabled = true' cluster-values.yaml
                            yq -i '.queryNode.replicas = "${params.querynode_nums}"' cluster-values.yaml
                            yq -i '.dataNode.replicas = "${params.datanode_nums}"' cluster-values.yaml
                            yq -i '.indexNode.replicas = "${params.indexnode_nums}"' cluster-values.yaml
                            yq -i '.proxy.replicas = "${params.proxy_nums}"' cluster-values.yaml
                            yq -i '.etcd.image.repository = "${params.etcd_image_repository}"' cluster-values.yaml
                            yq -i '.etcd.image.tag = "${params.etcd_image_tag}"' cluster-values.yaml
                            yq -i '.etcd.image.repository = "${params.etcd_image_repository}"' standalone-values.yaml
                            yq -i '.etcd.image.tag = "${params.etcd_image_tag}"' standalone-values.yaml
                            """
                        }
                    }
                }
            }
        }
        stage ('Deploy Milvus') {
            options {
                timeout(time: 15, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos/scripts') {
                        script {
                            // "master-latest" is resolved to a concrete tag by the
                            // helper script; any other tag is used verbatim.
                            def image_tag_modified = ""
                            if ("${params.image_tag}" == "master-latest") {
                                image_tag_modified = sh(returnStdout: true, script: 'bash ../../../../scripts/docker_image_find_tag.sh -n milvusdb/milvus -t master-latest -f master- -F -L -q').trim()
                            } else {
                                image_tag_modified = "${params.image_tag}"
                            }
                            sh "echo ${image_tag_modified}"
                            sh "echo ${params.chaos_type}"
                            sh "helm repo add milvus https://zilliztech.github.io/milvus-helm"
                            sh "helm repo update"

                            // Targets whose name contains "standalone" use the standalone
                            // installer; everything else uses the cluster installer.
                            def pod_name = "${params.pod_name}"
                            def installScript = pod_name.contains("standalone") ? "install_milvus_standalone.sh" : "install_milvus_cluster.sh"
                            sh """
                            IMAGE_TAG="${image_tag_modified}" \
                            REPOSITORY="${params.image_repository}" \
                            RELEASE_NAME="${env.RELEASE_NAME}" \
                            bash ${installScript}
                            """
                            waitForPodsReady()
                        }
                    }
                }
            }
        }
        stage ('Run e2e test before chaos') {
            options {
                timeout(time: 5, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            def host = milvusHost()
                            sh "pytest -s -v ../testcases/test_e2e.py --host $host --log-cli-level=INFO --capture=no"
                        }
                    }
                }
            }
        }
        stage ('Run hello_milvus before chaos') {
            options {
                timeout(time: 5, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            def host = milvusHost()
                            sh "python3 scripts/hello_milvus.py --host $host"
                        }
                    }
                }
            }
        }
        stage ('Run chaos test') {
            options {
                timeout(time: 15, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            sh """
                            POD_NAME="${params.pod_name}" \
                            CHAOS_TYPE="${params.chaos_type}" \
                            RELEASE_NAME="${env.RELEASE_NAME}" \
                            bash scripts/modify_config.sh
                            """
                            // Map the selected task to its pytest file.
                            def testFileByTask = [
                                'chaos-test'       : 'test_chaos.py',
                                'data-consist-test': 'test_chaos_data_consist.py'
                            ]
                            def testFile = testFileByTask["${params.chaos_task}".toString()]
                            if (testFile) {
                                def host = milvusHost()
                                // Deliberately best-effort: a failing or timed-out test run
                                // only prints a message so that the recovery checks in the
                                // following stages still execute.
                                sh "timeout 14m pytest -s -v ${testFile} --host $host --log-cli-level=INFO --capture=no || echo 'chaos test fail' "
                            }
                            echo "chaos test done"
                            // The release must return to Ready after the chaos run.
                            waitForPodsReady()
                        }
                    }
                }
            }
        }
        stage ('result analysis') {
            steps {
                container('main') {
                    dir ('tests/python_client/chaos/reports') {
                        script {
                            echo "result analysis"
                            sh "cat ${env.RELEASE_NAME}.log || echo 'no log file'"
                        }
                    }
                }
            }
        }
        stage ('Milvus Idle Time') {
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            // idel_time is interpreted as minutes (the "m" suffix of sleep).
                            echo "sleep ${params.idel_time}m"
                            sh "sleep ${params.idel_time}m"
                        }
                    }
                }
            }
        }
        stage ('run e2e test after chaos') {
            options {
                timeout(time: 5, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            def host = milvusHost()
                            sh "pytest -s -v ../testcases/test_e2e.py --host $host --log-cli-level=INFO --capture=no"
                            listReleasePods()
                        }
                    }
                }
            }
        }
        stage ('Run hello_milvus after chaos') {
            options {
                timeout(time: 5, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            def host = milvusHost()
                            sh "python3 scripts/hello_milvus.py --host $host"
                            listReleasePods()
                        }
                    }
                }
            }
        }
        stage ('Verify all collections after chaos') {
            options {
                timeout(time: 10, unit: 'MINUTES') // timeout on this stage
            }
            steps {
                container('main') {
                    dir ('tests/python_client/chaos') {
                        script {
                            def host = milvusHost()
                            sh "python3 scripts/verify_all_collections.py --host $host"
                            listReleasePods()
                        }
                    }
                }
            }
        }
    }
    post {
        always {
            echo 'upload logs'
            container('main') {
                dir ('tests/python_client/chaos') {
                    script {
                        // Every collection step is best-effort (`|| true`) so that a
                        // missing log source never hides the real build result.
                        echo "get pod status"
                        sh "kubectl get pods -n ${env.NAMESPACE} -o wide|grep ${env.RELEASE_NAME} || true"
                        echo "collecte logs"
                        sh "bash ../../scripts/export_log_k8s.sh ${env.NAMESPACE} ${env.RELEASE_NAME} k8s_log/${env.RELEASE_NAME} || true"
                        sh "tar -zcvf artifacts-${env.RELEASE_NAME}-pytest-logs.tar.gz /tmp/ci_logs/ --remove-files || true"
                        sh "tar -zcvf artifacts-${env.RELEASE_NAME}-server-logs.tar.gz k8s_log/ --remove-files || true"
                        archiveArtifacts artifacts: "artifacts-${env.RELEASE_NAME}-pytest-logs.tar.gz", allowEmptyArchive: true
                        archiveArtifacts artifacts: "artifacts-${env.RELEASE_NAME}-server-logs.tar.gz", allowEmptyArchive: true
                        // Tear the release down unless the user asked to keep it.
                        if ("${params.keep_env}" == "false") {
                            sh "bash scripts/uninstall_milvus.sh ${env.RELEASE_NAME}"
                        }
                    }
                }
            }
        }
        success {
            echo 'I succeeeded!'
            container('main') {
                dir ('tests/python_client/chaos/scripts') {
                    script {
                        // Honour keep_env here as well: an unconditional uninstall
                        // would destroy the environment of every passing run even
                        // when the user asked to keep it.
                        if ("${params.keep_env}" == "false") {
                            sh "bash uninstall_milvus.sh ${env.RELEASE_NAME} || true"
                        }
                    }
                }
            }
        }
        unstable {
            echo 'I am unstable :/'
        }
        failure {
            echo 'I failed :('
        }
        changed {
            echo 'Things were different before...'
        }
    }
}
|