Patch summary (text before the first "diff --git" header is ignored by git apply):
  * Add Ansible-runner variants of the kafka-broker-pod-failure engine,
    experiment and RBAC manifests under ansible/.
  * Point the main experiment at litmuschaos/go-runner, drop the Ansible-only
    env vars (ANSIBLE_STDOUT_CALLBACK, KAFKA_SASL_AUTH, LIB_IMAGE) and add SEQUENCE.
  * Replace the single broad litmus-admin ClusterRole rule with two narrower rules.

diff --git a/charts/kafka/kafka-broker-pod-failure/ansible/engine.yaml b/charts/kafka/kafka-broker-pod-failure/ansible/engine.yaml
new file mode 100644
index 0000000..90f79dc
--- /dev/null
+++ b/charts/kafka/kafka-broker-pod-failure/ansible/engine.yaml
@@ -0,0 +1,79 @@
+apiVersion: litmuschaos.io/v1alpha1
+kind: ChaosEngine
+metadata:
+  name: kafka-chaos
+  namespace: default
+spec:
+  # It can be true/false
+  annotationCheck: 'true'
+  # It can be active/stop
+  engineState: 'active'
+  #ex. values: ns1:name=percona,ns2:run=nginx
+  auxiliaryAppInfo: ''
+  appinfo:
+    appns: 'default'
+    applabel: 'app=cp-kafka'
+    appkind: 'statefulset'
+  chaosServiceAccount: kafka-broker-pod-failure-sa
+  monitoring: false
+  # It can be delete/retain
+  jobCleanUpPolicy: 'delete'
+  experiments:
+    - name: kafka-broker-pod-failure
+      spec:
+        components:
+          env:
+            # choose based on available kafka broker replicas
+            - name: KAFKA_REPLICATION_FACTOR
+              value: '3'
+
+            # get via 'kubectl get pods --show-labels -n <kafka-namespace>'
+            - name: KAFKA_LABEL
+              value: 'app=cp-kafka'
+
+            - name: KAFKA_NAMESPACE
+              value: 'default'
+
+            # get via 'kubectl get svc -n <kafka-namespace>'
+            - name: KAFKA_SERVICE
+              value: 'kafka-cp-kafka-headless'
+
+            # get via 'kubectl get svc -n <kafka-namespace>'
+            - name: KAFKA_PORT
+              value: '9092'
+
+            # Recommended timeout for EKS platform: 60000 ms
+            - name: KAFKA_CONSUMER_TIMEOUT
+              value: '30000' # in milliseconds
+
+            # ensure to set the instance name if using KUDO operator
+            - name: KAFKA_INSTANCE_NAME
+              value: ''
+
+            - name: ZOOKEEPER_NAMESPACE
+              value: 'default'
+
+            # get via 'kubectl get pods --show-labels -n <zookeeper-namespace>'
+            - name: ZOOKEEPER_LABEL
+              value: 'app=cp-zookeeper'
+
+            # get via 'kubectl get svc -n <zookeeper-namespace>'
+            - name: ZOOKEEPER_SERVICE
+              value: 'kafka-cp-zookeeper-headless'
+
+            # get via 'kubectl get svc -n <zookeeper-namespace>'
+            - name: ZOOKEEPER_PORT
+              value: '2181'
+
+            # set chaos duration (in sec) as desired
+            - name: TOTAL_CHAOS_DURATION
+              value: '60'
+
+            # set chaos interval (in sec) as desired
+            - name: CHAOS_INTERVAL
+              value: '20'
+
+            # pod failures without '--force' & default terminationGracePeriodSeconds
+            - name: FORCE
+              value: 'false'
+
diff --git a/charts/kafka/kafka-broker-pod-failure/ansible/experiment.yaml b/charts/kafka/kafka-broker-pod-failure/ansible/experiment.yaml
new file mode 100644
index 0000000..a7f7b1e
--- /dev/null
+++ b/charts/kafka/kafka-broker-pod-failure/ansible/experiment.yaml
@@ -0,0 +1,128 @@
+apiVersion: litmuschaos.io/v1alpha1
+description:
+  message: |
+    Deleting a kafka broker pod
+kind: ChaosExperiment
+metadata:
+  name: kafka-broker-pod-failure
+spec:
+  definition:
+    scope: Cluster
+    permissions:
+      - apiGroups:
+          - ""
+          - "apps"
+          - "batch"
+          - "litmuschaos.io"
+        resources:
+          - "statefulsets"
+          - "deployments"
+          - "events"
+          - "pods/log"
+          - "configmaps"
+          - "jobs"
+          - "pods"
+          - "pods/exec"
+          - "chaosengines"
+          - "chaosexperiments"
+          - "chaosresults"
+        verbs:
+          - "create"
+          - "get"
+          - "delete"
+          - "list"
+          - "patch"
+      - apiGroups:
+          - ""
+        resources:
+          - "nodes"
+        verbs:
+          - "get"
+          - "list"
+    image: "litmuschaos/ansible-runner:latest"
+    imagePullPolicy: Always
+    args:
+    - -c
+    - ansible-playbook ./experiments/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure-ansible-logic.yml -i /etc/ansible/hosts -vv; exit 0
+    command:
+    - /bin/bash
+    env:
+
+    - name: ANSIBLE_STDOUT_CALLBACK
+      value: 'default'
+
+    - name: KAFKA_KIND
+      value: 'statefulset'
+
+    - name: KAFKA_LIVENESS_STREAM
+      value: 'enabled'
+
+    - name: KAFKA_LIVENESS_IMAGE
+      value: 'litmuschaos/kafka-client:ci'
+
+    # set to 'enabled' if you have auth set up
+    - name: KAFKA_SASL_AUTH
+      value: 'disabled'
+
+    # Recommended timeout for EKS platform: 60000 ms
+    - name: KAFKA_CONSUMER_TIMEOUT
+      value: '30000' #in ms
+
+    - name: TOTAL_CHAOS_DURATION
+      value: '15'
+
+    - name: CHAOS_INTERVAL
+      value: '5'
+
+    # provide the kill count
+    - name: KILL_COUNT
+      value: ''
+
+    - name: FORCE
+      value: 'true'
+
+    - name: KAFKA_INSTANCE_NAME
+      value: ''
+
+    - name: KAFKA_NAMESPACE
+      value: ''
+
+    - name: KAFKA_LABEL
+      value: ''
+
+    - name: KAFKA_BROKER
+      value: ''
+
+    - name: KAFKA_REPLICATION_FACTOR
+      value: ''
+
+    - name: KAFKA_SERVICE
+      value: ''
+
+    - name: KAFKA_PORT
+      value: ''
+
+    - name: ZOOKEEPER_NAMESPACE
+      value: ''
+
+    - name: ZOOKEEPER_LABEL
+      value: ''
+
+    - name: ZOOKEEPER_SERVICE
+      value: ''
+
+    - name: ZOOKEEPER_PORT
+      value: ''
+
+    ## env var that describes the library used to execute the chaos
+    ## default: litmus. Supported values: litmus
+    - name: LIB
+      value: 'litmus'
+
+    - name: LIB_IMAGE
+      value: 'litmuschaos/pod-delete-helper:latest'
+
+    labels:
+      name: kafka-broker-pod-failure
+      app.kubernetes.io/part-of: litmus
+
diff --git a/charts/kafka/kafka-broker-pod-failure/ansible/rbac.yaml b/charts/kafka/kafka-broker-pod-failure/ansible/rbac.yaml
new file mode 100644
index 0000000..cf78684
--- /dev/null
+++ b/charts/kafka/kafka-broker-pod-failure/ansible/rbac.yaml
@@ -0,0 +1,39 @@
+apiVersion: v1
+kind: ServiceAccount
+metadata:
+  name: kafka-broker-pod-failure-sa
+  namespace: default
+  labels:
+    name: kafka-broker-pod-failure-sa
+    app.kubernetes.io/part-of: litmus
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRole
+metadata:
+  name: kafka-broker-pod-failure-sa
+  labels:
+    name: kafka-broker-pod-failure-sa
+    app.kubernetes.io/part-of: litmus
+rules:
+- apiGroups: ["","litmuschaos.io","batch","apps"]
+  resources: ["pods","deployments","pods/log","events","jobs","pods/exec","statefulsets","configmaps","chaosengines","chaosexperiments","chaosresults"]
+  verbs: ["create","list","get","patch","delete"]
+- apiGroups: [""]
+  resources: ["nodes"]
+  verbs: ["get","list"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: kafka-broker-pod-failure-sa
+  labels:
+    name: kafka-broker-pod-failure-sa
+    app.kubernetes.io/part-of: litmus
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: kafka-broker-pod-failure-sa
+subjects:
+- kind: ServiceAccount
+  name: kafka-broker-pod-failure-sa
+  namespace: default
diff --git a/charts/kafka/kafka-broker-pod-failure/engine.yaml b/charts/kafka/kafka-broker-pod-failure/engine.yaml
index 2895ca8..caa7c19 100644
--- a/charts/kafka/kafka-broker-pod-failure/engine.yaml
+++ b/charts/kafka/kafka-broker-pod-failure/engine.yaml
@@ -75,4 +75,4 @@ spec:
 
             # pod failures without '--force' & default terminationGracePeriodSeconds
             - name: FORCE
-              value: 'false'
\ No newline at end of file
+              value: 'false'
diff --git a/charts/kafka/kafka-broker-pod-failure/experiment.yaml b/charts/kafka/kafka-broker-pod-failure/experiment.yaml
index 5501b43..2da7324 100644
--- a/charts/kafka/kafka-broker-pod-failure/experiment.yaml
+++ b/charts/kafka/kafka-broker-pod-failure/experiment.yaml
@@ -39,18 +39,15 @@ spec:
         verbs:
           - "get"
           - "list"
-    image: "litmuschaos/ansible-runner:latest"
+    image: "litmuschaos/go-runner:latest"
     imagePullPolicy: Always
     args:
     - -c
-    - ansible-playbook ./experiments/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure-ansible-logic.yml -i /etc/ansible/hosts -vv; exit 0
+    - ./experiments -name kafka-broker-pod-failure
     command:
     - /bin/bash
     env:
 
-    - name: ANSIBLE_STDOUT_CALLBACK
-      value: 'default'
-
     - name: KAFKA_KIND
       value: 'statefulset'
 
@@ -60,10 +57,6 @@ spec:
     - name: KAFKA_LIVENESS_IMAGE
       value: 'litmuschaos/kafka-client:ci'
 
-    # set to 'enabled' if you have auth set up
-    - name: KAFKA_SASL_AUTH
-      value: 'disabled'
-
     # Recommended timeout for EKS platform: 60000 ms
     - name: KAFKA_CONSUMER_TIMEOUT
       value: '30000' #in ms
@@ -78,6 +71,11 @@ spec:
     - name: KILL_COUNT
       value: ''
 
+    ## it defines the sequence of chaos execution for multiple target pods
+    ## supported values: serial, parallel
+    - name: SEQUENCE
+      value: 'parallel'
+
     - name: FORCE
       value: 'true'
 
@@ -118,9 +116,6 @@ spec:
     ## default: litmus. Supported values: litmus
     - name: LIB
       value: 'litmus'
-
-    - name: LIB_IMAGE
-      value: 'litmuschaos/pod-delete-helper:latest'
 
     labels:
       name: kafka-broker-pod-failure
diff --git a/charts/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure.chartserviceversion.yaml b/charts/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure.chartserviceversion.yaml
index c6b03ed..0c4be3e 100644
--- a/charts/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure.chartserviceversion.yaml
+++ b/charts/kafka/kafka-broker-pod-failure/kafka-broker-pod-failure.chartserviceversion.yaml
@@ -31,7 +31,7 @@ spec:
     name: Mayadata
   links:
     - name: Source Code
-      url: https://github.com/litmuschaos/litmus-ansible/tree/master/experiments/kafka/kafka-broker-pod-failure
+      url: https://github.com/litmuschaos/litmus-go/tree/master/experiments/kafka/kafka-broker-pod-failure
     - name: Documentation
       url: https://docs.litmuschaos.io/docs/kafka-broker-pod-failure/
     - name: Video
diff --git a/service-accounts/litmus-admin-rbac.yaml b/service-accounts/litmus-admin-rbac.yaml
index 55bc0b1..af7d2bb 100644
--- a/service-accounts/litmus-admin-rbac.yaml
+++ b/service-accounts/litmus-admin-rbac.yaml
@@ -14,9 +14,12 @@ metadata:
   labels:
     name: litmus-admin
 rules:
-- apiGroups: ["","apps","batch","extensions","litmuschaos.io","openebs.io","storage.k8s.io"]
-  resources: ["chaosengines","chaosexperiments","chaosresults","cstorpools","cstorvolumereplicas","configmaps","secrets","pods","pods/exec","pods/log","pods/eviction","jobs","replicasets","deployments","daemonsets","statefulsets","persistentvolumeclaims","persistentvolumes","storageclasses","services","events"]
-  verbs: ["create","delete","get","list","patch","update"]
+- apiGroups: ["","apps","batch","extensions","litmuschaos.io"]
+  resources: ["pods","pods/exec","pods/eviction","jobs","daemonsets","events","chaosresults","chaosengines"]
+  verbs: ["create","delete","get","list","patch","update","deletecollection"]
+- apiGroups: ["","apps","litmuschaos.io"]
+  resources: ["configmaps","secrets","services","chaosexperiments","pods/log","replicasets","deployments","statefulsets"]
+  verbs: ["get","list","patch","update"]
 - apiGroups: [""]
   resources: ["nodes"]
   verbs: ["get","list","patch","update"]
@@ -34,4 +37,4 @@ roleRef:
 subjects:
 - kind: ServiceAccount
   name: litmus-admin
-  namespace: litmus
\ No newline at end of file
+  namespace: litmus