tests_fuzz/utils/pod_failure.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
// Copyright 2023 Greptime Team
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
use std::collections::BTreeMap;
use kube::Api;
use crate::error::Result;
use crate::utils::crd::common::{Mode, SelectorBuilder};
use crate::utils::crd::pod::{Action, PodChaos, PodChaosSpecBuilder};
/// Injects a pod failure into a specific datanode within a Kubernetes cluster.
///
/// This function constructs a `PodChaos` custom resource to simulate a pod failure for the specified
/// datanode, and creates this resource in the Kubernetes cluster using the provided client.
pub async fn inject_datanode_pod_failure(
client: kube::Client,
namespace: &str,
cluster_name: &str,
datanode_id: u64,
duration_secs: usize,
) -> Result<String> {
let mut selector = BTreeMap::new();
let pod_name = format!("{}-datanode-{}", cluster_name, datanode_id);
selector.insert(
"statefulset.kubernetes.io/pod-name".into(),
pod_name.clone(),
);
let selector = SelectorBuilder::default()
.label_selectors(selector)
.build()
.unwrap();
let spec = PodChaosSpecBuilder::default()
.duration(format!("{duration_secs}s"))
.selector(selector)
.action(Action::PodFailure)
.mode(Mode::One)
.build()
.unwrap();
let chaos_name = format!("{pod_name}-pod-failure");
let cr = PodChaos::new(&chaos_name, spec);
let api: Api<PodChaos> = Api::namespaced(client, namespace);
api.create(&Default::default(), &cr).await.unwrap();
Ok(chaos_name)
}
/// Recovers a pod from a failure by deleting the associated PodChaos resource.
///
/// This function deletes the PodChaos custom resource with the specified name, effectively
/// recovering the pod from the injected failure.
pub async fn recover_pod_failure(client: kube::Client, namespace: &str, name: &str) -> Result<()> {
let api: Api<PodChaos> = Api::namespaced(client, namespace);
api.delete(name, &Default::default()).await.unwrap();
Ok(())
}