Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

fix: use heuristics to determine when to query ddb table ttl #307

Merged
merged 2 commits into from
Apr 15, 2024
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
115 changes: 90 additions & 25 deletions momento/src/commands/cloud_linter/dynamodb.rs
Original file line number Diff line number Diff line change
Expand Up @@ -164,33 +164,91 @@ impl ResourceWithMetrics for DynamoDbResource {
}
}

pub(crate) async fn append_ttl_to_appropriate_resources(
config: &SdkConfig,
mut resources: Vec<Resource>,
limiter: Arc<DefaultDirectRateLimiter>,
) -> Result<Vec<Resource>, CliError> {
log::debug!("describing ttl for dynamodb tables");
let ddb_client = aws_sdk_dynamodb::Client::new(config);
let describe_ddb_ttl_bar =
ProgressBar::new(resources.len() as u64).with_message("Describing Dynamo DB Ttl");
describe_ddb_ttl_bar
.set_style(ProgressStyle::with_template(" {msg} {bar} {eta}").expect("invalid template"));
for resource in &mut resources {
describe_ddb_ttl_bar.inc(1);
match resource {
Resource::DynamoDb(r) => {
if r.resource_type == ResourceType::DynamoDbGsi {
continue;
}
let consumed_write_ops_index = r.metrics.iter().position(|p| {
p.name
.eq_ignore_ascii_case("consumedwritecapacityunits_sum")
});
match consumed_write_ops_index {
Some(index) => {
let consumed_write_capacity =
r.metrics.get(index).expect("index should exist");
let sum: f64 = consumed_write_capacity.values.iter().sum();
// a basic heuristic around whether or not we care to check to see if a ttl exists on a ddb table. If the dynamodb table
// has less than 100 tps average, then we don't care to check if ttl is enabled or not.
if sum < 100.0 * 60.0 * 60.0 * 24.0 * 30.0 {
bruuuuuuuce marked this conversation as resolved.
Show resolved Hide resolved
log::debug!("skipping ttl check for table {}", r.id);
continue;
}
log::debug!("querying ttl for table {}", r.id);
let ttl_enabled =
fetch_ddb_ttl(&ddb_client, &r.id, Arc::clone(&limiter)).await?;
r.metadata.ttl_enabled = ttl_enabled;
}
// we did not find that metric, and therefore we assume that there are no consumed capacity units, meaning we don't care to
// check for a ttl on the ddb table
None => {
continue;
}
}
}
Resource::ElastiCache(_) => {
continue;
}
};
}
describe_ddb_ttl_bar.finish();
Ok(resources)
}

pub(crate) async fn get_ddb_resources(
config: &SdkConfig,
limiter: Arc<DefaultDirectRateLimiter>,
) -> Result<Vec<Resource>, CliError> {
let ddb_client = aws_sdk_dynamodb::Client::new(config);

let bar = ProgressBar::new_spinner().with_message("Listing Dynamo DB tables");
bar.enable_steady_tick(Duration::from_millis(100));
let list_ddb_tables_bar = ProgressBar::new_spinner().with_message("Listing Dynamo DB tables");
list_ddb_tables_bar.enable_steady_tick(Duration::from_millis(100));
let table_names = list_table_names(&ddb_client, Arc::clone(&limiter)).await?;
bar.finish();
list_ddb_tables_bar.finish();

let bar =
let describe_ddb_tables_bar =
ProgressBar::new(table_names.len() as u64).with_message("Describing Dynamo DB tables");
bar.set_style(ProgressStyle::with_template(" {msg} {bar} {eta}").expect("invalid template"));
let mut resources = Vec::new();
describe_ddb_tables_bar
.set_style(ProgressStyle::with_template(" {msg} {bar} {eta}").expect("invalid template"));
let mut ddb_resources: Vec<DynamoDbResource> = Vec::new();
for table_name in table_names {
let instances = fetch_ddb_resources(&ddb_client, &table_name, Arc::clone(&limiter)).await?;
let wrapped_resources = instances
.into_iter()
.map(Resource::DynamoDb)
.collect::<Vec<Resource>>();
resources.extend(wrapped_resources);
bar.inc(1);
for instance in instances {
ddb_resources.push(instance);
}
describe_ddb_tables_bar.inc(1);
}
bar.finish();
describe_ddb_tables_bar.finish();

Ok(resources)
let wrapped_resources = ddb_resources
.into_iter()
.map(Resource::DynamoDb)
.collect::<Vec<Resource>>();

Ok(wrapped_resources)
}

async fn list_table_names(
Expand Down Expand Up @@ -218,19 +276,11 @@ async fn list_table_names(
Ok(table_names)
}

async fn fetch_ddb_resources(
async fn fetch_ddb_ttl(
bruuuuuuuce marked this conversation as resolved.
Show resolved Hide resolved
ddb_client: &aws_sdk_dynamodb::Client,
table_name: &str,
limiter: Arc<DefaultDirectRateLimiter>,
) -> Result<Vec<DynamoDbResource>, CliError> {
let region = ddb_client
.config()
.region()
.map(|r| r.as_ref())
.ok_or(CliError {
msg: "No region configured for client".to_string(),
})?;

) -> Result<bool, CliError> {
let ttl = rate_limit(Arc::clone(&limiter), || async {
ddb_client
.describe_time_to_live()
Expand All @@ -247,6 +297,21 @@ async fn fetch_ddb_resources(
..
})
);
Ok(ttl_enabled)
}

async fn fetch_ddb_resources(
ddb_client: &aws_sdk_dynamodb::Client,
table_name: &str,
limiter: Arc<DefaultDirectRateLimiter>,
) -> Result<Vec<DynamoDbResource>, CliError> {
let region = ddb_client
.config()
.region()
.map(|r| r.as_ref())
.ok_or(CliError {
msg: "No region configured for client".to_string(),
})?;

let description = rate_limit(Arc::clone(&limiter), || async {
ddb_client
Expand Down Expand Up @@ -309,7 +374,7 @@ async fn fetch_ddb_resources(
billing_mode,
gsi_count,
item_count,
ttl_enabled,
ttl_enabled: false,
is_global_table,
lsi_count,
table_class,
Expand Down
1 change: 1 addition & 0 deletions momento/src/commands/cloud_linter/elasticache.rs
Original file line number Diff line number Diff line change
Expand Up @@ -104,6 +104,7 @@ pub(crate) async fn get_elasticache_resources(
config: &SdkConfig,
limiter: Arc<DefaultDirectRateLimiter>,
) -> Result<Vec<Resource>, CliError> {
log::debug!("describing elasticache resources");
let region = config.region().map(|r| r.as_ref()).ok_or(CliError {
msg: "No region configured for client".to_string(),
})?;
Expand Down
29 changes: 23 additions & 6 deletions momento/src/commands/cloud_linter/linter_cli.rs
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,8 @@ use crate::commands::cloud_linter::resource::DataFormat;
use crate::commands::cloud_linter::utils::check_aws_credentials;
use crate::error::CliError;

use super::dynamodb::append_ttl_to_appropriate_resources;

pub async fn run_cloud_linter(region: String) -> Result<(), CliError> {
let config = aws_config::defaults(BehaviorVersion::latest())
.region(Region::new(region))
Expand All @@ -28,17 +30,32 @@ pub async fn run_cloud_linter(region: String) -> Result<(), CliError> {
let output_file_path = "linter_results.json.gz";
check_output_is_writable(output_file_path).await?;

let quota =
Quota::per_second(core::num::NonZeroU32::new(1).expect("should create non-zero quota"));
let limiter = Arc::new(RateLimiter::direct(quota));
let control_plane_quota = Quota::per_second(
core::num::NonZeroU32::new(10).expect("should create non-zero control_plane_quota"),
);
let control_plane_limiter = Arc::new(RateLimiter::direct(control_plane_quota));

let describe_ttl_quota = Quota::per_second(
core::num::NonZeroU32::new(1).expect("should create non-zero describe_ttl_quota"),
);
let describe_ttl_limiter = Arc::new(RateLimiter::direct(describe_ttl_quota));

let mut resources = get_ddb_resources(&config, Arc::clone(&limiter)).await?;
let metrics_quota =
Quota::per_second(core::num::NonZeroU32::new(20).expect("should create non-zero quota"));
let metrics_limiter = Arc::new(RateLimiter::direct(metrics_quota));
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

i like this stuff


let mut resources = get_ddb_resources(&config, Arc::clone(&control_plane_limiter)).await?;

let mut elasticache_resources =
get_elasticache_resources(&config, Arc::clone(&limiter)).await?;
get_elasticache_resources(&config, Arc::clone(&control_plane_limiter)).await?;
resources.append(&mut elasticache_resources);

let resources = append_metrics_to_resources(&config, Arc::clone(&limiter), resources).await?;
let resources =
append_metrics_to_resources(&config, Arc::clone(&metrics_limiter), resources).await?;

let resources =
append_ttl_to_appropriate_resources(&config, resources, Arc::clone(&describe_ttl_limiter))
.await?;

let data_format = DataFormat { resources };

Expand Down
4 changes: 2 additions & 2 deletions momento/src/commands/cloud_linter/metrics.rs
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,8 @@ use crate::error::CliError;

#[derive(Serialize, Deserialize)]
pub(crate) struct Metric {
name: String,
values: Vec<f64>,
pub name: String,
pub values: Vec<f64>,
}

pub(crate) struct MetricTarget {
Expand Down
2 changes: 1 addition & 1 deletion momento/src/commands/cloud_linter/resource.rs
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ pub(crate) enum Resource {
ElastiCache(ElastiCacheResource),
}

#[derive(Debug, Serialize)]
#[derive(Debug, Serialize, PartialEq)]
pub(crate) enum ResourceType {
#[serde(rename = "AWS::DynamoDB::GSI")]
DynamoDbGsi,
Expand Down
Loading