From 66770af5115b3bcc9b11b2a098e74a228996dcb2 Mon Sep 17 00:00:00 2001 From: Brooks Date: Thu, 5 Dec 2024 13:23:11 -0500 Subject: [PATCH] Adds search subcommand to agave-store-tool (#3950) --- Cargo.lock | 2 + accounts-db/store-tool/Cargo.toml | 4 +- accounts-db/store-tool/src/main.rs | 210 +++++++++++++++++++++++++---- 3 files changed, 188 insertions(+), 28 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index df475474990d0c..741abccc1239d7 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -223,7 +223,9 @@ dependencies = [ name = "agave-store-tool" version = "2.2.0" dependencies = [ + "ahash 0.8.11", "clap 2.33.3", + "rayon", "solana-accounts-db", "solana-sdk", "solana-version", diff --git a/accounts-db/store-tool/Cargo.toml b/accounts-db/store-tool/Cargo.toml index 3d425bbbccaea9..dca989d72e4178 100644 --- a/accounts-db/store-tool/Cargo.toml +++ b/accounts-db/store-tool/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "agave-store-tool" -description = "Tool to inspect account storage files" +description = "Tool for account storage files" publish = false version = { workspace = true } authors = { workspace = true } @@ -10,7 +10,9 @@ license = { workspace = true } edition = { workspace = true } [dependencies] +ahash = { workspace = true } clap = { workspace = true } +rayon = { workspace = true } solana-accounts-db = { workspace = true, features = ["dev-context-only-utils"] } solana-sdk = { workspace = true } solana-version = { workspace = true } diff --git a/accounts-db/store-tool/src/main.rs b/accounts-db/store-tool/src/main.rs index 4eaae9e07ae30d..d06768017f8c58 100644 --- a/accounts-db/store-tool/src/main.rs +++ b/accounts-db/store-tool/src/main.rs @@ -1,48 +1,131 @@ use { - clap::{crate_description, crate_name, value_t_or_exit, App, Arg}, + ahash::HashSet, + clap::{ + crate_description, crate_name, value_t_or_exit, values_t_or_exit, App, AppSettings, Arg, + ArgMatches, SubCommand, + }, + rayon::prelude::*, solana_accounts_db::append_vec::AppendVec, - solana_sdk::{account::ReadableAccount, system_instruction::MAX_PERMITTED_DATA_LENGTH}, - std::{mem::ManuallyDrop, num::Saturating}, + solana_sdk::{ + account::ReadableAccount, pubkey::Pubkey, system_instruction::MAX_PERMITTED_DATA_LENGTH, + }, + std::{ + fs, io, + mem::ManuallyDrop, + num::Saturating, + path::{Path, PathBuf}, + }, }; +const CMD_INSPECT: &str = "inspect"; +const CMD_SEARCH: &str = "search"; + fn main() { let matches = App::new(crate_name!()) .about(crate_description!()) .version(solana_version::version!()) - .arg( - Arg::with_name("file") - .index(1) - .takes_value(true) - .value_name("PATH") - .help("Account storage file to open"), + .global_setting(AppSettings::ArgRequiredElseHelp) + .global_setting(AppSettings::ColoredHelp) + .global_setting(AppSettings::InferSubcommands) + .global_setting(AppSettings::UnifiedHelpMessage) + .global_setting(AppSettings::VersionlessSubcommands) + .subcommand( + SubCommand::with_name(CMD_INSPECT) + .about("Inspects an account storage file and display each account's information") + .arg( + Arg::with_name("path") + .index(1) + .takes_value(true) + .value_name("PATH") + .help("Account storage file to inspect"), + ) + .arg( + Arg::with_name("verbose") + .short("v") + .long("verbose") + .takes_value(false) + .help("Show additional account information"), + ), ) - .arg( - Arg::with_name("verbose") - .short("v") - .long("verbose") - .takes_value(false) - .help("Show additional account information"), + .subcommand( + SubCommand::with_name(CMD_SEARCH) + .about("Searches for accounts") + .arg( + Arg::with_name("path") + .index(1) + .takes_value(true) + .value_name("PATH") + .help("Account storage directory to search"), + ) + .arg( + Arg::with_name("addresses") + .index(2) + .takes_value(true) + .value_name("PUBKEYS") + .value_delimiter(",") + .help("Search for the entries of one or more pubkeys, delimited by commas"), + ) + .arg( + Arg::with_name("verbose") + .short("v") + .long("verbose") + .takes_value(false) + .help("Show additional account information"), + ), ) .get_matches(); - let verbose = matches.is_present("verbose"); - let file = value_t_or_exit!(matches, "file", String); - let store = AppendVec::new_for_store_tool(&file).unwrap_or_else(|err| { - eprintln!("failed to open storage file '{file}': {err}"); + let subcommand = matches.subcommand(); + let subcommand_str = subcommand.0.to_string(); + match subcommand { + (CMD_INSPECT, Some(subcommand_matches)) => cmd_inspect(&matches, subcommand_matches), + (CMD_SEARCH, Some(subcommand_matches)) => cmd_search(&matches, subcommand_matches), + _ => unreachable!(), + } + .unwrap_or_else(|err| { + eprintln!("Error: '{subcommand_str}' failed: {err}"); std::process::exit(1); }); +} + +fn cmd_inspect( + _app_matches: &ArgMatches<'_>, + subcommand_matches: &ArgMatches<'_>, +) -> Result<(), String> { + let path = value_t_or_exit!(subcommand_matches, "path", String); + let verbose = subcommand_matches.is_present("verbose"); + do_inspect(path, verbose) +} + +fn cmd_search( + _app_matches: &ArgMatches<'_>, + subcommand_matches: &ArgMatches<'_>, +) -> Result<(), String> { + let path = value_t_or_exit!(subcommand_matches, "path", String); + let addresses = values_t_or_exit!(subcommand_matches, "addresses", Pubkey); + let addresses = HashSet::from_iter(addresses); + let verbose = subcommand_matches.is_present("verbose"); + do_search(path, addresses, verbose) +} + +fn do_inspect(file: impl AsRef, verbose: bool) -> Result<(), String> { + let storage = AppendVec::new_for_store_tool(file.as_ref()).map_err(|err| { + format!( + "failed to open account storage file '{}': {err}", + file.as_ref().display(), + ) + })?; // By default, when the AppendVec is dropped, the backing file will be removed. // We do not want to remove the backing file here in the store-tool, so prevent dropping. - let store = ManuallyDrop::new(store); + let storage = ManuallyDrop::new(storage); - // max data size is 10 MiB (10,485,760 bytes) - // therefore, the max width is ceil(log(10485760)) - let data_size_width = (MAX_PERMITTED_DATA_LENGTH as f64).log10().ceil() as usize; - let offset_width = (store.capacity() as f64).log(16.0).ceil() as usize; + let data_size_width = width10(MAX_PERMITTED_DATA_LENGTH); + let offset_width = width16(storage.capacity()); let mut num_accounts = Saturating(0usize); let mut stored_accounts_size = Saturating(0); - store.scan_accounts(|account| { + let mut lamports = Saturating(0); + storage.scan_accounts(|account| { if verbose { println!("{account:?}"); } else { @@ -57,12 +140,85 @@ fn main() { } num_accounts += 1; stored_accounts_size += account.stored_size(); + lamports += account.lamports(); }); println!( - "number of accounts: {}, stored accounts size: {}, file size: {}", + "number of accounts: {}, stored accounts size: {}, file size: {}, lamports: {}", num_accounts, stored_accounts_size, - store.capacity(), + storage.capacity(), + lamports, ); + Ok(()) +} + +fn do_search( + dir: impl AsRef, + addresses: HashSet, + verbose: bool, +) -> Result<(), String> { + fn get_files_in(dir: impl AsRef) -> Result, io::Error> { + let mut files = Vec::new(); + let entries = fs::read_dir(dir)?; + for entry in entries { + let path = entry?.path(); + if path.is_file() { + let path = fs::canonicalize(path)?; + files.push(path); + } + } + Ok(files) + } + + let files = get_files_in(&dir).map_err(|err| { + format!( + "failed to get files in dir '{}': {err}", + dir.as_ref().display(), + ) + })?; + files.par_iter().for_each(|file| { + let Ok(storage) = AppendVec::new_for_store_tool(file).inspect_err(|err| { + eprintln!( + "failed to open account storage file '{}': {err}", + file.display(), + ) + }) else { + return; + }; + // By default, when the AppendVec is dropped, the backing file will be removed. + // We do not want to remove the backing file here in the store-tool, so prevent dropping. + let storage = ManuallyDrop::new(storage); + + let file_name = Path::new(file.file_name().expect("path is a file")); + storage.scan_accounts(|account| { + if addresses.contains(account.pubkey()) { + if verbose { + println!("storage: {}, {account:?}", file_name.display()); + } else { + println!( + "storage: {}, offset: {}, pubkey: {}, owner: {}, data size: {}, lamports: {}", + file_name.display(), + account.offset(), + account.pubkey(), + account.owner(), + account.data_len(), + account.lamports(), + ); + } + } + }); + }); + + Ok(()) +} + +/// Returns the number of characters required to print `x` in base-10 +fn width10(x: u64) -> usize { + (x as f64).log10().ceil() as usize +} + +/// Returns the number of characters required to print `x` in base-16 +fn width16(x: u64) -> usize { + (x as f64).log(16.0).ceil() as usize }