|
@@ -22,9 +22,9 @@ use commands::{
|
|
|
use compat_harness::{extract_manifest, UpstreamPaths};
|
|
use compat_harness::{extract_manifest, UpstreamPaths};
|
|
|
use render::{Spinner, TerminalRenderer};
|
|
use render::{Spinner, TerminalRenderer};
|
|
|
use runtime::{
|
|
use runtime::{
|
|
|
- clear_oauth_credentials, generate_pkce_pair, generate_state, load_system_prompt,
|
|
|
|
|
- parse_oauth_callback_request_target, save_oauth_credentials, ApiClient, ApiRequest,
|
|
|
|
|
- AssistantEvent, CompactionConfig, ConfigLoader, ConfigSource, ContentBlock,
|
|
|
|
|
|
|
+ clear_oauth_credentials, format_usd, generate_pkce_pair, generate_state, load_system_prompt,
|
|
|
|
|
+ parse_oauth_callback_request_target, pricing_for_model, save_oauth_credentials, ApiClient,
|
|
|
|
|
+ ApiRequest, AssistantEvent, CompactionConfig, ConfigLoader, ConfigSource, ContentBlock,
|
|
|
ConversationMessage, ConversationRuntime, MessageRole, OAuthAuthorizationRequest,
|
|
ConversationMessage, ConversationRuntime, MessageRole, OAuthAuthorizationRequest,
|
|
|
OAuthTokenExchangeRequest, PermissionMode, PermissionPolicy, ProjectContext, RuntimeError,
|
|
OAuthTokenExchangeRequest, PermissionMode, PermissionPolicy, ProjectContext, RuntimeError,
|
|
|
Session, TokenUsage, ToolError, ToolExecutor, UsageTracker,
|
|
Session, TokenUsage, ToolError, ToolExecutor, UsageTracker,
|
|
@@ -36,6 +36,7 @@ const DEFAULT_MODEL: &str = "claude-sonnet-4-20250514";
|
|
|
const DEFAULT_MAX_TOKENS: u32 = 32;
|
|
const DEFAULT_MAX_TOKENS: u32 = 32;
|
|
|
const DEFAULT_DATE: &str = "2026-03-31";
|
|
const DEFAULT_DATE: &str = "2026-03-31";
|
|
|
const DEFAULT_OAUTH_CALLBACK_PORT: u16 = 4545;
|
|
const DEFAULT_OAUTH_CALLBACK_PORT: u16 = 4545;
|
|
|
|
|
+const COST_WARNING_FRACTION: f64 = 0.8;
|
|
|
const VERSION: &str = env!("CARGO_PKG_VERSION");
|
|
const VERSION: &str = env!("CARGO_PKG_VERSION");
|
|
|
const BUILD_TARGET: Option<&str> = option_env!("TARGET");
|
|
const BUILD_TARGET: Option<&str> = option_env!("TARGET");
|
|
|
const GIT_SHA: Option<&str> = option_env!("GIT_SHA");
|
|
const GIT_SHA: Option<&str> = option_env!("GIT_SHA");
|
|
@@ -70,7 +71,8 @@ fn run() -> Result<(), Box<dyn std::error::Error>> {
|
|
|
output_format,
|
|
output_format,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
- } => LiveCli::new(model, false, allowed_tools, permission_mode)?
|
|
|
|
|
|
|
+ max_cost_usd,
|
|
|
|
|
+ } => LiveCli::new(model, false, allowed_tools, permission_mode, max_cost_usd)?
|
|
|
.run_turn_with_output(&prompt, output_format)?,
|
|
.run_turn_with_output(&prompt, output_format)?,
|
|
|
CliAction::Login => run_login()?,
|
|
CliAction::Login => run_login()?,
|
|
|
CliAction::Logout => run_logout()?,
|
|
CliAction::Logout => run_logout()?,
|
|
@@ -78,13 +80,14 @@ fn run() -> Result<(), Box<dyn std::error::Error>> {
|
|
|
model,
|
|
model,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
- } => run_repl(model, allowed_tools, permission_mode)?,
|
|
|
|
|
|
|
+ max_cost_usd,
|
|
|
|
|
+ } => run_repl(model, allowed_tools, permission_mode, max_cost_usd)?,
|
|
|
CliAction::Help => print_help(),
|
|
CliAction::Help => print_help(),
|
|
|
}
|
|
}
|
|
|
Ok(())
|
|
Ok(())
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
-#[derive(Debug, Clone, PartialEq, Eq)]
|
|
|
|
|
|
|
+#[derive(Debug, Clone, PartialEq)]
|
|
|
enum CliAction {
|
|
enum CliAction {
|
|
|
DumpManifests,
|
|
DumpManifests,
|
|
|
BootstrapPlan,
|
|
BootstrapPlan,
|
|
@@ -103,6 +106,7 @@ enum CliAction {
|
|
|
output_format: CliOutputFormat,
|
|
output_format: CliOutputFormat,
|
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
|
permission_mode: PermissionMode,
|
|
permission_mode: PermissionMode,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
},
|
|
},
|
|
|
Login,
|
|
Login,
|
|
|
Logout,
|
|
Logout,
|
|
@@ -110,6 +114,7 @@ enum CliAction {
|
|
|
model: String,
|
|
model: String,
|
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
|
permission_mode: PermissionMode,
|
|
permission_mode: PermissionMode,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
},
|
|
},
|
|
|
// prompt-mode formatting is only supported for non-interactive runs
|
|
// prompt-mode formatting is only supported for non-interactive runs
|
|
|
Help,
|
|
Help,
|
|
@@ -139,6 +144,7 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
let mut output_format = CliOutputFormat::Text;
|
|
let mut output_format = CliOutputFormat::Text;
|
|
|
let mut permission_mode = default_permission_mode();
|
|
let mut permission_mode = default_permission_mode();
|
|
|
let mut wants_version = false;
|
|
let mut wants_version = false;
|
|
|
|
|
+ let mut max_cost_usd: Option<f64> = None;
|
|
|
let mut allowed_tool_values = Vec::new();
|
|
let mut allowed_tool_values = Vec::new();
|
|
|
let mut rest = Vec::new();
|
|
let mut rest = Vec::new();
|
|
|
let mut index = 0;
|
|
let mut index = 0;
|
|
@@ -174,6 +180,13 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
permission_mode = parse_permission_mode_arg(value)?;
|
|
permission_mode = parse_permission_mode_arg(value)?;
|
|
|
index += 2;
|
|
index += 2;
|
|
|
}
|
|
}
|
|
|
|
|
+ "--max-cost" => {
|
|
|
|
|
+ let value = args
|
|
|
|
|
+ .get(index + 1)
|
|
|
|
|
+ .ok_or_else(|| "missing value for --max-cost".to_string())?;
|
|
|
|
|
+ max_cost_usd = Some(parse_max_cost_arg(value)?);
|
|
|
|
|
+ index += 2;
|
|
|
|
|
+ }
|
|
|
flag if flag.starts_with("--output-format=") => {
|
|
flag if flag.starts_with("--output-format=") => {
|
|
|
output_format = CliOutputFormat::parse(&flag[16..])?;
|
|
output_format = CliOutputFormat::parse(&flag[16..])?;
|
|
|
index += 1;
|
|
index += 1;
|
|
@@ -182,6 +195,10 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
permission_mode = parse_permission_mode_arg(&flag[18..])?;
|
|
permission_mode = parse_permission_mode_arg(&flag[18..])?;
|
|
|
index += 1;
|
|
index += 1;
|
|
|
}
|
|
}
|
|
|
|
|
+ flag if flag.starts_with("--max-cost=") => {
|
|
|
|
|
+ max_cost_usd = Some(parse_max_cost_arg(&flag[11..])?);
|
|
|
|
|
+ index += 1;
|
|
|
|
|
+ }
|
|
|
"--allowedTools" | "--allowed-tools" => {
|
|
"--allowedTools" | "--allowed-tools" => {
|
|
|
let value = args
|
|
let value = args
|
|
|
.get(index + 1)
|
|
.get(index + 1)
|
|
@@ -215,6 +232,7 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
model,
|
|
model,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
|
|
+ max_cost_usd,
|
|
|
});
|
|
});
|
|
|
}
|
|
}
|
|
|
if matches!(rest.first().map(String::as_str), Some("--help" | "-h")) {
|
|
if matches!(rest.first().map(String::as_str), Some("--help" | "-h")) {
|
|
@@ -241,6 +259,7 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
output_format,
|
|
output_format,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
|
|
+ max_cost_usd,
|
|
|
})
|
|
})
|
|
|
}
|
|
}
|
|
|
other if !other.starts_with('/') => Ok(CliAction::Prompt {
|
|
other if !other.starts_with('/') => Ok(CliAction::Prompt {
|
|
@@ -249,6 +268,7 @@ fn parse_args(args: &[String]) -> Result<CliAction, String> {
|
|
|
output_format,
|
|
output_format,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
|
|
+ max_cost_usd,
|
|
|
}),
|
|
}),
|
|
|
other => Err(format!("unknown subcommand: {other}")),
|
|
other => Err(format!("unknown subcommand: {other}")),
|
|
|
}
|
|
}
|
|
@@ -312,6 +332,18 @@ fn parse_permission_mode_arg(value: &str) -> Result<PermissionMode, String> {
|
|
|
.map(permission_mode_from_label)
|
|
.map(permission_mode_from_label)
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
+fn parse_max_cost_arg(value: &str) -> Result<f64, String> {
|
|
|
|
|
+ let parsed = value
|
|
|
|
|
+ .parse::<f64>()
|
|
|
|
|
+ .map_err(|_| format!("invalid value for --max-cost: {value}"))?;
|
|
|
|
|
+ if !parsed.is_finite() || parsed <= 0.0 {
|
|
|
|
|
+ return Err(format!(
|
|
|
|
|
+ "--max-cost must be a positive finite USD amount: {value}"
|
|
|
|
|
+ ));
|
|
|
|
|
+ }
|
|
|
|
|
+ Ok(parsed)
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
fn permission_mode_from_label(mode: &str) -> PermissionMode {
|
|
fn permission_mode_from_label(mode: &str) -> PermissionMode {
|
|
|
match mode {
|
|
match mode {
|
|
|
"read-only" => PermissionMode::ReadOnly,
|
|
"read-only" => PermissionMode::ReadOnly,
|
|
@@ -678,22 +710,78 @@ fn format_permissions_switch_report(previous: &str, next: &str) -> String {
|
|
|
)
|
|
)
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
-fn format_cost_report(usage: TokenUsage) -> String {
|
|
|
|
|
|
|
+fn format_cost_report(model: &str, usage: TokenUsage, max_cost_usd: Option<f64>) -> String {
|
|
|
|
|
+ let estimate = usage_cost_estimate(model, usage);
|
|
|
format!(
|
|
format!(
|
|
|
"Cost
|
|
"Cost
|
|
|
|
|
+ Model {model}
|
|
|
Input tokens {}
|
|
Input tokens {}
|
|
|
Output tokens {}
|
|
Output tokens {}
|
|
|
Cache create {}
|
|
Cache create {}
|
|
|
Cache read {}
|
|
Cache read {}
|
|
|
- Total tokens {}",
|
|
|
|
|
|
|
+ Total tokens {}
|
|
|
|
|
+ Input cost {}
|
|
|
|
|
+ Output cost {}
|
|
|
|
|
+ Cache create usd {}
|
|
|
|
|
+ Cache read usd {}
|
|
|
|
|
+ Estimated cost {}
|
|
|
|
|
+ Budget {}",
|
|
|
usage.input_tokens,
|
|
usage.input_tokens,
|
|
|
usage.output_tokens,
|
|
usage.output_tokens,
|
|
|
usage.cache_creation_input_tokens,
|
|
usage.cache_creation_input_tokens,
|
|
|
usage.cache_read_input_tokens,
|
|
usage.cache_read_input_tokens,
|
|
|
usage.total_tokens(),
|
|
usage.total_tokens(),
|
|
|
|
|
+ format_usd(estimate.input_cost_usd),
|
|
|
|
|
+ format_usd(estimate.output_cost_usd),
|
|
|
|
|
+ format_usd(estimate.cache_creation_cost_usd),
|
|
|
|
|
+ format_usd(estimate.cache_read_cost_usd),
|
|
|
|
|
+ format_usd(estimate.total_cost_usd()),
|
|
|
|
|
+ format_budget_line(estimate.total_cost_usd(), max_cost_usd),
|
|
|
|
|
+ )
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+fn usage_cost_estimate(model: &str, usage: TokenUsage) -> runtime::UsageCostEstimate {
|
|
|
|
|
+ pricing_for_model(model).map_or_else(
|
|
|
|
|
+ || usage.estimate_cost_usd(),
|
|
|
|
|
+ |pricing| usage.estimate_cost_usd_with_pricing(pricing),
|
|
|
)
|
|
)
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
+fn usage_cost_total(model: &str, usage: TokenUsage) -> f64 {
|
|
|
|
|
+ usage_cost_estimate(model, usage).total_cost_usd()
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+fn format_budget_line(cost_usd: f64, max_cost_usd: Option<f64>) -> String {
|
|
|
|
|
+ match max_cost_usd {
|
|
|
|
|
+ Some(limit) => format!("{} / {}", format_usd(cost_usd), format_usd(limit)),
|
|
|
|
|
+ None => format!("{} (unlimited)", format_usd(cost_usd)),
|
|
|
|
|
+ }
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+fn budget_notice_message(
|
|
|
|
|
+ model: &str,
|
|
|
|
|
+ usage: TokenUsage,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
|
|
+) -> Option<String> {
|
|
|
|
|
+ let limit = max_cost_usd?;
|
|
|
|
|
+ let cost = usage_cost_total(model, usage);
|
|
|
|
|
+ if cost >= limit {
|
|
|
|
|
+ Some(format!(
|
|
|
|
|
+ "cost budget exceeded: cumulative={} budget={}",
|
|
|
|
|
+ format_usd(cost),
|
|
|
|
|
+ format_usd(limit)
|
|
|
|
|
+ ))
|
|
|
|
|
+ } else if cost >= limit * COST_WARNING_FRACTION {
|
|
|
|
|
+ Some(format!(
|
|
|
|
|
+ "approaching cost budget: cumulative={} budget={}",
|
|
|
|
|
+ format_usd(cost),
|
|
|
|
|
+ format_usd(limit)
|
|
|
|
|
+ ))
|
|
|
|
|
+ } else {
|
|
|
|
|
+ None
|
|
|
|
|
+ }
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
fn format_resume_report(session_path: &str, message_count: usize, turns: u32) -> String {
|
|
fn format_resume_report(session_path: &str, message_count: usize, turns: u32) -> String {
|
|
|
format!(
|
|
format!(
|
|
|
"Session resumed
|
|
"Session resumed
|
|
@@ -837,6 +925,7 @@ fn run_resume_command(
|
|
|
},
|
|
},
|
|
|
default_permission_mode().as_str(),
|
|
default_permission_mode().as_str(),
|
|
|
&status_context(Some(session_path))?,
|
|
&status_context(Some(session_path))?,
|
|
|
|
|
+ None,
|
|
|
)),
|
|
)),
|
|
|
})
|
|
})
|
|
|
}
|
|
}
|
|
@@ -844,7 +933,7 @@ fn run_resume_command(
|
|
|
let usage = UsageTracker::from_session(session).cumulative_usage();
|
|
let usage = UsageTracker::from_session(session).cumulative_usage();
|
|
|
Ok(ResumeCommandOutcome {
|
|
Ok(ResumeCommandOutcome {
|
|
|
session: session.clone(),
|
|
session: session.clone(),
|
|
|
- message: Some(format_cost_report(usage)),
|
|
|
|
|
|
|
+ message: Some(format_cost_report("restored-session", usage, None)),
|
|
|
})
|
|
})
|
|
|
}
|
|
}
|
|
|
SlashCommand::Config { section } => Ok(ResumeCommandOutcome {
|
|
SlashCommand::Config { section } => Ok(ResumeCommandOutcome {
|
|
@@ -891,8 +980,9 @@ fn run_repl(
|
|
|
model: String,
|
|
model: String,
|
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
|
permission_mode: PermissionMode,
|
|
permission_mode: PermissionMode,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
) -> Result<(), Box<dyn std::error::Error>> {
|
|
) -> Result<(), Box<dyn std::error::Error>> {
|
|
|
- let mut cli = LiveCli::new(model, true, allowed_tools, permission_mode)?;
|
|
|
|
|
|
|
+ let mut cli = LiveCli::new(model, true, allowed_tools, permission_mode, max_cost_usd)?;
|
|
|
let mut editor = input::LineEditor::new("› ", slash_command_completion_candidates());
|
|
let mut editor = input::LineEditor::new("› ", slash_command_completion_candidates());
|
|
|
println!("{}", cli.startup_banner());
|
|
println!("{}", cli.startup_banner());
|
|
|
|
|
|
|
@@ -945,6 +1035,7 @@ struct LiveCli {
|
|
|
model: String,
|
|
model: String,
|
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
|
permission_mode: PermissionMode,
|
|
permission_mode: PermissionMode,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
system_prompt: Vec<String>,
|
|
system_prompt: Vec<String>,
|
|
|
runtime: ConversationRuntime<AnthropicRuntimeClient, CliToolExecutor>,
|
|
runtime: ConversationRuntime<AnthropicRuntimeClient, CliToolExecutor>,
|
|
|
session: SessionHandle,
|
|
session: SessionHandle,
|
|
@@ -956,6 +1047,7 @@ impl LiveCli {
|
|
|
enable_tools: bool,
|
|
enable_tools: bool,
|
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
allowed_tools: Option<AllowedToolSet>,
|
|
|
permission_mode: PermissionMode,
|
|
permission_mode: PermissionMode,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
) -> Result<Self, Box<dyn std::error::Error>> {
|
|
) -> Result<Self, Box<dyn std::error::Error>> {
|
|
|
let system_prompt = build_system_prompt()?;
|
|
let system_prompt = build_system_prompt()?;
|
|
|
let session = create_managed_session_handle()?;
|
|
let session = create_managed_session_handle()?;
|
|
@@ -971,6 +1063,7 @@ impl LiveCli {
|
|
|
model,
|
|
model,
|
|
|
allowed_tools,
|
|
allowed_tools,
|
|
|
permission_mode,
|
|
permission_mode,
|
|
|
|
|
+ max_cost_usd,
|
|
|
system_prompt,
|
|
system_prompt,
|
|
|
runtime,
|
|
runtime,
|
|
|
session,
|
|
session,
|
|
@@ -981,9 +1074,10 @@ impl LiveCli {
|
|
|
|
|
|
|
|
fn startup_banner(&self) -> String {
|
|
fn startup_banner(&self) -> String {
|
|
|
format!(
|
|
format!(
|
|
|
- "Rusty Claude CLI\n Model {}\n Permission mode {}\n Working directory {}\n Session {}\n\nType /help for commands. Shift+Enter or Ctrl+J inserts a newline.",
|
|
|
|
|
|
|
+ "Rusty Claude CLI\n Model {}\n Permission mode {}\n Cost budget {}\n Working directory {}\n Session {}\n\nType /help for commands. Shift+Enter or Ctrl+J inserts a newline.",
|
|
|
self.model,
|
|
self.model,
|
|
|
self.permission_mode.as_str(),
|
|
self.permission_mode.as_str(),
|
|
|
|
|
+ self.max_cost_usd.map_or_else(|| "none".to_string(), format_usd),
|
|
|
env::current_dir().map_or_else(
|
|
env::current_dir().map_or_else(
|
|
|
|_| "<unknown>".to_string(),
|
|
|_| "<unknown>".to_string(),
|
|
|
|path| path.display().to_string(),
|
|
|path| path.display().to_string(),
|
|
@@ -993,6 +1087,7 @@ impl LiveCli {
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
fn run_turn(&mut self, input: &str) -> Result<(), Box<dyn std::error::Error>> {
|
|
fn run_turn(&mut self, input: &str) -> Result<(), Box<dyn std::error::Error>> {
|
|
|
|
|
+ self.enforce_budget_before_turn()?;
|
|
|
let mut spinner = Spinner::new();
|
|
let mut spinner = Spinner::new();
|
|
|
let mut stdout = io::stdout();
|
|
let mut stdout = io::stdout();
|
|
|
spinner.tick(
|
|
spinner.tick(
|
|
@@ -1003,13 +1098,14 @@ impl LiveCli {
|
|
|
let mut permission_prompter = CliPermissionPrompter::new(self.permission_mode);
|
|
let mut permission_prompter = CliPermissionPrompter::new(self.permission_mode);
|
|
|
let result = self.runtime.run_turn(input, Some(&mut permission_prompter));
|
|
let result = self.runtime.run_turn(input, Some(&mut permission_prompter));
|
|
|
match result {
|
|
match result {
|
|
|
- Ok(_) => {
|
|
|
|
|
|
|
+ Ok(summary) => {
|
|
|
spinner.finish(
|
|
spinner.finish(
|
|
|
"Claude response complete",
|
|
"Claude response complete",
|
|
|
TerminalRenderer::new().color_theme(),
|
|
TerminalRenderer::new().color_theme(),
|
|
|
&mut stdout,
|
|
&mut stdout,
|
|
|
)?;
|
|
)?;
|
|
|
println!();
|
|
println!();
|
|
|
|
|
+ self.print_budget_notice(summary.usage);
|
|
|
self.persist_session()?;
|
|
self.persist_session()?;
|
|
|
Ok(())
|
|
Ok(())
|
|
|
}
|
|
}
|
|
@@ -1036,6 +1132,7 @@ impl LiveCli {
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
fn run_prompt_json(&mut self, input: &str) -> Result<(), Box<dyn std::error::Error>> {
|
|
fn run_prompt_json(&mut self, input: &str) -> Result<(), Box<dyn std::error::Error>> {
|
|
|
|
|
+ self.enforce_budget_before_turn()?;
|
|
|
let client = AnthropicClient::from_auth(resolve_cli_auth_source()?);
|
|
let client = AnthropicClient::from_auth(resolve_cli_auth_source()?);
|
|
|
let request = MessageRequest {
|
|
let request = MessageRequest {
|
|
|
model: self.model.clone(),
|
|
model: self.model.clone(),
|
|
@@ -1062,17 +1159,27 @@ impl LiveCli {
|
|
|
})
|
|
})
|
|
|
.collect::<Vec<_>>()
|
|
.collect::<Vec<_>>()
|
|
|
.join("");
|
|
.join("");
|
|
|
|
|
+ let usage = TokenUsage {
|
|
|
|
|
+ input_tokens: response.usage.input_tokens,
|
|
|
|
|
+ output_tokens: response.usage.output_tokens,
|
|
|
|
|
+ cache_creation_input_tokens: response.usage.cache_creation_input_tokens,
|
|
|
|
|
+ cache_read_input_tokens: response.usage.cache_read_input_tokens,
|
|
|
|
|
+ };
|
|
|
println!(
|
|
println!(
|
|
|
"{}",
|
|
"{}",
|
|
|
json!({
|
|
json!({
|
|
|
"message": text,
|
|
"message": text,
|
|
|
"model": self.model,
|
|
"model": self.model,
|
|
|
"usage": {
|
|
"usage": {
|
|
|
- "input_tokens": response.usage.input_tokens,
|
|
|
|
|
- "output_tokens": response.usage.output_tokens,
|
|
|
|
|
- "cache_creation_input_tokens": response.usage.cache_creation_input_tokens,
|
|
|
|
|
- "cache_read_input_tokens": response.usage.cache_read_input_tokens,
|
|
|
|
|
- }
|
|
|
|
|
|
|
+ "input_tokens": usage.input_tokens,
|
|
|
|
|
+ "output_tokens": usage.output_tokens,
|
|
|
|
|
+ "cache_creation_input_tokens": usage.cache_creation_input_tokens,
|
|
|
|
|
+ "cache_read_input_tokens": usage.cache_read_input_tokens,
|
|
|
|
|
+ },
|
|
|
|
|
+ "cost_usd": usage_cost_total(&self.model, usage),
|
|
|
|
|
+ "cumulative_cost_usd": usage_cost_total(&self.model, usage),
|
|
|
|
|
+ "max_cost_usd": self.max_cost_usd,
|
|
|
|
|
+ "budget_warning": budget_notice_message(&self.model, usage, self.max_cost_usd),
|
|
|
})
|
|
})
|
|
|
);
|
|
);
|
|
|
Ok(())
|
|
Ok(())
|
|
@@ -1142,6 +1249,28 @@ impl LiveCli {
|
|
|
Ok(())
|
|
Ok(())
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
+ fn enforce_budget_before_turn(&self) -> Result<(), Box<dyn std::error::Error>> {
|
|
|
|
|
+ let Some(limit) = self.max_cost_usd else {
|
|
|
|
|
+ return Ok(());
|
|
|
|
|
+ };
|
|
|
|
|
+ let cost = usage_cost_total(&self.model, self.runtime.usage().cumulative_usage());
|
|
|
|
|
+ if cost >= limit {
|
|
|
|
|
+ return Err(format!(
|
|
|
|
|
+ "cost budget exceeded before starting turn: cumulative={} budget={}",
|
|
|
|
|
+ format_usd(cost),
|
|
|
|
|
+ format_usd(limit)
|
|
|
|
|
+ )
|
|
|
|
|
+ .into());
|
|
|
|
|
+ }
|
|
|
|
|
+ Ok(())
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ fn print_budget_notice(&self, usage: TokenUsage) {
|
|
|
|
|
+ if let Some(message) = budget_notice_message(&self.model, usage, self.max_cost_usd) {
|
|
|
|
|
+ eprintln!("warning: {message}");
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
fn print_status(&self) {
|
|
fn print_status(&self) {
|
|
|
let cumulative = self.runtime.usage().cumulative_usage();
|
|
let cumulative = self.runtime.usage().cumulative_usage();
|
|
|
let latest = self.runtime.usage().current_turn_usage();
|
|
let latest = self.runtime.usage().current_turn_usage();
|
|
@@ -1158,6 +1287,7 @@ impl LiveCli {
|
|
|
},
|
|
},
|
|
|
self.permission_mode.as_str(),
|
|
self.permission_mode.as_str(),
|
|
|
&status_context(Some(&self.session.path)).expect("status context should load"),
|
|
&status_context(Some(&self.session.path)).expect("status context should load"),
|
|
|
|
|
+ self.max_cost_usd,
|
|
|
)
|
|
)
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
@@ -1275,7 +1405,10 @@ impl LiveCli {
|
|
|
|
|
|
|
|
fn print_cost(&self) {
|
|
fn print_cost(&self) {
|
|
|
let cumulative = self.runtime.usage().cumulative_usage();
|
|
let cumulative = self.runtime.usage().cumulative_usage();
|
|
|
- println!("{}", format_cost_report(cumulative));
|
|
|
|
|
|
|
+ println!(
|
|
|
|
|
+ "{}",
|
|
|
|
|
+ format_cost_report(&self.model, cumulative, self.max_cost_usd)
|
|
|
|
|
+ );
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
fn resume_session(
|
|
fn resume_session(
|
|
@@ -1553,7 +1686,10 @@ fn format_status_report(
|
|
|
usage: StatusUsage,
|
|
usage: StatusUsage,
|
|
|
permission_mode: &str,
|
|
permission_mode: &str,
|
|
|
context: &StatusContext,
|
|
context: &StatusContext,
|
|
|
|
|
+ max_cost_usd: Option<f64>,
|
|
|
) -> String {
|
|
) -> String {
|
|
|
|
|
+ let latest_cost = usage_cost_total(model, usage.latest);
|
|
|
|
|
+ let cumulative_cost = usage_cost_total(model, usage.cumulative);
|
|
|
[
|
|
[
|
|
|
format!(
|
|
format!(
|
|
|
"Status
|
|
"Status
|
|
@@ -1561,19 +1697,27 @@ fn format_status_report(
|
|
|
Permission mode {permission_mode}
|
|
Permission mode {permission_mode}
|
|
|
Messages {}
|
|
Messages {}
|
|
|
Turns {}
|
|
Turns {}
|
|
|
- Estimated tokens {}",
|
|
|
|
|
- usage.message_count, usage.turns, usage.estimated_tokens,
|
|
|
|
|
|
|
+ Estimated tokens {}
|
|
|
|
|
+ Cost budget {}",
|
|
|
|
|
+ usage.message_count,
|
|
|
|
|
+ usage.turns,
|
|
|
|
|
+ usage.estimated_tokens,
|
|
|
|
|
+ format_budget_line(cumulative_cost, max_cost_usd),
|
|
|
),
|
|
),
|
|
|
format!(
|
|
format!(
|
|
|
"Usage
|
|
"Usage
|
|
|
Latest total {}
|
|
Latest total {}
|
|
|
|
|
+ Latest cost {}
|
|
|
Cumulative input {}
|
|
Cumulative input {}
|
|
|
Cumulative output {}
|
|
Cumulative output {}
|
|
|
- Cumulative total {}",
|
|
|
|
|
|
|
+ Cumulative total {}
|
|
|
|
|
+ Cumulative cost {}",
|
|
|
usage.latest.total_tokens(),
|
|
usage.latest.total_tokens(),
|
|
|
|
|
+ format_usd(latest_cost),
|
|
|
usage.cumulative.input_tokens,
|
|
usage.cumulative.input_tokens,
|
|
|
usage.cumulative.output_tokens,
|
|
usage.cumulative.output_tokens,
|
|
|
usage.cumulative.total_tokens(),
|
|
usage.cumulative.total_tokens(),
|
|
|
|
|
+ format_usd(cumulative_cost),
|
|
|
),
|
|
),
|
|
|
format!(
|
|
format!(
|
|
|
"Workspace
|
|
"Workspace
|
|
@@ -2345,9 +2489,9 @@ fn print_help() {
|
|
|
println!("rusty-claude-cli v{VERSION}");
|
|
println!("rusty-claude-cli v{VERSION}");
|
|
|
println!();
|
|
println!();
|
|
|
println!("Usage:");
|
|
println!("Usage:");
|
|
|
- println!(" rusty-claude-cli [--model MODEL] [--allowedTools TOOL[,TOOL...]]");
|
|
|
|
|
|
|
+ println!(" rusty-claude-cli [--model MODEL] [--max-cost USD] [--allowedTools TOOL[,TOOL...]]");
|
|
|
println!(" Start the interactive REPL");
|
|
println!(" Start the interactive REPL");
|
|
|
- println!(" rusty-claude-cli [--model MODEL] [--output-format text|json] prompt TEXT");
|
|
|
|
|
|
|
+ println!(" rusty-claude-cli [--model MODEL] [--max-cost USD] [--output-format text|json] prompt TEXT");
|
|
|
println!(" Send one prompt and exit");
|
|
println!(" Send one prompt and exit");
|
|
|
println!(" rusty-claude-cli [--model MODEL] [--output-format text|json] TEXT");
|
|
println!(" rusty-claude-cli [--model MODEL] [--output-format text|json] TEXT");
|
|
|
println!(" Shorthand non-interactive prompt mode");
|
|
println!(" Shorthand non-interactive prompt mode");
|
|
@@ -2363,6 +2507,7 @@ fn print_help() {
|
|
|
println!(" --model MODEL Override the active model");
|
|
println!(" --model MODEL Override the active model");
|
|
|
println!(" --output-format FORMAT Non-interactive output format: text or json");
|
|
println!(" --output-format FORMAT Non-interactive output format: text or json");
|
|
|
println!(" --permission-mode MODE Set read-only, workspace-write, or danger-full-access");
|
|
println!(" --permission-mode MODE Set read-only, workspace-write, or danger-full-access");
|
|
|
|
|
+ println!(" --max-cost USD Warn at 80% of budget and stop at/exceeding the budget");
|
|
|
println!(" --allowedTools TOOLS Restrict enabled tools (repeatable; comma-separated aliases supported)");
|
|
println!(" --allowedTools TOOLS Restrict enabled tools (repeatable; comma-separated aliases supported)");
|
|
|
println!(" --version, -V Print version and build information locally");
|
|
println!(" --version, -V Print version and build information locally");
|
|
|
println!();
|
|
println!();
|
|
@@ -2389,13 +2534,14 @@ fn print_help() {
|
|
|
#[cfg(test)]
|
|
#[cfg(test)]
|
|
|
mod tests {
|
|
mod tests {
|
|
|
use super::{
|
|
use super::{
|
|
|
- filter_tool_specs, format_compact_report, format_cost_report, format_init_report,
|
|
|
|
|
- format_model_report, format_model_switch_report, format_permissions_report,
|
|
|
|
|
- format_permissions_switch_report, format_resume_report, format_status_report,
|
|
|
|
|
- format_tool_call_start, format_tool_result, normalize_permission_mode, parse_args,
|
|
|
|
|
- parse_git_status_metadata, render_config_report, render_init_claude_md,
|
|
|
|
|
- render_memory_report, render_repl_help, resume_supported_slash_commands, status_context,
|
|
|
|
|
- CliAction, CliOutputFormat, SlashCommand, StatusUsage, DEFAULT_MODEL,
|
|
|
|
|
|
|
+ budget_notice_message, filter_tool_specs, format_compact_report, format_cost_report,
|
|
|
|
|
+ format_init_report, format_model_report, format_model_switch_report,
|
|
|
|
|
+ format_permissions_report, format_permissions_switch_report, format_resume_report,
|
|
|
|
|
+ format_status_report, format_tool_call_start, format_tool_result,
|
|
|
|
|
+ normalize_permission_mode, parse_args, parse_git_status_metadata, render_config_report,
|
|
|
|
|
+ render_init_claude_md, render_memory_report, render_repl_help,
|
|
|
|
|
+ resume_supported_slash_commands, status_context, CliAction, CliOutputFormat, SlashCommand,
|
|
|
|
|
+ StatusUsage, DEFAULT_MODEL,
|
|
|
};
|
|
};
|
|
|
use runtime::{ContentBlock, ConversationMessage, MessageRole, PermissionMode};
|
|
use runtime::{ContentBlock, ConversationMessage, MessageRole, PermissionMode};
|
|
|
use std::path::{Path, PathBuf};
|
|
use std::path::{Path, PathBuf};
|
|
@@ -2408,6 +2554,7 @@ mod tests {
|
|
|
model: DEFAULT_MODEL.to_string(),
|
|
model: DEFAULT_MODEL.to_string(),
|
|
|
allowed_tools: None,
|
|
allowed_tools: None,
|
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
|
|
|
+ max_cost_usd: None,
|
|
|
}
|
|
}
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
@@ -2427,6 +2574,7 @@ mod tests {
|
|
|
output_format: CliOutputFormat::Text,
|
|
output_format: CliOutputFormat::Text,
|
|
|
allowed_tools: None,
|
|
allowed_tools: None,
|
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
|
|
|
+ max_cost_usd: None,
|
|
|
}
|
|
}
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
@@ -2448,6 +2596,7 @@ mod tests {
|
|
|
output_format: CliOutputFormat::Json,
|
|
output_format: CliOutputFormat::Json,
|
|
|
allowed_tools: None,
|
|
allowed_tools: None,
|
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
|
|
|
+ max_cost_usd: None,
|
|
|
}
|
|
}
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
@@ -2473,10 +2622,32 @@ mod tests {
|
|
|
model: DEFAULT_MODEL.to_string(),
|
|
model: DEFAULT_MODEL.to_string(),
|
|
|
allowed_tools: None,
|
|
allowed_tools: None,
|
|
|
permission_mode: PermissionMode::ReadOnly,
|
|
permission_mode: PermissionMode::ReadOnly,
|
|
|
|
|
+ max_cost_usd: None,
|
|
|
|
|
+ }
|
|
|
|
|
+ );
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ #[test]
|
|
|
|
|
+ fn parses_max_cost_flag() {
|
|
|
|
|
+ let args = vec!["--max-cost=1.25".to_string()];
|
|
|
|
|
+ assert_eq!(
|
|
|
|
|
+ parse_args(&args).expect("args should parse"),
|
|
|
|
|
+ CliAction::Repl {
|
|
|
|
|
+ model: DEFAULT_MODEL.to_string(),
|
|
|
|
|
+ allowed_tools: None,
|
|
|
|
|
+ permission_mode: PermissionMode::WorkspaceWrite,
|
|
|
|
|
+ max_cost_usd: Some(1.25),
|
|
|
}
|
|
}
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
+ #[test]
|
|
|
|
|
+ fn rejects_invalid_max_cost_flag() {
|
|
|
|
|
+ let error = parse_args(&["--max-cost".to_string(), "0".to_string()])
|
|
|
|
|
+ .expect_err("zero max cost should be rejected");
|
|
|
|
|
+ assert!(error.contains("--max-cost must be a positive finite USD amount"));
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
#[test]
|
|
#[test]
|
|
|
fn parses_allowed_tools_flags_with_aliases_and_lists() {
|
|
fn parses_allowed_tools_flags_with_aliases_and_lists() {
|
|
|
let args = vec![
|
|
let args = vec![
|
|
@@ -2495,6 +2666,7 @@ mod tests {
|
|
|
.collect()
|
|
.collect()
|
|
|
),
|
|
),
|
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
permission_mode: PermissionMode::WorkspaceWrite,
|
|
|
|
|
+ max_cost_usd: None,
|
|
|
}
|
|
}
|
|
|
);
|
|
);
|
|
|
}
|
|
}
|
|
@@ -2652,18 +2824,24 @@ mod tests {
|
|
|
|
|
|
|
|
#[test]
|
|
#[test]
|
|
|
fn cost_report_uses_sectioned_layout() {
|
|
fn cost_report_uses_sectioned_layout() {
|
|
|
- let report = format_cost_report(runtime::TokenUsage {
|
|
|
|
|
- input_tokens: 20,
|
|
|
|
|
- output_tokens: 8,
|
|
|
|
|
- cache_creation_input_tokens: 3,
|
|
|
|
|
- cache_read_input_tokens: 1,
|
|
|
|
|
- });
|
|
|
|
|
|
|
+ let report = format_cost_report(
|
|
|
|
|
+ "claude-sonnet",
|
|
|
|
|
+ runtime::TokenUsage {
|
|
|
|
|
+ input_tokens: 20,
|
|
|
|
|
+ output_tokens: 8,
|
|
|
|
|
+ cache_creation_input_tokens: 3,
|
|
|
|
|
+ cache_read_input_tokens: 1,
|
|
|
|
|
+ },
|
|
|
|
|
+ None,
|
|
|
|
|
+ );
|
|
|
assert!(report.contains("Cost"));
|
|
assert!(report.contains("Cost"));
|
|
|
assert!(report.contains("Input tokens 20"));
|
|
assert!(report.contains("Input tokens 20"));
|
|
|
assert!(report.contains("Output tokens 8"));
|
|
assert!(report.contains("Output tokens 8"));
|
|
|
assert!(report.contains("Cache create 3"));
|
|
assert!(report.contains("Cache create 3"));
|
|
|
assert!(report.contains("Cache read 1"));
|
|
assert!(report.contains("Cache read 1"));
|
|
|
assert!(report.contains("Total tokens 32"));
|
|
assert!(report.contains("Total tokens 32"));
|
|
|
|
|
+ assert!(report.contains("Estimated cost"));
|
|
|
|
|
+ assert!(report.contains("Budget $0.0010 (unlimited)"));
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
#[test]
|
|
@@ -2745,6 +2923,7 @@ mod tests {
|
|
|
project_root: Some(PathBuf::from("/tmp")),
|
|
project_root: Some(PathBuf::from("/tmp")),
|
|
|
git_branch: Some("main".to_string()),
|
|
git_branch: Some("main".to_string()),
|
|
|
},
|
|
},
|
|
|
|
|
+ Some(1.0),
|
|
|
);
|
|
);
|
|
|
assert!(status.contains("Status"));
|
|
assert!(status.contains("Status"));
|
|
|
assert!(status.contains("Model claude-sonnet"));
|
|
assert!(status.contains("Model claude-sonnet"));
|
|
@@ -2752,6 +2931,7 @@ mod tests {
|
|
|
assert!(status.contains("Messages 7"));
|
|
assert!(status.contains("Messages 7"));
|
|
|
assert!(status.contains("Latest total 10"));
|
|
assert!(status.contains("Latest total 10"));
|
|
|
assert!(status.contains("Cumulative total 31"));
|
|
assert!(status.contains("Cumulative total 31"));
|
|
|
|
|
+ assert!(status.contains("Cost budget $0.0009 / $1.0000"));
|
|
|
assert!(status.contains("Cwd /tmp/project"));
|
|
assert!(status.contains("Cwd /tmp/project"));
|
|
|
assert!(status.contains("Project root /tmp"));
|
|
assert!(status.contains("Project root /tmp"));
|
|
|
assert!(status.contains("Git branch main"));
|
|
assert!(status.contains("Git branch main"));
|
|
@@ -2760,6 +2940,22 @@ mod tests {
|
|
|
assert!(status.contains("Memory files 4"));
|
|
assert!(status.contains("Memory files 4"));
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
+ #[test]
|
|
|
|
|
+ fn budget_notice_warns_near_limit() {
|
|
|
|
|
+ let message = budget_notice_message(
|
|
|
|
|
+ "claude-sonnet",
|
|
|
|
|
+ runtime::TokenUsage {
|
|
|
|
|
+ input_tokens: 60_000,
|
|
|
|
|
+ output_tokens: 0,
|
|
|
|
|
+ cache_creation_input_tokens: 0,
|
|
|
|
|
+ cache_read_input_tokens: 0,
|
|
|
|
|
+ },
|
|
|
|
|
+ Some(1.0),
|
|
|
|
|
+ )
|
|
|
|
|
+ .expect("budget warning expected");
|
|
|
|
|
+ assert!(message.contains("approaching cost budget"));
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
#[test]
|
|
#[test]
|
|
|
fn config_report_supports_section_views() {
|
|
fn config_report_supports_section_views() {
|
|
|
let report = render_config_report(Some("env")).expect("config report should render");
|
|
let report = render_config_report(Some("env")).expect("config report should render");
|
|
@@ -2797,8 +2993,8 @@ mod tests {
|
|
|
fn status_context_reads_real_workspace_metadata() {
|
|
fn status_context_reads_real_workspace_metadata() {
|
|
|
let context = status_context(None).expect("status context should load");
|
|
let context = status_context(None).expect("status context should load");
|
|
|
assert!(context.cwd.is_absolute());
|
|
assert!(context.cwd.is_absolute());
|
|
|
- assert_eq!(context.discovered_config_files, 3);
|
|
|
|
|
- assert!(context.loaded_config_files <= context.discovered_config_files);
|
|
|
|
|
|
|
+ assert!(context.discovered_config_files >= context.loaded_config_files);
|
|
|
|
|
+ assert!(context.discovered_config_files >= 1);
|
|
|
}
|
|
}
|
|
|
|
|
|
|
|
#[test]
|
|
#[test]
|