Module: Clacky::Agent::CostTracker

Included in:: Clacky::Agent

Defined in:: lib/clacky/agent/cost_tracker.rb

Overview

Cost tracking and token usage statistics Manages cost calculation, token estimation, and usage display

Instance Method Summary collapse

#collect_iteration_tokens(usage, cost) ⇒ Hash

Collect token usage data for current iteration and return it.
#track_cost(usage, raw_api_usage: nil) ⇒ Object

Track cost from API usage Updates total cost and displays iteration statistics.

Instance Method Details

#collect_iteration_tokens(usage, cost) ⇒ `Hash`

Collect token usage data for current iteration and return it. Does NOT call @ui directly — the caller is responsible for displaying at the right moment (e.g. after show_assistant_message).

Parameters:

usage (Hash) —

Usage data from API
cost (Float) —

Cost for this iteration

Returns:

(Hash) —

token_data ready for show_token_usage

# File 'lib/clacky/agent/cost_tracker.rb', line 101

def collect_iteration_tokens(usage, cost)
  prompt_tokens = usage[:prompt_tokens] || 0
  completion_tokens = usage[:completion_tokens] || 0
  total_tokens = usage[:total_tokens] || (prompt_tokens + completion_tokens)
  cache_write = usage[:cache_creation_input_tokens] || 0
  cache_read = usage[:cache_read_input_tokens] || 0

  # Calculate token delta from previous iteration.
  #
  # Two conventions exist for total_tokens across providers:
  #   - OpenAI (default):    cumulative per-request input+output (grows
  #                          with history every turn). Delta = total - prev.
  #   - Anthropic direct:    already the per-turn new compute
  #                          (raw_input + cache_creation + output).
  #                          The MessageFormat sets :total_is_per_turn so
  #                          we use total_tokens directly as the delta.
  #
  # Without this branch, Anthropic's per-turn total would be treated as
  # cumulative and produce negative / nonsensical deltas whenever cached
  # prefixes make the per-turn new-compute smaller than the previous turn.
  delta_tokens =
    if usage[:total_is_per_turn]
      total_tokens
    else
      total_tokens - @previous_total_tokens
    end
  @previous_total_tokens = total_tokens  # Update for next iteration

  {
    delta_tokens: delta_tokens,
    prompt_tokens: prompt_tokens,
    completion_tokens: completion_tokens,
    total_tokens: total_tokens,
    cache_write: cache_write,
    cache_read: cache_read,
    cost: cost,
    cost_source: @cost_source
  }
end

#track_cost(usage, raw_api_usage: nil) ⇒ `Object`

Track cost from API usage Updates total cost and displays iteration statistics

Parameters:

usage (Hash) —

Usage data from API response
raw_api_usage (Hash, nil) (defaults to: nil) —

Raw API usage data for debugging

# File 'lib/clacky/agent/cost_tracker.rb', line 12

def track_cost(usage, raw_api_usage: nil)
  # Priority 1: Use API-provided cost if available (OpenRouter, LiteLLM, etc.)
  iteration_cost = nil
  if usage[:api_cost]
    @total_cost += usage[:api_cost]
    @cost_source = :api
    @task_cost_source = :api
    iteration_cost = usage[:api_cost]
    @ui&.log("Using API-provided cost: $#{usage[:api_cost]}", level: :debug) if @config.verbose
  else
    # Priority 2: Calculate from tokens using ModelPricing
    result = ModelPricing.calculate_cost(model: current_model, usage: usage)
    cost = result[:cost]
    pricing_source = result[:source]

    # Only accumulate cost when the model has known pricing.
    # Unknown models return nil — display N/A, don't add to total.
    if cost
      @total_cost += cost
      iteration_cost = cost
      @cost_source = pricing_source
      @task_cost_source = pricing_source
    end

    if @config.verbose
      if cost
        source_label = pricing_source == :price ? "model pricing" : "default pricing"
        @ui&.log("Calculated cost for #{@config.model_name} using #{source_label}: $#{cost.round(6)}", level: :debug)
      else
        @ui&.log("No pricing data available for #{@config.model_name} — cost is unknown", level: :debug)
      end
      @ui&.log("Usage breakdown: prompt=#{usage[:prompt_tokens]}, completion=#{usage[:completion_tokens]}, cache_write=#{usage[:cache_creation_input_tokens] || 0}, cache_read=#{usage[:cache_read_input_tokens] || 0}", level: :debug)
    end
  end

  # Collect token usage data for this iteration (returned to caller for deferred display)
  token_data = collect_iteration_tokens(usage, iteration_cost)

  # Update session bar cost in real-time (don't wait for agent.run to finish)
  @ui&.update_sessionbar(cost: @total_cost, cost_source: @cost_source)

  # Track cache usage statistics (global)
  @cache_stats[:total_requests] += 1

  if usage[:cache_creation_input_tokens]
    @cache_stats[:cache_creation_input_tokens] += usage[:cache_creation_input_tokens]
  end

  if usage[:cache_read_input_tokens]
    @cache_stats[:cache_read_input_tokens] += usage[:cache_read_input_tokens]
    @cache_stats[:cache_hit_requests] += 1
  end

  # Store raw API usage samples (keep last 3 for debugging)
  if raw_api_usage
    @cache_stats[:raw_api_usage_samples] ||= []
    @cache_stats[:raw_api_usage_samples] << raw_api_usage
    @cache_stats[:raw_api_usage_samples] = @cache_stats[:raw_api_usage_samples].last(3)
  end

  # Track cache usage for current task
  if @task_cache_stats
    @task_cache_stats[:total_requests] += 1

    if usage[:cache_creation_input_tokens]
      @task_cache_stats[:cache_creation_input_tokens] += usage[:cache_creation_input_tokens]
    end

    if usage[:cache_read_input_tokens]
      @task_cache_stats[:cache_read_input_tokens] += usage[:cache_read_input_tokens]
      @task_cache_stats[:cache_hit_requests] += 1
    end
  end

  # Return token_data so the caller can display it at the right moment
  token_data
end