Module: Legion::LLM::Inference::ContextAccounting

Defined in: lib/legion/llm/inference/context_accounting.rb

Constant Summary collapse

TOKEN_CHAR_DIVISOR =

SCHEMA_VERSION =

# Names of the estimated-token fields carried by an accounting record.
# `empty` seeds every one of these keys with 0 under its :tokens entry.
TOKEN_KEYS =

%i[
  request_message_estimated_tokens
  loaded_history_estimated_tokens
  curated_history_estimated_tokens
  curation_saved_estimated_tokens
  stripped_thinking_estimated_tokens
  archived_history_estimated_tokens
  archive_saved_estimated_tokens
  context_window_saved_estimated_tokens
  rag_injected_estimated_tokens
  system_prompt_estimated_tokens
  baseline_system_estimated_tokens
  tool_definition_estimated_tokens
  final_context_estimated_tokens
].freeze

# Names of the counter fields carried by an accounting record.
# `empty` seeds every one of these keys with 0 under its :counts entry.
COUNT_KEYS =

%i[
  loaded_history_message_count
  curated_history_message_count
  archived_history_message_count
  stripped_thinking_message_count
  context_window_message_count_before
  context_window_message_count_after
  rag_entry_count
  tool_definition_count
].freeze

# Maps a status name (String) to an Integer rank, from 'missing' (0) up to
# 'provider_reconciled' (4).
# NOTE(review): no consumer is visible in this excerpt — presumably the rank is
# used to compare or merge statuses; confirm against callers. Keys are Strings
# while `empty` defaults its status to the Symbol :estimated, so lookups
# presumably need a to_s — verify.
CONTEXT_ACCOUNTING_STATUS_RANK =

{
  'missing'             => 0,
  'profile_skipped'     => 1,
  'partial'             => 2,
  'estimated'           => 3,
  'provider_reconciled' => 4
}.freeze

Class Method Summary collapse

.content_text(content) ⇒ Object
.empty(status: :estimated) ⇒ Object
.estimate_json_tokens(value) ⇒ Object
.estimate_message_tokens(messages) ⇒ Object
.estimate_text_tokens(text) ⇒ Object
.event(event_type:, component:, before_tokens:, after_tokens:, before_count: 0, after_count: 0, metadata: {}) ⇒ Object
.message_text(message) ⇒ Object

Class Method Details

.content_text(content) ⇒ `Object`

# File 'lib/legion/llm/inference/context_accounting.rb', line 88

# Flattens message content into one plain-text string.
#
# Non-Array content is returned as +content.to_s+. For an Array, every Hash
# part contributes its +:text+ value, or its +:content+ value when +:text+ is
# nil/false. The string keys "text" and "content" are consulted as a fallback
# so that parts whose keys were never symbolized are not treated as empty.
# Any non-Hash part contributes +part.to_s+. Parts are joined with newlines.
#
# @param content [Object] message content; an Array is treated as a list of parts
# @return [String] the flattened text
def content_text(content)
  return content.to_s unless content.is_a?(Array)

  content.map do |part|
    next part.to_s unless part.is_a?(Hash)

    # Symbol keys keep their original precedence; string keys are only a fallback.
    (part[:text] || part[:content] || part['text'] || part['content']).to_s
  end.join("\n")
end

.empty(status: :estimated) ⇒ `Object`

# File 'lib/legion/llm/inference/context_accounting.rb', line 47

# Builds a blank accounting record.
#
# Every key in COUNT_KEYS and TOKEN_KEYS starts at 0, every component is
# marked +:not_observed+, and the reconciliation hash and event list start
# empty. New containers are allocated on every call.
#
# @param status [Object] value stored under +:status+ (defaults to +:estimated+)
# @return [Hash] the freshly built record
def empty(status: :estimated)
  components = %i[context_load curation archive rag tools system context_window thinking_strip]

  {
    schema_version:   SCHEMA_VERSION,
    status:           status,
    estimator:        { name: :legion_char_div_four, version: 1 },
    counts:           COUNT_KEYS.each_with_object({}) { |key, zeroed| zeroed[key] = 0 },
    tokens:           TOKEN_KEYS.each_with_object({}) { |key, zeroed| zeroed[key] = 0 },
    reconciliation:   {},
    component_status: components.each_with_object({}) { |name, states| states[name] = :not_observed },
    events:           []
  }
end

.estimate_json_tokens(value) ⇒ `Object`



77
78
79

# File 'lib/legion/llm/inference/context_accounting.rb', line 77

# Estimates the token count of a value's JSON serialization.
#
# A falsy value (+nil+ or +false+) is replaced by an empty Hash, the payload
# is serialized with +Legion::JSON.dump+, and the resulting string is measured
# with +estimate_text_tokens+.
#
# @param value [Object, nil] data to serialize
# @return [Integer] the estimate produced by +estimate_text_tokens+
def estimate_json_tokens(value)
  payload = value || {}
  serialized = Legion::JSON.dump(payload)
  estimate_text_tokens(serialized)
end

.estimate_message_tokens(messages) ⇒ `Object`



73
74
75

# File 'lib/legion/llm/inference/context_accounting.rb', line 73

# Sums the estimated token counts of a collection of messages.
#
# Each message is reduced to text with +message_text+ and measured with
# +estimate_text_tokens+. +nil+ yields 0 and a single non-Hash value is
# treated as a one-element list.
#
# @param messages [Array, Hash, Object, nil] one message or a list of messages
# @return [Integer] total estimated tokens (0 for nil or an empty list)
def estimate_message_tokens(messages)
  # Array(hash) would explode a lone message Hash into [key, value] pairs and
  # estimate each pair's inspect string, so a single Hash is wrapped explicitly.
  list = messages.is_a?(Hash) ? [messages] : Array(messages)

  list.sum { |message| estimate_text_tokens(message_text(message)) }
end

.estimate_text_tokens(text) ⇒ `Object`



69
70
71

# File 'lib/legion/llm/inference/context_accounting.rb', line 69

# Estimates how many tokens a piece of text occupies.
#
# The input is coerced with +to_s+, its character count is divided by
# TOKEN_CHAR_DIVISOR using floating-point division, and the quotient is
# rounded up.
#
# @param text [Object] text to measure (+nil+ counts as an empty string)
# @return [Integer] the rounded-up estimate
def estimate_text_tokens(text)
  char_count = text.to_s.length
  chars_per_token = TOKEN_CHAR_DIVISOR.to_f

  (char_count / chars_per_token).ceil
end

.event(event_type:, component:, before_tokens:, after_tokens:, before_count: 0, after_count: 0, metadata: {}) ⇒ `Object`

# File 'lib/legion/llm/inference/context_accounting.rb', line 96

# Builds one accounting event describing a before/after change.
#
# Token and count arguments are coerced with +to_i+. The delta is the
# after-token value minus the before-token value, so a reduction is negative.
# +metadata+ is stored as given, without copying.
#
# @param event_type [Object] stored under +:event_type+
# @param component [Object] stored under +:component+
# @param before_tokens [#to_i] estimated tokens before the change
# @param after_tokens [#to_i] estimated tokens after the change
# @param before_count [#to_i] message count before the change (default 0)
# @param after_count [#to_i] message count after the change (default 0)
# @param metadata [Object] extra data attached to the event (default +{}+)
# @return [Hash] the event record
def event(event_type:, component:, before_tokens:, after_tokens:, before_count: 0, after_count: 0, metadata: {})
  tokens_before = before_tokens.to_i
  tokens_after = after_tokens.to_i

  record = { event_type: event_type, component: component }
  record[:estimated_tokens_before] = tokens_before
  record[:estimated_tokens_after] = tokens_after
  record[:estimated_tokens_delta] = tokens_after - tokens_before
  record[:message_count_before] = before_count.to_i
  record[:message_count_after] = after_count.to_i
  record[:metadata] = metadata
  record
end

.message_text(message) ⇒ `Object`

# File 'lib/legion/llm/inference/context_accounting.rb', line 81

# Extracts the plain text of a single message.
#
# A non-Hash message is returned as +message.to_s+. For a Hash, the content is
# read from +:content+, falling back to the string key "content" so that
# messages whose keys were never symbolized are not treated as empty. The
# content is then flattened by +content_text+.
#
# @param message [Hash, Object] a message Hash or any other object
# @return [String] the message text
def message_text(message)
  return message.to_s unless message.is_a?(Hash)

  # The symbol key keeps precedence; the string key is only a fallback.
  content_text(message[:content] || message['content'])
end

Module: Legion::LLM::Inference::ContextAccounting

Constant Summary collapse

Class Method Summary collapse

Class Method Details

.content_text(content) ⇒ Object

.empty(status: :estimated) ⇒ Object

.estimate_json_tokens(value) ⇒ Object

.estimate_message_tokens(messages) ⇒ Object

.estimate_text_tokens(text) ⇒ Object

.event(event_type:, component:, before_tokens:, after_tokens:, before_count: 0, after_count: 0, metadata: {}) ⇒ Object

.message_text(message) ⇒ Object

.content_text(content) ⇒ `Object`

.empty(status: :estimated) ⇒ `Object`

.estimate_json_tokens(value) ⇒ `Object`

.estimate_message_tokens(messages) ⇒ `Object`

.estimate_text_tokens(text) ⇒ `Object`

.event(event_type:, component:, before_tokens:, after_tokens:, before_count: 0, after_count: 0, metadata: {}) ⇒ `Object`

.message_text(message) ⇒ `Object`