Class: Collavre::AiClient

Inherits:

Object

Object
Collavre::AiClient

show all

Defined in: app/services/collavre/ai_client.rb

Constant Summary collapse

# Frozen heredoc of response-style guidance for the model: be concise, use
# bullets sparingly, state only what is certain, and answer in the asker's
# language while leaving code and error messages untouched.
# NOTE(review): no reference to this constant appears in the methods shown on
# this page — confirm where it is applied before editing the wording.
SYSTEM_INSTRUCTIONS =

<<~PROMPT.freeze
  You are a senior expert teammate. Respond:
  - Be concise and focus on the essentials (avoid unnecessary verbosity).
  - Use short bullet points only when helpful.
  - State only what you're confident about; briefly note any uncertainty.
  - Respond in the asker's language (prefer the latest user message). Keep code and error messages in their original form.
PROMPT

Instance Attribute Summary collapse

#last_input_tokens ⇒ Object readonly

Returns the value of attribute last_input_tokens.
#last_output_tokens ⇒ Object readonly

Returns the value of attribute last_output_tokens.

Instance Method Summary collapse

#ask(prompt) ⇒ Object

Ask a follow-up question using the existing conversation context.
#chat(contents, tools: [], &block) ⇒ Object
#initialize(vendor:, model:, system_prompt:, llm_api_key: nil, gateway_url: nil, context: {}, log_interactions: true) ⇒ AiClient constructor

log_interactions: persist each call to ActivityLog.

Constructor Details

#initialize(vendor:, model:, system_prompt:, llm_api_key: nil, gateway_url: nil, context: {}, log_interactions: true) ⇒ `AiClient`

log_interactions: persist each call to ActivityLog. Default true. Pass false for ephemeral, high-frequency calls on text the user has not submitted (e.g. inline typo correction on debounced typing) so private drafts are never written to server-side activity logs.

# File 'app/services/collavre/ai_client.rb', line 17

def initialize(vendor:, model:, system_prompt:, llm_api_key: nil, gateway_url: nil, context: {}, log_interactions: true)
  @vendor = vendor
  @model = model
  @system_prompt = system_prompt
  @llm_api_key = llm_api_key
  @gateway_url = gateway_url
  @context = context
  @log_interactions = log_interactions
  @last_input_tokens = 0
  @last_output_tokens = 0
end

Instance Attribute Details

#last_input_tokens ⇒ `Object` (readonly)

Returns the value of attribute last_input_tokens.



11
12
13

# File 'app/services/collavre/ai_client.rb', line 11

# Input-token count recorded by the most recent #chat call.
#
# Set to 0 in #initialize; #chat's +ensure+ block then overwrites it with the
# response's +input_tokens+, or with 0 when none was captured (for example
# when the call failed).
#
# @return [Integer] presumably an Integer — the non-zero value comes straight
#   from the response object, so confirm its type against the LLM library
def last_input_tokens
  @last_input_tokens
end

#last_output_tokens ⇒ `Object` (readonly)

Returns the value of attribute last_output_tokens.



11
12
13

# File 'app/services/collavre/ai_client.rb', line 11

# Output-token count recorded by the most recent #chat call.
#
# Set to 0 in #initialize; #chat's +ensure+ block then overwrites it with the
# response's +output_tokens+, or with 0 when none was captured (for example
# when the call failed).
#
# @return [Integer] presumably an Integer — the non-zero value comes straight
#   from the response object, so confirm its type against the LLM library
def last_output_tokens
  @last_output_tokens
end

Instance Method Details

#ask(prompt) ⇒ `Object`

Ask a follow-up question using the existing conversation context. Used to generate approval summaries with full conversation history. Returns the response content string, or nil on failure.

# File 'app/services/collavre/ai_client.rb', line 101

# Ask a follow-up question on the conversation left in @conversation by #chat.
#
# Never raises StandardError: any failure is logged as a warning and turned
# into nil.
#
# @param prompt the follow-up prompt handed to the conversation's +ask+
# @return [String, nil] the stripped response content; nil when there is no
#   conversation, the content is blank, or the call raised
def ask(prompt)
  return nil unless @conversation

  # Disable tool calls for summary generation to avoid recursive approval
  @conversation.with_tools(replace: true)
  response = @conversation.ask(prompt)
  response&.content&.strip.presence
rescue StandardError => e
  # Error messages from the LLM can echo request text. When log_interactions
  # is off, log only the error class — the same rule #chat applies — so
  # private text never reaches the application log.
  detail = @log_interactions ? "#{e.class} #{e.message}" : e.class.to_s
  Rails.logger.warn("AiClient#ask failed: #{detail}")
  nil
end

#chat(contents, tools: [], &block) ⇒ `Object`

# File 'app/services/collavre/ai_client.rb', line 29

# Run one completion over +contents+, streaming text deltas to the optional block.
#
# Builds a new conversation and keeps it in @conversation so #ask can follow
# up on it. Token usage is stored in @last_input_tokens / @last_output_tokens.
# When log_interactions is on, the exchange is handed to log_interaction from
# the +ensure+ block, so that happens on success, on a rescued failure, and on
# re-raised errors alike.
#
# @param contents messages passed to add_messages (shape is defined by that helper)
# @param tools [Array] tools passed to build_conversation
# @yield [String] each non-blank streamed delta; after a rescued failure, one
#   final "AI Error" string
# @return [String, nil] the response text; nil when it is blank or a
#   StandardError was rescued
# @raise [ApprovalPendingError] re-raised untouched
# @raise [CancelledError] re-raised untouched
def chat(contents, tools: [], &block)
  response_content = +""
  error_message = nil
  input_tokens = nil
  output_tokens = nil

  # Forget the previous call's conversation before anything can fail. Without
  # this, a failure in build_conversation would leave the old conversation in
  # place, and both the ensure log below and a later #ask would use it.
  @conversation = nil

  # Read the ivar directly, as the warning below already does.
  normalized_vendor = @vendor.to_s.downcase
  unless VENDOR_TO_PROVIDER.key?(normalized_vendor)
    Rails.logger.warn "Unsupported LLM vendor '#{@vendor}'. Attempting to use default (google)."
  end

  @conversation = build_conversation(tools)
  add_messages(@conversation, contents)

  response = @conversation.complete do |chunk|
    delta = extract_chunk_content(chunk)
    next if delta.blank?

    response_content << delta
    yield delta if block_given?
  end

  if response
    # Prefer the final response body over the text accumulated from chunks.
    response_content = response.content.to_s if response.content.present?

    # Extract token usage directly from response object (RubyLLM style)
    input_tokens = response.input_tokens if response.respond_to?(:input_tokens)
    output_tokens = response.output_tokens if response.respond_to?(:output_tokens)
  end

  response_content.presence
rescue ApprovalPendingError
  # Preserve conversation for follow-up (e.g. generating approval summary)
  raise
rescue CancelledError
  raise # Re-raise cancellation errors without catching them
rescue StandardError => e
  error_message = "[#{e.class.name}] #{e.message}"
  # When log_interactions is false (inline typo correction runs on the user's
  # *unsubmitted* draft), the LLM error message can echo the request text. Log
  # only the error class to app logs so private drafts never leak — matching the
  # no-log guarantee already enforced on the parse path (TypoCorrector) and the
  # ActivityLog gate below. error_message stays intact for the gated ensure log
  # and the streamed yield (which goes back to the same user).
  Rails.logger.error "AI Client error: #{@log_interactions ? error_message : "[#{e.class.name}]"}"
  Rails.logger.error "Partial response length: #{response_content.length} chars" if response_content.present?
  # Array() keeps this line from raising if the exception carries no backtrace.
  Rails.logger.debug Array(e.backtrace).join("\n")
  yield "\n\n⚠️ AI Error: #{error_message}" if block_given?
  nil
ensure
  # Counters fall back to 0 whenever usage was not captured.
  @last_input_tokens = input_tokens || 0
  @last_output_tokens = output_tokens || 0
  if @log_interactions
    log_interaction(
      # Fall back to the raw input when no conversation was built.
      messages: @conversation&.messages&.to_a || Array(contents),
      tools: @conversation&.tools&.to_a || [],
      response_content: response_content.presence,
      error_message: error_message,
      input_tokens: input_tokens,
      output_tokens: output_tokens
    )
  end
end