Class: Llmemory::Memory

Inherits: Object

Inheritance chain: Object → Llmemory::Memory

Defined in: lib/llmemory/memory.rb

Constant Summary collapse

DEFAULT_SESSION_ID =

"default"

STATE_KEY_MESSAGES =

:messages

Instance Method Summary collapse

#add_message(role:, content:) ⇒ Object
#check_context_window! ⇒ Object
#clear_session! ⇒ Object
#compact!(max_bytes: nil) ⇒ Object
#consolidate! ⇒ Object
#context_tokens ⇒ Object
#episodic ⇒ Object

Episodic long-term memory (CoALA): records and retrieves agent trajectories.
#initialize(user_id:, session_id: DEFAULT_SESSION_ID, checkpoint: nil, long_term: nil, long_term_type: nil, retrieval_engine: nil, working_memory: nil, episodic: nil, procedural: nil, api_key: nil) ⇒ Memory constructor

A new instance of Memory.
#last_user_message ⇒ Object
#maintain!(**opts) ⇒ Object

Cognitive maintenance pass: consolidate -> reflect -> mine skills -> expire, in one step, closing the CoALA learning loop.
#maybe_flush_memory! ⇒ Object
#messages ⇒ Object
#mine_skills!(window: SkillMining::Miner::DEFAULT_WINDOW, outcomes: nil, auto_register: false) ⇒ Object

Mines recent episodes for reusable skills (Voyager-style).
#procedural ⇒ Object

Procedural long-term memory (Voyager-style skill library).
#prune!(mode: nil) ⇒ Object
#reason(template:, into: Actions::Reason::DEFAULT_SLOT, parse: nil) ⇒ Object

Reasoning action: render a prompt from working memory, call the LLM, write the result back.
#recall_for(query: nil, max_tokens: nil) ⇒ Object
#reflect!(window: 10, category: "insights") ⇒ Object

Reflects over recent episodes and writes distilled insights to the semantic store (file/graph) with provenance back to source episodes.
#retrieve(query, max_tokens: nil) ⇒ Object
#should_auto_consolidate? ⇒ Boolean
#should_compact? ⇒ Boolean
#user_id ⇒ Object
#with_overflow_recovery(max_retries: 2, &block) ⇒ Object
#working_memory ⇒ Object

Structured working memory for this session (CoALA working memory), parallel to the message checkpoint.

Constructor Details

#initialize(user_id:, session_id: DEFAULT_SESSION_ID, checkpoint: nil, long_term: nil, long_term_type: nil, retrieval_engine: nil, working_memory: nil, episodic: nil, procedural: nil, api_key: nil) ⇒ `Memory`

Returns a new instance of Memory.

# File 'lib/llmemory/memory.rb', line 13

# Wires up a memory facade for one user/session pair.
#
# Collaborators that are passed in are used as-is. The checkpoint, the
# long-term store and the retrieval engine are built here when omitted;
# working, episodic and procedural memories are only stored (possibly nil).
#
# @param user_id [Object] user identifier, also handed to the default checkpoint
# @param session_id [Object] session identifier (defaults to DEFAULT_SESSION_ID)
# @param checkpoint [Object, nil] short-term state store; a ShortTerm::Checkpoint is built when nil
# @param long_term [Object, nil] long-term store; build_long_term(type) is used when nil
# @param long_term_type [Object, nil] store type; falls back to the configured
#   long_term_type and finally to :file_based
# @param retrieval_engine [Object, nil] a Retrieval::Engine over the long-term store is built when nil
# @param working_memory [Object, nil] stored as given
# @param episodic [Object, nil] stored as given
# @param procedural [Object, nil] stored as given
# @param api_key [Object, nil] when its string form is non-empty, an LLM client is created with it
def initialize(user_id:, session_id: DEFAULT_SESSION_ID, checkpoint: nil, long_term: nil, long_term_type: nil, retrieval_engine: nil, working_memory: nil, episodic: nil, procedural: nil, api_key: nil)
  @user_id, @session_id = user_id, session_id
  @checkpoint = checkpoint || ShortTerm::Checkpoint.new(user_id: user_id, session_id: session_id)
  @working_memory, @episodic, @procedural = working_memory, episodic, procedural

  # No LLM client at all when the key is nil or blank-as-string.
  key_missing = api_key.to_s.empty?
  @llm = key_missing ? nil : Llmemory::LLM.client(api_key: api_key)

  store_type = long_term_type || Llmemory.configuration.long_term_type || :file_based
  @long_term = long_term || build_long_term(store_type)
  @retrieval_engine = retrieval_engine || Retrieval::Engine.new(@long_term, llm: @llm)
end

Instance Method Details

#add_message(role:, content:) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 76

# Appends one message to the session history and persists the result.
#
# The flush-related state returned by preserved_flush_state is written back
# alongside the messages.
#
# @param role [#to_sym] speaker role; stored as a Symbol
# @param content [#to_s] message body; stored as a String
# @return [true]
def add_message(role:, content:)
  history = messages
  history << {
    role: role.to_sym,
    content: content.to_s
  }
  save_state(messages: history, **preserved_flush_state)
  true
end

#check_context_window! ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 204

# Runs context-window housekeeping for the current session.
#
# With a non-empty history: consolidates when the auto-consolidation check
# passes and memory flushing is enabled in the configuration, then compacts
# when the compaction check passes.
#
# @return [Boolean, Object] false for an empty history; true when a
#   consolidation ran; otherwise the result of #compact! (false when
#   compaction was not attempted)
def check_context_window!
  return false if messages.empty?

  flush_due = should_auto_consolidate? && Llmemory.configuration.memory_flush_enabled
  consolidate! if flush_due

  # Checked only after the flush step, keeping the flush-then-compact order.
  shrunk = should_compact? ? compact! : false

  flush_due ? true : shrunk
end

#clear_session! ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 136

# Clears the state held by this session's checkpoint.
#
# @return [true] always, once the checkpoint call has returned
def clear_session!
  @checkpoint.clear_state
  true
end

#compact!(max_bytes: nil) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 141

# Shrinks the session history by replacing its older part with a summary.
#
# Steps, in order: measure the history; run the pre-compaction memory flush;
# split the history into an old and a recent part; summarise the old part into
# a single :system message; save the summary plus the recent messages together
# with the compaction and flush timestamps.
#
# @param max_bytes [Integer, nil] byte budget; the configured compact_max_bytes
#   is used when nil
# @return [Boolean] false when the history already fits the budget or the split
#   yields no old messages; true once the compacted history has been saved
def compact!(max_bytes: nil)
  budget = max_bytes || Llmemory.configuration.compact_max_bytes
  history = messages
  return false if messages_byte_size(history) <= budget

  # The flush is handed the full, not-yet-split history.
  did_flush = flush_memory_before_compaction!(history)

  stale, fresh = split_messages_by_bytes(history, budget)
  return false if stale.empty?

  digest = { role: :system, content: summarize_messages(stale) }
  rebuilt = [digest] + fresh

  prior = restore_state_for_save
  flushed_at =
    if did_flush
      Time.now
    else
      # Keep the previously stored flush time, whichever key style it uses.
      prior[:last_flush_at] || prior["last_flush_at"]
    end

  save_state(messages: rebuilt, last_compact_at: Time.now, last_flush_at: flushed_at)
  true
end

#consolidate! ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 128

# Writes the current session history into the long-term store.
#
# Each message is rendered with format_message, the lines are joined with
# newlines, and the resulting text is passed to the long-term store's
# memorize. Nothing is written for an empty history.
#
# @return [true]
def consolidate!
  history = messages
  unless history.empty?
    transcript = history.map { |entry| format_message(entry) }.join("\n")
    @long_term.memorize(transcript)
  end
  true
end

#context_tokens ⇒ `Object`



169
170
171

# File 'lib/llmemory/memory.rb', line 169

# Token estimate for the current session history.
#
# @return [Object] whatever estimated_tokens returns for the current messages
def context_tokens
  history = messages
  estimated_tokens(history)
end

#episodic ⇒ `Object`

Episodic long-term memory (CoALA): records and retrieves agent trajectories. Additive — coexists with the semantic store (file/graph). Lazily built.



34
35
36

# File 'lib/llmemory/memory.rb', line 34

# Episodic long-term memory (CoALA): records and retrieves agent trajectories.
# Built on first use for this user and then reused; an instance supplied
# earlier is returned as-is.
#
# @return [Object] the memoized episodic memory
def episodic
  return @episodic if @episodic

  @episodic = LongTerm::Episodic::Memory.new(user_id: @user_id)
end

#last_user_message ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 107

# Content of the most recent message whose role is "user".
#
# Roles and contents are looked up under both Symbol and String keys.
#
# @return [String] the content converted with to_s, or "" when the history
#   holds no user message
def last_user_message
  latest = messages.reverse_each.find do |entry|
    (entry[:role] || entry["role"]).to_s == "user"
  end
  return "" unless latest

  (latest[:content] || latest["content"]).to_s
end

#maintain!(**opts) ⇒ `Object`

Cognitive maintenance pass: consolidate -> reflect -> mine skills -> expire, in one step, closing the CoALA learning loop. Each step is isolated; a failure in one is captured in the report and never aborts the others.

# File 'lib/llmemory/memory.rb', line 68

# Cognitive maintenance pass (consolidate -> reflect -> mine skills -> expire)
# in one step. This method only delegates to Maintenance::CognitivePass.run!,
# handing it this memory, its episodic/procedural/semantic stores and the LLM.
#
# @param opts [Hash] extra keyword options forwarded to the pass; keys that
#   collide with the collaborators below take precedence
# @return [Object] whatever Maintenance::CognitivePass.run! returns
def maintain!(**opts)
  collaborators = {
    memory: self,
    episodic: episodic,
    procedural: procedural,
    semantic: @long_term,
    llm: @llm
  }
  Maintenance::CognitivePass.run!(@user_id, **collaborators, **opts)
end

#maybe_flush_memory! ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 160

# Consolidates the session into long-term memory once it is large enough.
#
# Does nothing when memory flushing is disabled, the history is empty, or the
# estimated token count is below the configured memory_flush_threshold_tokens.
#
# @return [Boolean, Object] false when no flush happened, otherwise the result
#   of #consolidate!
def maybe_flush_memory!
  return false unless Llmemory.configuration.memory_flush_enabled

  history = messages
  return false if history.empty?

  used = estimated_tokens(history)
  used < Llmemory.configuration.memory_flush_threshold_tokens ? false : consolidate!
end

#messages ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 83

# Messages currently stored in the session checkpoint.
#
# The list is read from the restored state under STATE_KEY_MESSAGES (Symbol or
# String form), copied, and passed through sanitize_messages.
#
# @return [Array, Object] [] when the restored state is not a Hash; otherwise
#   the result of sanitize_messages (given [] when no Array is stored)
def messages
  snapshot = @checkpoint.restore_state
  return [] unless snapshot.is_a?(Hash)

  stored = snapshot[STATE_KEY_MESSAGES] || snapshot[STATE_KEY_MESSAGES.to_s]
  # Hand the sanitiser a copy rather than the restored array itself.
  working_copy = stored.is_a?(Array) ? stored.dup : []
  sanitize_messages(working_copy)
end

#mine_skills!(window: SkillMining::Miner::DEFAULT_WINDOW, outcomes: nil, auto_register: false) ⇒ `Object`

Mines recent episodes for reusable skills (Voyager-style). Human-in-the-loop by default: returns skill proposals and writes nothing. With `auto_register: true`, registers them in procedural memory (with provenance back to the source episodes) and returns the new skill ids.

# File 'lib/llmemory/memory.rb', line 60

# Mines recent episodes for reusable skills (Voyager-style) by delegating to a
# SkillMining::Miner built from this memory's episodic and procedural stores
# and its LLM.
#
# @param window [Object] forwarded to the miner (defaults to SkillMining::Miner::DEFAULT_WINDOW)
# @param outcomes [Object, nil] forwarded to the miner
# @param auto_register [Boolean] forwarded to the miner
# @return [Object] whatever the miner's #mine returns
def mine_skills!(window: SkillMining::Miner::DEFAULT_WINDOW, outcomes: nil, auto_register: false)
  miner = SkillMining::Miner.new(episodic: episodic, procedural: procedural, llm: @llm)
  miner.mine(window: window, outcomes: outcomes, auto_register: auto_register)
end

#procedural ⇒ `Object`

Procedural long-term memory (Voyager-style skill library). Lazily built.



39
40
41

# File 'lib/llmemory/memory.rb', line 39

# Procedural long-term memory (Voyager-style skill library).
# Built on first use for this user and then reused; an instance supplied
# earlier is returned as-is.
#
# @return [Object] the memoized procedural memory
def procedural
  return @procedural if @procedural

  @procedural = LongTerm::Procedural::Memory.new(user_id: @user_id)
end

#prune!(mode: nil) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 113

# Prunes tool results from the session history and saves the outcome.
#
# Skipped when pruning is disabled in the configuration or the history is
# empty. The pruner is created with the configured prune_tool_results_max_bytes
# as its soft-trim limit.
#
# @param mode [Object, nil] pruning mode; the configured
#   prune_tool_results_mode is used when nil
# @return [Boolean] false when skipped, true after the pruned history is saved
def prune!(mode: nil)
  return false unless Llmemory.configuration.prune_tool_results_enabled

  history = messages
  return false if history.empty?

  effective_mode = mode || Llmemory.configuration.prune_tool_results_mode
  byte_cap = Llmemory.configuration.prune_tool_results_max_bytes
  trimmed = ShortTerm::Pruner.new(soft_trim_max_bytes: byte_cap).prune!(history, mode: effective_mode)

  save_state(messages: trimmed, **preserved_flush_state)
  true
end

#reason(template:, into: Actions::Reason::DEFAULT_SLOT, parse: nil) ⇒ `Object`

Reasoning action: render a prompt from working memory, call the LLM, write the result back. Composable; does not touch long-term memory.



52
53
54

# File 'lib/llmemory/memory.rb', line 52

# Reasoning action: render a prompt from working memory, call the LLM, write
# the result back. This method delegates to Actions::Reason.call with this
# session's working memory and LLM.
#
# @param template [Object] forwarded to the action
# @param into [Object] forwarded to the action (defaults to Actions::Reason::DEFAULT_SLOT)
# @param parse [Object, nil] forwarded to the action
# @return [Object] whatever Actions::Reason.call returns
def reason(template:, into: Actions::Reason::DEFAULT_SLOT, parse: nil)
  Actions::Reason.call(
    working_memory: working_memory,
    template: template,
    into: into,
    parse: parse,
    llm: @llm
  )
end

#recall_for(query: nil, max_tokens: nil) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 98

# Automatic recall: retrieves context for a query, falling back to the last
# user message when no query is given.
#
# @param query [Object, nil] explicit query; #last_user_message is used when nil
# @param max_tokens [Object, nil] forwarded to #retrieve
# @return [String, Object] "" when auto-recall is disabled or the effective
#   query is blank; otherwise the result of #retrieve
def recall_for(query: nil, max_tokens: nil)
  return "" unless Llmemory.configuration.auto_recall_enabled

  needle = query || last_user_message
  needle.to_s.strip.empty? ? "" : retrieve(needle, max_tokens: max_tokens)
end

#reflect!(window: 10, category: "insights") ⇒ `Object`

Reflects over recent episodes and writes distilled insights to the semantic store (file/graph) with provenance back to source episodes.

# File 'lib/llmemory/memory.rb', line 45

# Reflects over recent episodes and writes distilled insights to the semantic
# store. This method delegates to a Reflection::Reflector built from the
# episodic memory, the long-term store and the LLM.
#
# @param window [Object] forwarded to the reflector (default 10)
# @param category [Object] forwarded to the reflector (default "insights")
# @return [Object] whatever the reflector's #reflect returns
def reflect!(window: 10, category: "insights")
  reflector = Reflection::Reflector.new(episodic: episodic, semantic: @long_term, llm: @llm)
  reflector.reflect(window: window, category: category)
end

#retrieve(query, max_tokens: nil) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 91

# Builds the combined context for a query: the formatted short-term history
# plus whatever the retrieval engine returns for inference.
#
# @param query [Object] passed to the retrieval engine
# @param max_tokens [Object, nil] passed to the retrieval engine
# @return [Object] the result of combine_contexts(short, long)
def retrieve(query, max_tokens: nil)
  recent = format_short_term_context(pruned_messages)
  remembered = @retrieval_engine.retrieve_for_inference(
    query,
    user_id: @user_id,
    max_tokens: max_tokens
  )
  combine_contexts(recent, remembered)
end

#should_auto_consolidate? ⇒ `Boolean`

Returns:

(Boolean)

# File 'lib/llmemory/memory.rb', line 173

# Whether the session has grown enough to trigger automatic consolidation.
#
# The threshold is the configured context_window_tokens minus reserve_tokens.
#
# @return [Boolean] true when the current context token count reaches the threshold
def should_auto_consolidate?
  context_tokens >= (Llmemory.configuration.context_window_tokens - Llmemory.configuration.reserve_tokens)
end

#should_compact? ⇒ `Boolean`

Returns:

(Boolean)

# File 'lib/llmemory/memory.rb', line 179

# Whether the session history is due for compaction.
#
# The threshold is the configured context_window_tokens minus reserve_tokens.
#
# @return [Boolean] true when the current context token count reaches the threshold
def should_compact?
  used = context_tokens
  window = Llmemory.configuration.context_window_tokens
  reserve = Llmemory.configuration.reserve_tokens
  used >= window - reserve
end

#user_id ⇒ `Object`



221
222
223

# File 'lib/llmemory/memory.rb', line 221

# Identifier of the user this memory belongs to, as given to the constructor.
#
# @return [Object] the stored user id
def user_id
  @user_id
end

#with_overflow_recovery(max_retries: 2, &block) ⇒ `Object`

# File 'lib/llmemory/memory.rb', line 185

# Runs the block, and on an LLM error that looks like a context overflow
# shrinks the session history and tries again.
#
# Recovery is attempted only when overflow recovery is enabled in the
# configuration. An error counts as an overflow when its lower-cased message
# contains "context", "token", "overflow" or "limit". Before each retry the
# history is pruned (if tool-result pruning is enabled) and compacted.
#
# @param max_retries [Integer] maximum number of retries after the first attempt
# @yield the LLM call to protect
# @return [Object] the block's return value
# @raise [LocalJumpError] when called without a block
# @raise [Llmemory::LLMError] re-raised when the error is not an overflow or
#   the retries are exhausted
def with_overflow_recovery(max_retries: 2, &block)
  # A missing block used to surface as an anonymous "no block given (yield)"
  # from inside this method; raise the same class up front with a clear message.
  raise LocalJumpError, "with_overflow_recovery requires a block" unless block_given?
  return yield unless Llmemory.configuration.overflow_recovery_enabled

  attempts = 0
  begin
    yield
  rescue Llmemory::LLMError => e
    text = e.message.to_s.downcase
    # NOTE(review): plain substring matching is broad; "limit" and "token" may
    # also match errors that are not context overflows. Confirm against the
    # messages the LLM client actually raises.
    overflow = %w[context token overflow limit].any? { |hint| text.include?(hint) }
    raise unless overflow && attempts < max_retries

    prune! if Llmemory.configuration.prune_tool_results_enabled
    compact!
    attempts += 1
    retry
  end
end

#working_memory ⇒ `Object`

Structured working memory for this session (CoALA working memory), parallel to the message checkpoint. Lazily built.



28
29
30

# File 'lib/llmemory/memory.rb', line 28

# Structured working memory for this session (CoALA working memory), parallel
# to the message checkpoint. Built on first use for this user and session and
# then reused; an instance supplied earlier is returned as-is.
#
# @return [Object] the memoized working memory
def working_memory
  return @working_memory if @working_memory

  @working_memory = WorkingMemory.new(user_id: @user_id, session_id: @session_id)
end

Class: Llmemory::Memory

Constant Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(user_id:, session_id: DEFAULT_SESSION_ID, checkpoint: nil, long_term: nil, long_term_type: nil, retrieval_engine: nil, working_memory: nil, episodic: nil, procedural: nil, api_key: nil) ⇒ Memory

Instance Method Details

#add_message(role:, content:) ⇒ Object

#check_context_window! ⇒ Object

#clear_session! ⇒ Object

#compact!(max_bytes: nil) ⇒ Object

#consolidate! ⇒ Object

#context_tokens ⇒ Object

#episodic ⇒ Object

#last_user_message ⇒ Object

#maintain!(**opts) ⇒ Object

#maybe_flush_memory! ⇒ Object

#messages ⇒ Object

#mine_skills!(window: SkillMining::Miner::DEFAULT_WINDOW, outcomes: nil, auto_register: false) ⇒ Object

#procedural ⇒ Object

#prune!(mode: nil) ⇒ Object

#reason(template:, into: Actions::Reason::DEFAULT_SLOT, parse: nil) ⇒ Object

#recall_for(query: nil, max_tokens: nil) ⇒ Object

#reflect!(window: 10, category: "insights") ⇒ Object

#retrieve(query, max_tokens: nil) ⇒ Object

#should_auto_consolidate? ⇒ Boolean

#should_compact? ⇒ Boolean

#user_id ⇒ Object

#with_overflow_recovery(max_retries: 2, &block) ⇒ Object

#working_memory ⇒ Object