Module: Legion::LLM::Discovery

Extended by:
Legion::Logging::Helper
Defined in:
lib/legion/llm/discovery.rb,
lib/legion/llm/discovery/system.rb,
lib/legion/llm/discovery/memory_gate.rb,
lib/legion/llm/discovery/rule_generator.rb

Defined Under Namespace

Modules: MemoryGate, RuleGenerator, System

Constant Summary collapse

EMBEDDING_TIER_ORDER =
%w[local direct fleet openai_compat cloud frontier].freeze

Class Attribute Summary collapse

Class Method Summary collapse

Class Attribute Details

.embedding_fallback_chain ⇒ Object (readonly)

Returns the value of attribute embedding_fallback_chain.



23
24
25
# File 'lib/legion/llm/discovery.rb', line 23

# Reader for @embedding_fallback_chain.
#
# detect_embedding_capability stores the result of
# build_embedding_fallback_chain here when a provider is found, and an empty
# array when none is found or detection raises. reset! sets it back to nil.
# NOTE(review): detect_embedding_from_registry may also assign it on a
# registry hit — confirm against that method.
def embedding_fallback_chain
  @embedding_fallback_chain
end

.embedding_instance ⇒ Object (readonly)

Returns the value of attribute embedding_instance.



23
24
25
# File 'lib/legion/llm/discovery.rb', line 23

# Reader for @embedding_instance.
#
# In the methods listed for this module the variable is only ever cleared
# (set to nil by reset!).
# NOTE(review): presumably assigned by detect_embedding_from_registry —
# confirm against that method.
def embedding_instance
  @embedding_instance
end

.embedding_model ⇒ Object (readonly)

Returns the value of attribute embedding_model.



23
24
25
# File 'lib/legion/llm/discovery.rb', line 23

# Reader for @embedding_model.
#
# detect_embedding_capability sets it to the :model entry of the provider it
# found; reset! sets it back to nil. It is not cleared when a later detection
# finds no provider or raises.
def embedding_model
  @embedding_model
end

.embedding_provider ⇒ Object (readonly)

Returns the value of attribute embedding_provider.



23
24
25
# File 'lib/legion/llm/discovery.rb', line 23

# Reader for @embedding_provider.
#
# detect_embedding_capability sets it to the :provider entry of the provider
# it found; reset! sets it back to nil. It is not cleared when a later
# detection finds no provider or raises.
def embedding_provider
  @embedding_provider
end

Class Method Details

.can_embed? ⇒ Boolean

Returns:

  • (Boolean)


25
26
27
# File 'lib/legion/llm/discovery.rb', line 25

# Reports whether embedding detection has positively succeeded.
#
# @return [Boolean] true only when @can_embed is exactly `true`; nil (never
#   detected, or cleared by reset!) and false both answer false.
def can_embed?
  @can_embed.equal?(true)
end

.detect_embedding_capability ⇒ Object



43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
# File 'lib/legion/llm/discovery.rb', line 43

# Works out whether an embedding provider is usable and records the outcome
# in @can_embed, @embedding_provider, @embedding_model and
# @embedding_fallback_chain.
#
# The registry is asked first (detect_embedding_from_registry); when it
# reports a hit nothing further happens here. Otherwise the embedding
# settings are searched with find_embedding_provider. Any StandardError is
# handed to handle_exception at :warn level and embedding is marked
# unavailable.
#
# NOTE(review): on the "not found" and error paths @embedding_provider and
# @embedding_model are left untouched, so the readers can still return values
# from an earlier successful detection — confirm that is intended.
def detect_embedding_capability
  log.debug '[llm][discovery] action=detect_embedding_capability.enter'

  if detect_embedding_from_registry
    log.debug '[llm][discovery] action=detect_embedding_capability registry_hit=true'
    return
  end

  settings = embedding_settings
  selection = find_embedding_provider(settings)
  unless selection
    # Nothing usable: record the negative result with an empty chain.
    @can_embed = false
    @embedding_fallback_chain = []
    return log.info('[llm][discovery] no embedding provider available')
  end

  @can_embed = true
  @embedding_provider = selection[:provider]
  @embedding_model = selection[:model]
  @embedding_fallback_chain = build_embedding_fallback_chain(settings)
  log.info "[llm][discovery] embedding available provider=#{@embedding_provider} model=#{@embedding_model}"
rescue StandardError => e
  @can_embed = false
  @embedding_fallback_chain = []
  handle_exception(e, level: :warn, operation: 'llm.discovery.detect_embedding_capability')
end

.discovered_instances ⇒ Object

Returns discovered instances grouped by provider for RuleGenerator compatibility. Each provider maps to a hash of instance_id => { models: […], base_url: … }; models discovered without an instance are grouped under :default.



72
73
74
75
76
77
78
79
80
81
82
83
# File 'lib/legion/llm/discovery.rb', line 72

# Groups the flat discovered-model list by provider and then by instance.
#
# Models whose :instance is nil (or false) are filed under :default. Each
# instance bucket is a hash with a :models array holding the result of
# normalize_model_for_rules for every model in that bucket, in discovery
# order.
#
# @return [Hash] provider => { instance => { models: [...] } }
def discovered_instances
  discovered_models.each_with_object({}) do |entry, grouped|
    by_instance = (grouped[entry[:provider]] ||= {})
    bucket = (by_instance[entry[:instance] || :default] ||= { models: [] })
    bucket[:models] << normalize_model_for_rules(entry)
  end
end

.discovered_models ⇒ Object

Flat list of all discovered models across all registry adapters. TTL-cached; call refresh_discovered_models! to force a refresh.



87
88
89
90
91
92
# File 'lib/legion/llm/discovery.rb', line 87

# Flat list of every discovered model, served from the cache when possible.
#
# A refresh is triggered when there is no cache yet or when
# discovered_models_stale? reports the cache as stale. If the refresh leaves
# the cache unset, an empty array is returned instead of nil.
#
# @return [Array] the cached model list, or [] when nothing is cached
def discovered_models
  refresh_discovered_models! if !@discovered_models_cache || discovered_models_stale?
  @discovered_models_cache || []
end

.model_available?(model, provider: nil, instance: nil) ⇒ Boolean

Check whether a specific model is available from any registered provider.

Returns:

  • (Boolean)


95
96
97
98
99
100
101
102
103
# File 'lib/legion/llm/discovery.rb', line 95

# Check whether a specific model is available from any registered provider.
#
# Entries discovered without an instance are treated as belonging to the
# :default instance — the same bucket discovered_instances files them under —
# so a lookup with `instance: :default` finds them.
#
# @param model [Object] model name; compared to each entry via name_matches?
# @param provider [#to_sym, nil] restrict to this provider; nil matches any
# @param instance [#to_sym, nil] restrict to this instance; nil matches any
# @return [Boolean] true when at least one discovered model satisfies every
#   given filter
def model_available?(model, provider: nil, instance: nil)
  psym = provider&.to_sym
  isym = instance&.to_sym
  discovered_models.any? do |m|
    name_matches?(m[:model], model) &&
      (psym.nil? || m[:provider] == psym) &&
      (isym.nil? || (m[:instance] || :default) == isym)
  end
end

.model_size(model, provider: nil, instance: nil) ⇒ Object

Return the size in bytes for a discovered model, or nil if unknown.



106
107
108
109
110
111
112
113
114
115
# File 'lib/legion/llm/discovery.rb', line 106

# Return the size in bytes for a discovered model, or nil if unknown.
#
# The first discovered entry satisfying every given filter is used. Entries
# discovered without an instance are treated as belonging to the :default
# instance — the same bucket discovered_instances files them under — so a
# lookup with `instance: :default` finds them.
#
# @param model [Object] model name; compared to each entry via name_matches?
# @param provider [#to_sym, nil] restrict to this provider; nil matches any
# @param instance [#to_sym, nil] restrict to this instance; nil matches any
# @return [Object, nil] the entry's :size_bytes value, or nil when no entry
#   matches or the matching entry has no size
def model_size(model, provider: nil, instance: nil)
  psym = provider&.to_sym
  isym = instance&.to_sym
  entry = discovered_models.find do |m|
    name_matches?(m[:model], model) &&
      (psym.nil? || m[:provider] == psym) &&
      (isym.nil? || (m[:instance] || :default) == isym)
  end
  entry&.dig(:size_bytes)
end

.refresh_discovered_models! ⇒ Object



117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
# File 'lib/legion/llm/discovery.rb', line 117

# Rebuilds the discovered-model cache from every adapter in Call::Registry.
#
# Does nothing (beyond the entry log line) when Call::Registry is not
# defined. Registry entries whose adapter does not respond to :offerings are
# skipped. A StandardError raised while reading one adapter's offerings is
# passed to handle_exception at :debug level and that adapter contributes no
# models; the other adapters are still processed. On completion the cache and
# its timestamp (@discovered_models_at) are replaced.
def refresh_discovered_models!
  log.debug '[llm][discovery] action=refresh_discovered_models'
  return unless defined?(Call::Registry)

  collected = []
  Call::Registry.all_instances.each do |registration|
    source = registration[:adapter]
    next unless source.respond_to?(:offerings)

    rows = begin
      Array(source.offerings).map do |item|
        {
          # First present of id / name / model, always stringified.
          model:           (item[:id] || item[:name] || item[:model]).to_s,
          provider:        registration[:provider],
          instance:        registration[:instance],
          tier:            registration.dig(:metadata, :tier),
          size_bytes:      item[:size_bytes] || item[:size],
          capabilities:    item[:capabilities] || [],
          context_length:  item[:context_length] || item[:max_model_len],
          parameter_count: item[:parameter_count]
        }
      end
    rescue StandardError => e
      handle_exception(e, level:     :debug,
                          operation: "discovery.offerings.#{registration[:provider]}/#{registration[:instance]}")
      []
    end
    collected.concat(rows)
  end

  @discovered_models_cache = collected
  @discovered_models_at = Time.now
  log.debug "[llm][discovery] action=refresh_discovered_models count=#{collected.size}"
end

.reset! ⇒ Object



150
151
152
153
154
155
156
157
158
159
# File 'lib/legion/llm/discovery.rb', line 150

# Forgets everything discovery has learned: the embedding detection result
# (flag, provider, model, instance, fallback chain) and the discovered-model
# cache with its timestamp are all set back to nil.
#
# @return [nil]
def reset!
  log.debug '[llm][discovery] reset'
  @can_embed = @embedding_provider = @embedding_model = nil
  @embedding_instance = @embedding_fallback_chain = nil
  @discovered_models_cache = @discovered_models_at = nil
end

.run ⇒ Object



29
30
31
32
33
34
35
36
37
38
39
40
41
# File 'lib/legion/llm/discovery.rb', line 29

# Runs one discovery pass: refreshes system information when
# discovery_enabled? says so, rebuilds the discovered-model cache, and logs
# the model list plus the total/available memory reported by System.
#
# Any StandardError is handed to handle_exception at :warn level rather than
# propagated.
def run
  log.debug '[llm][discovery] run.enter'
  System.refresh! if discovery_enabled?

  refresh_discovered_models!
  catalog = discovered_models
  names = catalog.map { |entry| entry[:model] }.join(', ')
  log.info "[llm][discovery] model_count=#{catalog.size} models=#{names}"

  total_mb = System.total_memory_mb
  available_mb = System.available_memory_mb
  log.info "[llm][discovery] system total_mb=#{total_mb} available_mb=#{available_mb}"
rescue StandardError => e
  handle_exception(e, level: :warn, operation: 'llm.discovery.run')
end