Class: Toy::LLM::Recipes::LoRAMetal

Inherits:

Object

Object
Toy::LLM::Recipes::LoRAMetal

show all

Defined in: lib/toy/llm/recipes/lora_metal.rb

Overview

The LoRAMetal fine-tune recipe. realize! builds the frozen-base + LoRAMetal-Q-adapter forward+CE+backward+AdamW graph on a Toy::LLM::Engine::LlamaSeqEngineMetal (base weights mmap’d from the GGUF, only the rank-r adapters + Adam moments are trainable), then step! drives one training step. The caller (fixture) owns the loaded GGUF handle, the experiment config, and the per-step input Mats.

Instance Attribute Summary collapse

#lora_cache ⇒ Object

Returns the value of attribute lora_cache.
#lora_step_index ⇒ Object

Returns the value of attribute lora_step_index.
#lora_t_hp ⇒ Object

Returns the value of attribute lora_t_hp.
#lora_t_labels ⇒ Object

Returns the value of attribute lora_t_labels.
#lora_t_loss ⇒ Object

Returns the value of attribute lora_t_loss.

Instance Method Summary collapse

#initialize ⇒ LoRAMetal constructor

A new instance of LoRAMetal.
#realize!(gguf_handle, cfg, rank, opts) ⇒ Object

Realize the LoRAMetal graph.
#step!(seq_ids, positions, m_labels, m_hp, is_first) ⇒ Object

ONE training step.

Constructor Details

#initialize ⇒ `LoRAMetal`

Returns a new instance of LoRAMetal.

# File 'lib/toy/llm/recipes/lora_metal.rb', line 54

def initialize
  @lora_cache      = Toy::LLM::Engine::LlamaSeqEngineMetal.new
  @lora_t_loss     = nil
  @lora_t_labels   = nil
  @lora_t_hp       = nil
  @lora_step_index = 0
end

Instance Attribute Details

#lora_cache ⇒ `Object`

Returns the value of attribute lora_cache.



52
53
54

# File 'lib/toy/llm/recipes/lora_metal.rb', line 52

def lora_cache
  @lora_cache
end

#lora_step_index ⇒ `Object`

Returns the value of attribute lora_step_index.



52
53
54

# File 'lib/toy/llm/recipes/lora_metal.rb', line 52

def lora_step_index
  @lora_step_index
end

#lora_t_hp ⇒ `Object`

Returns the value of attribute lora_t_hp.



52
53
54

# File 'lib/toy/llm/recipes/lora_metal.rb', line 52

def lora_t_hp
  @lora_t_hp
end

#lora_t_labels ⇒ `Object`

Returns the value of attribute lora_t_labels.



52
53
54

# File 'lib/toy/llm/recipes/lora_metal.rb', line 52

def lora_t_labels
  @lora_t_labels
end

#lora_t_loss ⇒ `Object`

Returns the value of attribute lora_t_loss.



52
53
54

# File 'lib/toy/llm/recipes/lora_metal.rb', line 52

def lora_t_loss
  @lora_t_loss
end

Instance Method Details

#realize!(gguf_handle, cfg, rank, opts) ⇒ `Object`

Realize the LoRAMetal graph. Delegates VERBATIM to the cache in the reference’s order (03_finetune_lora.rb:67-76): enable_lora_q!(rank) + enable_lora_q_adamw! (set the two flags BEFORE realize), then realize_for_mmap (mmap the frozen base in place), then the seeded upload_lora_q_init!(seed, init_scale) (deterministic adapter init), then build_training_step (forward + CE + backward + opt_step_adamw on the adapters baked into the ggml graph). Stashes the returned [t_loss, t_labels, t_hp] triple. `opts` is a Toy::LLM::RecipeOptions (toy#64 item 1); the lora mmap path consumes its t_seq / untied / qkv_bias / seed / init_scale (NO t_batch / weight_dtype knob on realize_for_mmap). `rank` is lora-specific so it stays a leading positional. Unpacked in the engine’s exact positional order, so the realize is byte-identical. Returns nil.

# File 'lib/toy/llm/recipes/lora_metal.rb', line 75

def realize!(gguf_handle, cfg, rank, opts)
  @lora_cache.enable_lora_q!(rank)
  @lora_cache.enable_lora_q_adamw!
  @lora_cache.realize_for_mmap(gguf_handle, cfg, opts.t_seq,
                               opts.untied, opts.qkv_bias)
  @lora_cache.upload_lora_q_init!(opts.seed, opts.init_scale)
  result         = @lora_cache.build_training_step
  @lora_t_loss   = result[0]
  @lora_t_labels = result[1]
  @lora_t_hp     = result[2]
  nil
end

#step!(seq_ids, positions, m_labels, m_hp, is_first) ⇒ `Object`

ONE training step. Op order is VERBATIM from 03_finetune_lora.rb:179-191 (and LITERALLY IDENTICAL to FromScratch#step!): graph_reset on the first step else reset_grads_only; the four uploads in order (token_ids/positions/labels/hp); compute_backward; download_row_major(t_loss, 1, 1). is_first selects the reset; the step index (lora_step_index) is NOT used for the reset decision, so the caller stays in full control of the step==first branch. Returns the loss Float. Per-step input Mats (including the bias-corrected hp row) are built by the caller.

# File 'lib/toy/llm/recipes/lora_metal.rb', line 98

def step!(seq_ids, positions, m_labels, m_hp, is_first)
  s = @lora_cache.sess
  if is_first
    TinyNNMetal.tnn_graph_reset(s)
  else
    TinyNNMetal.tnn_graph_reset_grads_only(s)
  end
  TinyNNMetal.upload_int_array(s, @lora_cache.t_seq_token_ids, seq_ids)
  TinyNNMetal.upload_int_array(s, @lora_cache.t_seq_positions, positions)
  TinyNNMetal.upload_row_major(s, @lora_t_labels, m_labels)
  TinyNNMetal.upload_row_major(s, @lora_t_hp,     m_hp)
  TinyNNMetal.tnn_compute_backward(s)
  loss_mat = TinyNNMetal.download_row_major(s, @lora_t_loss, 1, 1)
  loss_mat.flat[0]
end

Class: Toy::LLM::Recipes::LoRAMetal

Overview

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize ⇒ LoRAMetal

Instance Attribute Details

#lora_cache ⇒ Object

#lora_step_index ⇒ Object

#lora_t_hp ⇒ Object

#lora_t_labels ⇒ Object

#lora_t_loss ⇒ Object