Class: LlamaCpp::LlamaContextParams

Inherits:

Object

Object
LlamaCpp::LlamaContextParams

show all

Defined in: ext/llama_cpp/llama_cpp.c

Overview

“struct llama_context_params” wrapper class

Instance Method Summary collapse

#attention_type ⇒ Integer
#attention_type=(attention_type) ⇒ Integer
#defrag_thold ⇒ Float
#defrag_thold=(defrag_thold) ⇒ Float
#embeddings ⇒ Boolean
#embeddings=(embeddings) ⇒ Boolean
#flash_attn_type ⇒ Integer
#flash_attn_type=(flash_attn_type) ⇒ Integer
#kv_unified ⇒ Boolean
#kv_unified=(kv_unified) ⇒ Boolean
#n_batch ⇒ Integer
#n_batch=(n_batch) ⇒ Integer
#n_ctx ⇒ Integer
#n_ctx=(n_ctx) ⇒ Integer
#n_seq_max ⇒ Integer
#n_seq_max=(n_seq_max) ⇒ Integer
#n_threads ⇒ Integer
#n_threads=(n_threads) ⇒ Integer
#n_threads_batch ⇒ Integer
#n_threads_batch=(n_threads_batch) ⇒ Integer
#n_ubatch ⇒ Integer
#n_ubatch=(n_ubatch) ⇒ Integer
#no_perf ⇒ Boolean
#no_perf=(no_perf) ⇒ Boolean
#offload_kqv ⇒ Boolean
#offload_kqv=(offload_kqv) ⇒ Boolean
#op_offload ⇒ Boolean
#op_offload=(op_offload) ⇒ Boolean
#pooling_type ⇒ Integer
#pooling_type=(pooling_type) ⇒ Integer
#rope_freq_base ⇒ Float
#rope_freq_base=(rope_freq_base) ⇒ Float
#rope_freq_scale ⇒ Float
#rope_freq_scale=(rope_freq_scale) ⇒ Float
#rope_scaling_type ⇒ Integer
#rope_scaling_type=(rope_scaling_type) ⇒ Integer
#swa_full ⇒ Boolean
#swa_full=(swa_full) ⇒ Boolean
#type_k ⇒ Integer
#type_k=(type_k) ⇒ Integer
#type_v ⇒ Integer
#type_v=(type_v) ⇒ Integer
#yarn_attn_factor ⇒ Float
#yarn_attn_factor=(yarn_attn_factor) ⇒ Float
#yarn_beta_fast ⇒ Float
#yarn_beta_fast=(yarn_beta_fast) ⇒ Float
#yarn_beta_slow ⇒ Float
#yarn_beta_slow=(yarn_beta_slow) ⇒ Float
#yarn_ext_factor ⇒ Float
#yarn_ext_factor=(yarn_ext_factor) ⇒ Float
#yarn_orig_ctx ⇒ Integer
#yarn_orig_ctx=(yarn_orig_ctx) ⇒ Integer

Instance Method Details

#attention_type ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 699

/* Reader for `attention_type`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_attention_type(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int attention_type = (int)params->attention_type;
  return INT2NUM(attention_type);
}

#attention_type=(attention_type) ⇒ `Integer`

Parameters:

attention_type (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 704

/* Writer for `attention_type`: converts the argument with NUM2INT, stores it
 * as an `enum llama_attention_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_attention_type(VALUE self, VALUE attention_type) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(attention_type);
  params->attention_type = (enum llama_attention_type)raw;
  return attention_type;
}

#defrag_thold ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 798

/* Reader for `defrag_thold`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_defrag_thold(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double defrag_thold = params->defrag_thold;
  return DBL2NUM(defrag_thold);
}

#defrag_thold=(defrag_thold) ⇒ `Float`

Parameters:

defrag_thold (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 803

/* Writer for `defrag_thold`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_defrag_thold(VALUE self, VALUE defrag_thold) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(defrag_thold);
  params->defrag_thold = converted;
  return defrag_thold;
}

#embeddings ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 831

/* Reader for `embeddings`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_embeddings(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->embeddings) {
    return Qtrue;
  }
  return Qfalse;
}

#embeddings=(embeddings) ⇒ `Boolean`

Parameters:

embeddings (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 836

/* Writer for `embeddings`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_embeddings(VALUE self, VALUE embeddings) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(embeddings)) {
    params->embeddings = true;
  } else {
    params->embeddings = false;
  }
  return embeddings;
}

#flash_attn_type ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 710

/* Reader for `flash_attn_type`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_flash_attn_type(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int flash_attn_type = (int)params->flash_attn_type;
  return INT2NUM(flash_attn_type);
}

#flash_attn_type=(flash_attn_type) ⇒ `Integer`

Parameters:

flash_attn_type (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 715

/* Writer for `flash_attn_type`: converts the argument with NUM2INT, stores it
 * as an `enum llama_flash_attn_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_flash_attn_type(VALUE self, VALUE flash_attn_type) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(flash_attn_type);
  params->flash_attn_type = (enum llama_flash_attn_type)raw;
  return flash_attn_type;
}

#kv_unified ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 886

/* Reader for `kv_unified`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_kv_unified(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->kv_unified) {
    return Qtrue;
  }
  return Qfalse;
}

#kv_unified=(kv_unified) ⇒ `Boolean`

Parameters:

kv_unified (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 891

/* Writer for `kv_unified`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_kv_unified(VALUE self, VALUE kv_unified) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(kv_unified)) {
    params->kv_unified = true;
  } else {
    params->kv_unified = false;
  }
  return kv_unified;
}

#n_batch ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 622

/* Reader for `n_batch`: looks up the params struct behind `self`
 * and hands the field back through UINT2NUM. */
static VALUE llama_context_params_get_n_batch(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int n_batch = params->n_batch;
  return UINT2NUM(n_batch);
}

#n_batch=(n_batch) ⇒ `Integer`

Parameters:

n_batch (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 627

/* Writer for `n_batch`: converts the argument with NUM2UINT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_n_batch(VALUE self, VALUE n_batch) {
  struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int converted = NUM2UINT(n_batch);
  params->n_batch = converted;
  return n_batch;
}

#n_ctx ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 611

/* Reader for `n_ctx`: looks up the params struct behind `self`
 * and hands the field back through UINT2NUM. */
static VALUE llama_context_params_get_n_ctx(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int n_ctx = params->n_ctx;
  return UINT2NUM(n_ctx);
}

#n_ctx=(n_ctx) ⇒ `Integer`

Parameters:

n_ctx (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 616

/* Writer for `n_ctx`: converts the argument with NUM2UINT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_n_ctx(VALUE self, VALUE n_ctx) {
  struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int converted = NUM2UINT(n_ctx);
  params->n_ctx = converted;
  return n_ctx;
}

#n_seq_max ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 644

/* Reader for `n_seq_max`: looks up the params struct behind `self`
 * and hands the field back through UINT2NUM. */
static VALUE llama_context_params_get_n_seq_max(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int n_seq_max = params->n_seq_max;
  return UINT2NUM(n_seq_max);
}

#n_seq_max=(n_seq_max) ⇒ `Integer`

Parameters:

n_seq_max (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 649

/* Writer for `n_seq_max`: converts the argument with NUM2UINT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_n_seq_max(VALUE self, VALUE n_seq_max) {
  struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int converted = NUM2UINT(n_seq_max);
  params->n_seq_max = converted;
  return n_seq_max;
}

#n_threads ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 655

/* Reader for `n_threads`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_n_threads(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int n_threads = params->n_threads;
  return INT2NUM(n_threads);
}

#n_threads=(n_threads) ⇒ `Integer`

Parameters:

n_threads (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 660

/* Writer for `n_threads`: converts the argument with NUM2INT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_n_threads(VALUE self, VALUE n_threads) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int converted = NUM2INT(n_threads);
  params->n_threads = converted;
  return n_threads;
}

#n_threads_batch ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 666

/* Reader for `n_threads_batch`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_n_threads_batch(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int n_threads_batch = params->n_threads_batch;
  return INT2NUM(n_threads_batch);
}

#n_threads_batch=(n_threads_batch) ⇒ `Integer`

Parameters:

n_threads_batch (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 671

/*
 * Writer for `n_threads_batch`.
 *
 * Converts the argument with NUM2INT and stores it in the `n_threads_batch`
 * field of the params struct behind `self`, then returns the argument
 * unchanged.
 *
 * The assignment targets `n_threads_batch`, the same field the paired getter
 * reads. Writing to `n_threads` here would overwrite the value set through
 * `n_threads=` and leave `n_threads_batch` untouched.
 */
static VALUE llama_context_params_set_n_threads_batch(VALUE self, VALUE n_threads_batch) {
  struct llama_context_params* data = get_llama_context_params(self);
  data->n_threads_batch = NUM2INT(n_threads_batch);
  return n_threads_batch;
}

#n_ubatch ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 633

/* Reader for `n_ubatch`: looks up the params struct behind `self`
 * and hands the field back through UINT2NUM. */
static VALUE llama_context_params_get_n_ubatch(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int n_ubatch = params->n_ubatch;
  return UINT2NUM(n_ubatch);
}

#n_ubatch=(n_ubatch) ⇒ `Integer`

Parameters:

n_ubatch (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 638

/* Writer for `n_ubatch`: converts the argument with NUM2UINT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_n_ubatch(VALUE self, VALUE n_ubatch) {
  struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int converted = NUM2UINT(n_ubatch);
  params->n_ubatch = converted;
  return n_ubatch;
}

#no_perf ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 853

/* Reader for `no_perf`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_no_perf(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->no_perf) {
    return Qtrue;
  }
  return Qfalse;
}

#no_perf=(no_perf) ⇒ `Boolean`

Parameters:

no_perf (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 858

/* Writer for `no_perf`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_no_perf(VALUE self, VALUE no_perf) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(no_perf)) {
    params->no_perf = true;
  } else {
    params->no_perf = false;
  }
  return no_perf;
}

#offload_kqv ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 842

/* Reader for `offload_kqv`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_offload_kqv(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->offload_kqv) {
    return Qtrue;
  }
  return Qfalse;
}

#offload_kqv=(offload_kqv) ⇒ `Boolean`

Parameters:

offload_kqv (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 847

/* Writer for `offload_kqv`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_offload_kqv(VALUE self, VALUE offload_kqv) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(offload_kqv)) {
    params->offload_kqv = true;
  } else {
    params->offload_kqv = false;
  }
  return offload_kqv;
}

#op_offload ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 864

/* Reader for `op_offload`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_op_offload(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->op_offload) {
    return Qtrue;
  }
  return Qfalse;
}

#op_offload=(op_offload) ⇒ `Boolean`

Parameters:

op_offload (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 869

/* Writer for `op_offload`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_op_offload(VALUE self, VALUE op_offload) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(op_offload)) {
    params->op_offload = true;
  } else {
    params->op_offload = false;
  }
  return op_offload;
}

#pooling_type ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 688

/* Reader for `pooling_type`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_pooling_type(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int pooling_type = (int)params->pooling_type;
  return INT2NUM(pooling_type);
}

#pooling_type=(pooling_type) ⇒ `Integer`

Parameters:

pooling_type (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 693

/* Writer for `pooling_type`: converts the argument with NUM2INT, stores it
 * as an `enum llama_pooling_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_pooling_type(VALUE self, VALUE pooling_type) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(pooling_type);
  params->pooling_type = (enum llama_pooling_type)raw;
  return pooling_type;
}

#rope_freq_base ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 721

/* Reader for `rope_freq_base`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_rope_freq_base(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double rope_freq_base = params->rope_freq_base;
  return DBL2NUM(rope_freq_base);
}

#rope_freq_base=(rope_freq_base) ⇒ `Float`

Parameters:

rope_freq_base (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 726

/* Writer for `rope_freq_base`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_rope_freq_base(VALUE self, VALUE rope_freq_base) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(rope_freq_base);
  params->rope_freq_base = converted;
  return rope_freq_base;
}

#rope_freq_scale ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 732

/* Reader for `rope_freq_scale`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_rope_freq_scale(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double rope_freq_scale = params->rope_freq_scale;
  return DBL2NUM(rope_freq_scale);
}

#rope_freq_scale=(rope_freq_scale) ⇒ `Float`

Parameters:

rope_freq_scale (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 737

/* Writer for `rope_freq_scale`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_rope_freq_scale(VALUE self, VALUE rope_freq_scale) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(rope_freq_scale);
  params->rope_freq_scale = converted;
  return rope_freq_scale;
}

#rope_scaling_type ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 677

/* Reader for `rope_scaling_type`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_rope_scaling_type(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int rope_scaling_type = (int)params->rope_scaling_type;
  return INT2NUM(rope_scaling_type);
}

#rope_scaling_type=(rope_scaling_type) ⇒ `Integer`

Parameters:

rope_scaling_type (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 682

/* Writer for `rope_scaling_type`: converts the argument with NUM2INT, stores it
 * as an `enum llama_rope_scaling_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_rope_scaling_type(VALUE self, VALUE rope_scaling_type) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(rope_scaling_type);
  params->rope_scaling_type = (enum llama_rope_scaling_type)raw;
  return rope_scaling_type;
}

#swa_full ⇒ `Boolean`

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 875

/* Reader for `swa_full`: yields Qtrue when the field is set, Qfalse otherwise. */
static VALUE llama_context_params_get_swa_full(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  if (params->swa_full) {
    return Qtrue;
  }
  return Qfalse;
}

#swa_full=(swa_full) ⇒ `Boolean`

Parameters:

swa_full (Boolean)

Returns:

(Boolean)

# File 'ext/llama_cpp/llama_cpp.c', line 880

/* Writer for `swa_full`: stores the RTEST result of the argument as
 * true/false and returns the argument unchanged. */
static VALUE llama_context_params_set_swa_full(VALUE self, VALUE swa_full) {
  struct llama_context_params *params = get_llama_context_params(self);
  if (RTEST(swa_full)) {
    params->swa_full = true;
  } else {
    params->swa_full = false;
  }
  return swa_full;
}

#type_k ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 809

/* Reader for `type_k`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_type_k(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int type_k = (int)params->type_k;
  return INT2NUM(type_k);
}

#type_k=(type_k) ⇒ `Integer`

Parameters:

type_k (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 814

/* Writer for `type_k`: converts the argument with NUM2INT, stores it
 * as an `enum ggml_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_type_k(VALUE self, VALUE type_k) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(type_k);
  params->type_k = (enum ggml_type)raw;
  return type_k;
}

#type_v ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 820

/* Reader for `type_v`: looks up the params struct behind `self`
 * and hands the field back through INT2NUM. */
static VALUE llama_context_params_get_type_v(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const int type_v = (int)params->type_v;
  return INT2NUM(type_v);
}

#type_v=(type_v) ⇒ `Integer`

Parameters:

type_v (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 825

/* Writer for `type_v`: converts the argument with NUM2INT, stores it
 * as an `enum ggml_type`, and returns the argument unchanged. */
static VALUE llama_context_params_set_type_v(VALUE self, VALUE type_v) {
  struct llama_context_params *params = get_llama_context_params(self);
  const int raw = NUM2INT(type_v);
  params->type_v = (enum ggml_type)raw;
  return type_v;
}

#yarn_attn_factor ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 754

/* Reader for `yarn_attn_factor`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_yarn_attn_factor(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double yarn_attn_factor = params->yarn_attn_factor;
  return DBL2NUM(yarn_attn_factor);
}

#yarn_attn_factor=(yarn_attn_factor) ⇒ `Float`

Parameters:

yarn_attn_factor (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 759

/* Writer for `yarn_attn_factor`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_yarn_attn_factor(VALUE self, VALUE yarn_attn_factor) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(yarn_attn_factor);
  params->yarn_attn_factor = converted;
  return yarn_attn_factor;
}

#yarn_beta_fast ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 765

/* Reader for `yarn_beta_fast`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_yarn_beta_fast(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double yarn_beta_fast = params->yarn_beta_fast;
  return DBL2NUM(yarn_beta_fast);
}

#yarn_beta_fast=(yarn_beta_fast) ⇒ `Float`

Parameters:

yarn_beta_fast (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 770

/* Writer for `yarn_beta_fast`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_yarn_beta_fast(VALUE self, VALUE yarn_beta_fast) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(yarn_beta_fast);
  params->yarn_beta_fast = converted;
  return yarn_beta_fast;
}

#yarn_beta_slow ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 776

/* Reader for `yarn_beta_slow`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_yarn_beta_slow(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double yarn_beta_slow = params->yarn_beta_slow;
  return DBL2NUM(yarn_beta_slow);
}

#yarn_beta_slow=(yarn_beta_slow) ⇒ `Float`

Parameters:

yarn_beta_slow (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 781

/* Writer for `yarn_beta_slow`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_yarn_beta_slow(VALUE self, VALUE yarn_beta_slow) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(yarn_beta_slow);
  params->yarn_beta_slow = converted;
  return yarn_beta_slow;
}

#yarn_ext_factor ⇒ `Float`

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 743

/* Reader for `yarn_ext_factor`: looks up the params struct behind `self`
 * and hands the field back through DBL2NUM. */
static VALUE llama_context_params_get_yarn_ext_factor(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const double yarn_ext_factor = params->yarn_ext_factor;
  return DBL2NUM(yarn_ext_factor);
}

#yarn_ext_factor=(yarn_ext_factor) ⇒ `Float`

Parameters:

yarn_ext_factor (Float)

Returns:

(Float)

# File 'ext/llama_cpp/llama_cpp.c', line 748

/* Writer for `yarn_ext_factor`: converts the argument with NUM2DBL, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_yarn_ext_factor(VALUE self, VALUE yarn_ext_factor) {
  struct llama_context_params *params = get_llama_context_params(self);
  const double converted = NUM2DBL(yarn_ext_factor);
  params->yarn_ext_factor = converted;
  return yarn_ext_factor;
}

#yarn_orig_ctx ⇒ `Integer`

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 787

/* Reader for `yarn_orig_ctx`: looks up the params struct behind `self`
 * and hands the field back through UINT2NUM. */
static VALUE llama_context_params_get_yarn_orig_ctx(VALUE self) {
  const struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int yarn_orig_ctx = params->yarn_orig_ctx;
  return UINT2NUM(yarn_orig_ctx);
}

#yarn_orig_ctx=(yarn_orig_ctx) ⇒ `Integer`

Parameters:

yarn_orig_ctx (Integer)

Returns:

(Integer)

# File 'ext/llama_cpp/llama_cpp.c', line 792

/* Writer for `yarn_orig_ctx`: converts the argument with NUM2UINT, assigns it
 * to the field, and returns the argument unchanged. */
static VALUE llama_context_params_set_yarn_orig_ctx(VALUE self, VALUE yarn_orig_ctx) {
  struct llama_context_params *params = get_llama_context_params(self);
  const unsigned int converted = NUM2UINT(yarn_orig_ctx);
  params->yarn_orig_ctx = converted;
  return yarn_orig_ctx;
}

Class: LlamaCpp::LlamaContextParams

Overview

Instance Method Summary collapse

Instance Method Details

#attention_type ⇒ Integer

#attention_type=(attention_type) ⇒ Integer

#defrag_thold ⇒ Float

#defrag_thold=(defrag_thold) ⇒ Float

#embeddings ⇒ Boolean

#embeddings=(embeddings) ⇒ Boolean

#flash_attn_type ⇒ Integer

#flash_attn_type=(flash_attn_type) ⇒ Integer

#kv_unified ⇒ Boolean

#kv_unified=(kv_unified) ⇒ Boolean

#n_batch ⇒ Integer

#n_batch=(n_batch) ⇒ Integer

#n_ctx ⇒ Integer

#n_ctx=(n_ctx) ⇒ Integer

#n_seq_max ⇒ Integer

#n_seq_max=(n_seq_max) ⇒ Integer

#n_threads ⇒ Integer

#n_threads=(n_threads) ⇒ Integer

#n_threads_batch ⇒ Integer

#n_threads_batch=(n_threads_batch) ⇒ Integer

#n_ubatch ⇒ Integer

#n_ubatch=(n_ubatch) ⇒ Integer

#no_perf ⇒ Boolean

#no_perf=(no_perf) ⇒ Boolean

#offload_kqv ⇒ Boolean

#offload_kqv=(offload_kqv) ⇒ Boolean

#op_offload ⇒ Boolean

#op_offload=(op_offload) ⇒ Boolean

#pooling_type ⇒ Integer

#pooling_type=(pooling_type) ⇒ Integer

#rope_freq_base ⇒ Float

#rope_freq_base=(rope_freq_base) ⇒ Float

#rope_freq_scale ⇒ Float

#rope_freq_scale=(rope_freq_scale) ⇒ Float

#rope_scaling_type ⇒ Integer

#rope_scaling_type=(rope_scaling_type) ⇒ Integer

#swa_full ⇒ Boolean

#swa_full=(swa_full) ⇒ Boolean

#type_k ⇒ Integer

#type_k=(type_k) ⇒ Integer

#type_v ⇒ Integer

#type_v=(type_v) ⇒ Integer

#yarn_attn_factor ⇒ Float

#yarn_attn_factor=(yarn_attn_factor) ⇒ Float

#yarn_beta_fast ⇒ Float

#yarn_beta_fast=(yarn_beta_fast) ⇒ Float

#yarn_beta_slow ⇒ Float

#yarn_beta_slow=(yarn_beta_slow) ⇒ Float

#yarn_ext_factor ⇒ Float

#yarn_ext_factor=(yarn_ext_factor) ⇒ Float

#yarn_orig_ctx ⇒ Integer

#yarn_orig_ctx=(yarn_orig_ctx) ⇒ Integer

#attention_type ⇒ `Integer`

#attention_type=(attention_type) ⇒ `Integer`

#defrag_thold ⇒ `Float`

#defrag_thold=(defrag_thold) ⇒ `Float`

#embeddings ⇒ `Boolean`

#embeddings=(embeddings) ⇒ `Boolean`

#flash_attn_type ⇒ `Integer`

#flash_attn_type=(flash_attn_type) ⇒ `Integer`

#kv_unified ⇒ `Boolean`

#kv_unified=(kv_unified) ⇒ `Boolean`

#n_batch ⇒ `Integer`

#n_batch=(n_batch) ⇒ `Integer`

#n_ctx ⇒ `Integer`

#n_ctx=(n_ctx) ⇒ `Integer`

#n_seq_max ⇒ `Integer`

#n_seq_max=(n_seq_max) ⇒ `Integer`

#n_threads ⇒ `Integer`

#n_threads=(n_threads) ⇒ `Integer`

#n_threads_batch ⇒ `Integer`

#n_threads_batch=(n_threads_batch) ⇒ `Integer`

#n_ubatch ⇒ `Integer`

#n_ubatch=(n_ubatch) ⇒ `Integer`

#no_perf ⇒ `Boolean`

#no_perf=(no_perf) ⇒ `Boolean`

#offload_kqv ⇒ `Boolean`

#offload_kqv=(offload_kqv) ⇒ `Boolean`

#op_offload ⇒ `Boolean`

#op_offload=(op_offload) ⇒ `Boolean`

#pooling_type ⇒ `Integer`

#pooling_type=(pooling_type) ⇒ `Integer`

#rope_freq_base ⇒ `Float`

#rope_freq_base=(rope_freq_base) ⇒ `Float`

#rope_freq_scale ⇒ `Float`

#rope_freq_scale=(rope_freq_scale) ⇒ `Float`

#rope_scaling_type ⇒ `Integer`

#rope_scaling_type=(rope_scaling_type) ⇒ `Integer`

#swa_full ⇒ `Boolean`

#swa_full=(swa_full) ⇒ `Boolean`

#type_k ⇒ `Integer`

#type_k=(type_k) ⇒ `Integer`

#type_v ⇒ `Integer`

#type_v=(type_v) ⇒ `Integer`

#yarn_attn_factor ⇒ `Float`

#yarn_attn_factor=(yarn_attn_factor) ⇒ `Float`

#yarn_beta_fast ⇒ `Float`

#yarn_beta_fast=(yarn_beta_fast) ⇒ `Float`

#yarn_beta_slow ⇒ `Float`

#yarn_beta_slow=(yarn_beta_slow) ⇒ `Float`

#yarn_ext_factor ⇒ `Float`

#yarn_ext_factor=(yarn_ext_factor) ⇒ `Float`

#yarn_orig_ctx ⇒ `Integer`

#yarn_orig_ctx=(yarn_orig_ctx) ⇒ `Integer`