|
Strings | antiprompt [get, set] |
|
Strings | api_keys [get, set] |
|
SWIGTYPE_llama_attention_type | attention_type [get, set] |
|
string | cache_type_k [get, set] |
|
string | cache_type_v [get, set] |
|
SWIGTYPE_p_ggml_backend_sched_eval_callback | cb_eval [get, set] |
|
SWIGTYPE_p_void | cb_eval_user_data [get, set] |
|
string | chat_template [get, set] |
|
bool | check_tensors [get, set] |
|
string | chunk_separator [get, set] |
|
int | chunk_size [get, set] |
|
bool | compute_ppl [get, set] |
|
bool | cont_batching [get, set] |
|
Strings | context_files [get, set] |
|
int | control_vector_layer_end [get, set] |
|
int | control_vector_layer_start [get, set] |
|
LlamaControlVectorLoadInfos | control_vectors [get, set] |
|
bool | conversation [get, set] |
|
dimre_method | cvector_dimre_method [get, set] |
|
string | cvector_negative_file [get, set] |
|
string | cvector_outfile [get, set] |
|
string | cvector_positive_file [get, set] |
|
float | defrag_thold [get, set] |
|
bool | display_prompt [get, set] |
|
bool | dump_kv_cache [get, set] |
|
int | embd_normalize [get, set] |
|
string | embd_out [get, set] |
|
string | embd_sep [get, set] |
|
bool | embedding [get, set] |
|
bool | enable_chat_template [get, set] |
|
bool | endpoint_metrics [get, set] |
|
bool | endpoint_slots [get, set] |
|
bool | escape [get, set] |
|
bool | flash_attn [get, set] |
|
int | grp_attn_n [get, set] |
|
int | grp_attn_w [get, set] |
|
bool | hellaswag [get, set] |
|
uint | hellaswag_tasks [get, set] |
|
string | hf_file [get, set] |
|
string | hf_repo [get, set] |
|
string | hf_token [get, set] |
|
string | hostname [get, set] |
|
int | i_chunk [get, set] |
|
int | i_pos [get, set] |
|
bool | ignore_eos [get, set] |
|
Strings | image [get, set] |
|
Strings | in_files [get, set] |
|
bool | infill [get, set] |
|
string | input_prefix [get, set] |
|
bool | input_prefix_bos [get, set] |
|
string | input_suffix [get, set] |
|
bool | interactive [get, set] |
|
bool | interactive_first [get, set] |
|
bool | is_pp_shared [get, set] |
|
bool | kl_divergence [get, set] |
|
SWIGTYPE_p_std__vectorT_llama_model_kv_override_t | kv_overrides [get, set] |
|
bool | log_json [get, set] |
|
string | logdir [get, set] |
|
bool | logits_all [get, set] |
|
string | logits_file [get, set] |
|
string | lookup_cache_dynamic [get, set] |
|
string | lookup_cache_static [get, set] |
|
SWIGTYPE_p_std__vectorT_std__tupleT_std__string_float_t_t | lora_adapter [get, set] |
|
string | lora_outfile [get, set] |
|
int | main_gpu [get, set] |
|
string | mmproj [get, set] |
|
string | model [get, set] |
|
string | model_alias [get, set] |
|
string | model_draft [get, set] |
|
string | model_url [get, set] |
|
bool | multiline_input [get, set] |
|
bool | multiple_choice [get, set] |
|
uint | multiple_choice_tasks [get, set] |
|
int | n_batch [get, set] |
|
int | n_chunks [get, set] |
|
int | n_ctx [get, set] |
|
int | n_draft [get, set] |
|
int | n_gpu_layers [get, set] |
|
int | n_gpu_layers_draft [get, set] |
|
int | n_junk [get, set] |
|
int | n_keep [get, set] |
|
int | n_out_freq [get, set] |
|
int | n_parallel [get, set] |
|
int | n_pca_batch [get, set] |
|
int | n_pca_iterations [get, set] |
|
Int32s | n_pl [get, set] |
|
Int32s | n_pp [get, set] |
|
int | n_predict [get, set] |
|
int | n_print [get, set] |
|
int | n_save_freq [get, set] |
|
int | n_sequences [get, set] |
|
Int32s | n_tg [get, set] |
|
int | n_threads [get, set] |
|
int | n_threads_batch [get, set] |
|
int | n_threads_batch_draft [get, set] |
|
int | n_threads_draft [get, set] |
|
int | n_threads_http [get, set] |
|
int | n_ubatch [get, set] |
|
bool | no_kv_offload [get, set] |
|
SWIGTYPE_p_ggml_numa_strategy | numa [get, set] |
|
string | out_file [get, set] |
|
float | p_split [get, set] |
|
string | path_prompt_cache [get, set] |
|
SWIGTYPE_llama_pooling_type | pooling_type [get, set] |
|
int | port [get, set] |
|
int | ppl_output_type [get, set] |
|
int | ppl_stride [get, set] |
|
bool | process_output [get, set] |
|
string | prompt [get, set] |
|
bool | prompt_cache_all [get, set] |
|
bool | prompt_cache_ro [get, set] |
|
string | prompt_file [get, set] |
|
string | public_path [get, set] |
|
float | rope_freq_base [get, set] |
|
float | rope_freq_scale [get, set] |
|
SWIGTYPE_llama_rope_scaling_type | rope_scaling_type [get, set] |
|
string | rpc_servers [get, set] |
|
uint | seed [get, set] |
|
bool | simple_io [get, set] |
|
float | slot_prompt_similarity [get, set] |
|
string | slot_save_path [get, set] |
|
llama_sampling_params | sparams [get, set] |
|
bool | special [get, set] |
|
SWIGTYPE_llama_split_mode | split_mode [get, set] |
|
bool | spm_infill [get, set] |
|
string | ssl_file_cert [get, set] |
|
string | ssl_file_key [get, set] |
|
string | system_prompt [get, set] |
|
SWIGTYPE_p_float | tensor_split [get, set] |
|
int | timeout_read [get, set] |
|
int | timeout_write [get, set] |
|
bool | usage [get, set] |
|
bool | use_color [get, set] |
|
bool | use_mlock [get, set] |
|
bool | use_mmap [get, set] |
|
bool | verbose_prompt [get, set] |
|
int | verbosity [get, set] |
|
bool | warmup [get, set] |
|
bool | winogrande [get, set] |
|
uint | winogrande_tasks [get, set] |
|
float | yarn_attn_factor [get, set] |
|
float | yarn_beta_fast [get, set] |
|
float | yarn_beta_slow [get, set] |
|
float | yarn_ext_factor [get, set] |
|
int | yarn_orig_ctx [get, set] |
|