14#include <unordered_map>
19struct llama_control_vector_load_info;
39 uint32_t
seed = LLAMA_DEFAULT_SEED;
71 ggml_backend_sched_eval_callback
cb_eval =
nullptr;
74 ggml_numa_strategy
numa = GGML_NUMA_STRATEGY_DISABLED;
76 enum llama_split_mode
split_mode = LLAMA_SPLIT_MODE_LAYER;
78 enum llama_pooling_type
pooling_type = LLAMA_POOLING_TYPE_UNSPECIFIED;
int32_t cpu_get_num_physical_cores()
int32_t cpu_get_num_math()
dimre_method
Definition common-base.h:33
@ DIMRE_METHOD_MEAN
Definition common-base.h:35
@ DIMRE_METHOD_PCA
Definition common-base.h:34
Definition common-base.h:38
int32_t port
Definition common-base.h:172
bool kl_divergence
Definition common-base.h:128
int32_t chunk_size
Definition common-base.h:207
bool verbose_prompt
Definition common-base.h:150
int32_t n_gpu_layers
Definition common-base.h:55
std::vector< std::string > antiprompt
Definition common-base.h:103
std::string hostname
Definition common-base.h:177
bool multiline_input
Definition common-base.h:140
float rope_freq_scale
Definition common-base.h:63
float slot_prompt_similarity
Definition common-base.h:195
float p_split
Definition common-base.h:54
int32_t n_ubatch
Definition common-base.h:48
bool interactive_first
Definition common-base.h:134
int32_t main_gpu
Definition common-base.h:57
std::vector< std::string > api_keys
Definition common-base.h:183
std::string lookup_cache_dynamic
Definition common-base.h:98
std::string chunk_separator
Definition common-base.h:209
std::string cache_type_v
Definition common-base.h:159
bool compute_ppl
Definition common-base.h:223
bool usage
Definition common-base.h:130
std::string prompt
Definition common-base.h:91
int32_t grp_attn_n
Definition common-base.h:59
int32_t n_print
Definition common-base.h:61
bool infill
Definition common-base.h:152
int n_pca_batch
Definition common-base.h:226
std::string model_draft
Definition common-base.h:85
std::string hf_file
Definition common-base.h:90
std::vector< std::tuple< std::string, float > > lora_adapter
Definition common-base.h:107
int32_t timeout_write
Definition common-base.h:174
bool multiple_choice
Definition common-base.h:125
std::string logdir
Definition common-base.h:96
std::string hf_token
Definition common-base.h:88
int32_t n_threads_batch_draft
Definition common-base.h:44
float yarn_attn_factor
Definition common-base.h:65
int32_t timeout_read
Definition common-base.h:173
enum llama_attention_type attention_type
Definition common-base.h:79
size_t multiple_choice_tasks
Definition common-base.h:126
bool use_color
Definition common-base.h:131
std::string logits_file
Definition common-base.h:99
enum llama_rope_scaling_type rope_scaling_type
Definition common-base.h:77
std::string embd_out
Definition common-base.h:168
int32_t n_sequences
Definition common-base.h:53
std::string model
Definition common-base.h:84
std::vector< llama_model_kv_override > kv_overrides
Definition common-base.h:104
int32_t verbosity
Definition common-base.h:111
bool hellaswag
Definition common-base.h:119
bool winogrande
Definition common-base.h:122
uint32_t seed
Definition common-base.h:39
int32_t ppl_stride
Definition common-base.h:115
int32_t control_vector_layer_end
Definition common-base.h:113
std::vector< int32_t > n_pp
Definition common-base.h:200
dimre_method cvector_dimre_method
Definition common-base.h:228
bool enable_chat_template
Definition common-base.h:181
bool use_mmap
Definition common-base.h:148
int32_t n_draft
Definition common-base.h:50
std::string system_prompt
Definition common-base.h:180
float tensor_split[128]
Definition common-base.h:58
std::string lookup_cache_static
Definition common-base.h:97
std::string ssl_file_cert
Definition common-base.h:186
bool logits_all
Definition common-base.h:147
std::string out_file
Definition common-base.h:216
int32_t n_batch
Definition common-base.h:47
int32_t n_threads_batch
Definition common-base.h:43
std::vector< int32_t > n_tg
Definition common-base.h:201
bool display_prompt
Definition common-base.h:151
int32_t n_predict
Definition common-base.h:45
std::string rpc_servers
Definition common-base.h:100
int32_t n_save_freq
Definition common-base.h:219
int32_t n_ctx
Definition common-base.h:46
float yarn_beta_slow
Definition common-base.h:67
int32_t ppl_output_type
Definition common-base.h:116
int32_t n_threads_http
Definition common-base.h:175
int32_t embd_normalize
Definition common-base.h:167
enum llama_pooling_type pooling_type
Definition common-base.h:78
ggml_backend_sched_eval_callback cb_eval
Definition common-base.h:71
std::string chat_template
Definition common-base.h:179
std::string prompt_file
Definition common-base.h:92
std::string ssl_file_key
Definition common-base.h:185
bool process_output
Definition common-base.h:222
std::vector< int32_t > n_pl
Definition common-base.h:202
std::string input_suffix
Definition common-base.h:95
int32_t n_junk
Definition common-base.h:212
bool endpoint_metrics
Definition common-base.h:189
int32_t grp_attn_w
Definition common-base.h:60
int32_t n_keep
Definition common-base.h:49
bool simple_io
Definition common-base.h:141
std::vector< llama_control_vector_load_info > control_vectors
Definition common-base.h:109
bool special
Definition common-base.h:132
bool no_kv_offload
Definition common-base.h:154
float rope_freq_base
Definition common-base.h:62
std::string hf_repo
Definition common-base.h:89
std::string cvector_positive_file
Definition common-base.h:230
std::string public_path
Definition common-base.h:178
bool use_mlock
Definition common-base.h:149
int32_t yarn_orig_ctx
Definition common-base.h:68
std::vector< std::string > image
Definition common-base.h:163
bool embedding
Definition common-base.h:166
bool interactive
Definition common-base.h:133
size_t hellaswag_tasks
Definition common-base.h:120
int32_t n_parallel
Definition common-base.h:52
bool warmup
Definition common-base.h:155
bool prompt_cache_all
Definition common-base.h:136
std::vector< std::string > context_files
Definition common-base.h:205
size_t winogrande_tasks
Definition common-base.h:123
int32_t i_chunk
Definition common-base.h:220
bool is_pp_shared
Definition common-base.h:198
bool prompt_cache_ro
Definition common-base.h:137
bool escape
Definition common-base.h:139
std::string cvector_outfile
Definition common-base.h:229
bool flash_attn
Definition common-base.h:143
int32_t n_chunks
Definition common-base.h:51
bool conversation
Definition common-base.h:135
void * cb_eval_user_data
Definition common-base.h:72
int32_t n_threads_draft
Definition common-base.h:42
bool dump_kv_cache
Definition common-base.h:153
std::string embd_sep
Definition common-base.h:169
int n_pca_iterations
Definition common-base.h:227
int32_t n_threads
Definition common-base.h:41
int32_t i_pos
Definition common-base.h:213
std::string path_prompt_cache
Definition common-base.h:93
std::string cache_type_k
Definition common-base.h:158
bool cont_batching
Definition common-base.h:142
bool input_prefix_bos
Definition common-base.h:145
int32_t control_vector_layer_start
Definition common-base.h:112
std::string lora_outfile
Definition common-base.h:235
bool endpoint_slots
Definition common-base.h:188
struct llama_sampling_params sparams
Definition common-base.h:82
std::string input_prefix
Definition common-base.h:94
std::string mmproj
Definition common-base.h:162
bool log_json
Definition common-base.h:191
std::string model_alias
Definition common-base.h:86
int32_t n_out_freq
Definition common-base.h:218
enum llama_split_mode split_mode
Definition common-base.h:76
std::string model_url
Definition common-base.h:87
ggml_numa_strategy numa
Definition common-base.h:74
bool check_tensors
Definition common-base.h:156
bool ignore_eos
Definition common-base.h:146
std::string cvector_negative_file
Definition common-base.h:231
int32_t n_gpu_layers_draft
Definition common-base.h:56
bool spm_infill
Definition common-base.h:233
std::string slot_save_path
Definition common-base.h:193
float defrag_thold
Definition common-base.h:69
float yarn_beta_fast
Definition common-base.h:66
std::vector< std::string > in_files
Definition common-base.h:102
float yarn_ext_factor
Definition common-base.h:64
Definition sampling-base.h:18