mirror of
https://github.com/lordmathis/llamactl.git
synced 2025-11-06 09:04:27 +00:00
Add Instance and CreateInstanceOptions interfaces for instance management
This commit is contained in:
181
ui/src/types/instance.ts
Normal file
181
ui/src/types/instance.ts
Normal file
@@ -0,0 +1,181 @@
|
||||
/**
 * A single managed instance as represented in the UI.
 */
export interface Instance {
  /** Name of the instance. */
  name: string;
  /** Whether the instance is currently running. */
  running: boolean;
  /** Options associated with the instance; may be absent. */
  options?: CreateInstanceOptions;
}
|
||||
|
||||
/**
 * Options that can be supplied for an instance.
 *
 * Every member is optional, so an empty object is a valid value. The members
 * are grouped by the section comments below.
 */
export interface CreateInstanceOptions {
  // Restart settings
  // NOTE(review): the unit of restart_delay is not visible in this file — confirm against the backend.
  auto_restart?: boolean;
  max_restarts?: number;
  restart_delay?: number;

  // Llama server options
  // Common params
  verbose_prompt?: boolean;
  threads?: number;
  threads_batch?: number;
  cpu_mask?: string;
  cpu_range?: string;
  cpu_strict?: number;
  priority?: number;
  poll?: number;
  cpu_mask_batch?: string;
  cpu_range_batch?: string;
  cpu_strict_batch?: number;
  priority_batch?: number;
  poll_batch?: number;
  ctx_size?: number;
  predict?: number;
  batch_size?: number;
  ubatch_size?: number;
  keep?: number;
  flash_attn?: boolean;
  no_perf?: boolean;
  escape?: boolean;
  no_escape?: boolean;
  rope_scaling?: string;
  rope_scale?: number;
  rope_freq_base?: number;
  rope_freq_scale?: number;
  yarn_orig_ctx?: number;
  yarn_ext_factor?: number;
  yarn_attn_factor?: number;
  yarn_beta_slow?: number;
  yarn_beta_fast?: number;
  dump_kv_cache?: boolean;
  no_kv_offload?: boolean;
  cache_type_k?: string;
  cache_type_v?: string;
  defrag_thold?: number;
  parallel?: number;
  mlock?: boolean;
  no_mmap?: boolean;
  numa?: string;
  device?: string;
  override_tensor?: string[];
  gpu_layers?: number;
  split_mode?: string;
  tensor_split?: string;
  main_gpu?: number;
  check_tensors?: boolean;
  override_kv?: string[];
  lora?: string[];
  lora_scaled?: string[];
  control_vector?: string[];
  control_vector_scaled?: string[];
  control_vector_layer_range?: string;
  model?: string;
  model_url?: string;
  hf_repo?: string;
  hf_repo_draft?: string;
  hf_file?: string;
  hf_repo_v?: string;
  hf_file_v?: string;
  hf_token?: string;
  log_disable?: boolean;
  log_file?: string;
  log_colors?: boolean;
  verbose?: boolean;
  verbosity?: number;
  log_prefix?: boolean;
  log_timestamps?: boolean;

  // Sampling params
  samplers?: string;
  seed?: number;
  sampling_seq?: string;
  ignore_eos?: boolean;
  temperature?: number;
  top_k?: number;
  top_p?: number;
  min_p?: number;
  xtc_probability?: number;
  xtc_threshold?: number;
  typical?: number;
  repeat_last_n?: number;
  repeat_penalty?: number;
  presence_penalty?: number;
  frequency_penalty?: number;
  dry_multiplier?: number;
  dry_base?: number;
  dry_allowed_length?: number;
  dry_penalty_last_n?: number;
  dry_sequence_breaker?: string[];
  dynatemp_range?: number;
  dynatemp_exp?: number;
  mirostat?: number;
  mirostat_lr?: number;
  mirostat_ent?: number;
  logit_bias?: string[];
  grammar?: string;
  grammar_file?: string;
  json_schema?: string;
  json_schema_file?: string;

  // Server/Example-specific params
  no_context_shift?: boolean;
  special?: boolean;
  no_warmup?: boolean;
  spm_infill?: boolean;
  pooling?: string;
  cont_batching?: boolean;
  no_cont_batching?: boolean;
  mmproj?: string;
  mmproj_url?: string;
  no_mmproj?: boolean;
  no_mmproj_offload?: boolean;
  alias?: string;
  host?: string;
  port?: number;
  path?: string;
  no_webui?: boolean;
  embedding?: boolean;
  reranking?: boolean;
  api_key?: string;
  api_key_file?: string;
  ssl_key_file?: string;
  ssl_cert_file?: string;
  chat_template_kwargs?: string;
  timeout?: number;
  threads_http?: number;
  cache_reuse?: number;
  metrics?: boolean;
  slots?: boolean;
  props?: boolean;
  no_slots?: boolean;
  slot_save_path?: string;
  jinja?: boolean;
  reasoning_format?: string;
  reasoning_budget?: number;
  chat_template?: string;
  chat_template_file?: string;
  no_prefill_assistant?: boolean;
  slot_prompt_similarity?: number;
  lora_init_without_apply?: boolean;

  // Speculative decoding params
  draft_max?: number;
  draft_min?: number;
  draft_p_min?: number;
  ctx_size_draft?: number;
  device_draft?: string;
  gpu_layers_draft?: number;
  model_draft?: string;
  cache_type_k_draft?: string;
  cache_type_v_draft?: string;

  // Audio/TTS params
  model_vocoder?: string;
  tts_use_guide_tokens?: boolean;

  // Default model params
  embd_bge_small_en_default?: boolean;
  embd_e5_small_en_default?: boolean;
  embd_gte_small_default?: boolean;
  fim_qwen_1_5b_default?: boolean;
  fim_qwen_3b_default?: boolean;
  fim_qwen_7b_default?: boolean;
  fim_qwen_7b_spec?: boolean;
  fim_qwen_14b_spec?: boolean;
}
|
||||
Reference in New Issue
Block a user