export interface LoadModelParams { log_level?: LogLevel; seed?: number; n_ctx?: number; n_batch?: number; n_gpu_layers?: number; n_threads?: number; embeddings?: boolean; offload_kqv?: boolean; pooling_type?: 'LLAMA_POOLING_TYPE_UNSPECIFIED' | 'LLAMA_POOLING_TYPE_NONE' | 'LLAMA_POOLING_TYPE_MEAN' | 'LLAMA_POOLING_TYPE_CLS' | 'unspecified' | 'none' | 'mean' | 'cls' | 'last' | 'rank'; rope_scaling_type?: 'LLAMA_ROPE_SCALING_TYPE_UNSPECIFIED' | 'LLAMA_ROPE_SCALING_TYPE_NONE' | 'LLAMA_ROPE_SCALING_TYPE_LINEAR' | 'LLAMA_ROPE_SCALING_TYPE_YARN'; rope_freq_base?: number; rope_freq_scale?: number; yarn_ext_factor?: number; yarn_attn_factor?: number; yarn_beta_fast?: number; yarn_beta_slow?: number; yarn_orig_ctx?: number; cache_type_k?: 'f32' | 'f16' | 'q8_0' | 'q5_1' | 'q5_0' | 'q4_1' | 'q4_0'; cache_type_v?: 'f32' | 'f16' | 'q8_0' | 'q5_1' | 'q5_0' | 'q4_1' | 'q4_0'; flash_attn?: boolean; swa_full?: boolean; chat_template?: string; jinja?: boolean; reasoning?: boolean; image_min_tokens?: number; image_max_tokens?: number; warmup?: boolean; no_kv_offload?: boolean; mmproj_offload?: boolean; cont_batching?: boolean; n_keep?: number; ctx_shift?: boolean; cache_idle_slots?: boolean; n_cache_reuse?: number; lora_adapters?: { path: string; scale?: number; }[]; lora_init_without_apply?: boolean; spec_draft_model?: string; spec_draft_ngl?: number; spec_draft_n_max?: number; spec_draft_n_min?: number; spec_draft_p_min?: number; spec_draft_threads?: number; spec_draft_threads_batch?: number; kv_overrides?: Record; reasoning_budget_tokens?: number; reasoning_budget_message?: string; reasoning_format?: 'none' | 'deepseek-legacy' | 'deepseek'; skip_chat_parsing?: boolean; prefill_assistant?: boolean; default_template_kwargs?: Record; } export interface LoadedContextInfo { n_vocab: number; n_ctx: number; n_batch: number; n_ubatch: number; n_ctx_train: number; n_embd: number; n_layer: number; metadata: Record; token_bos: number; token_eos: number; token_eot: number; list_tokens_eog: number[]; has_encoder: boolean; token_decoder_start: number; add_bos_token: boolean; add_eos_token: boolean; has_image_input: boolean; has_audio_input: boolean; } export interface SamplingParams { seed?: number; mirostat?: number | undefined; mirostat_eta?: number | undefined; mirostat_tau?: number | undefined; samplers_sequence?: string[] | undefined; temp?: number | undefined; top_p?: number | undefined; top_k?: number | undefined; penalty_last_n?: number | undefined; penalty_repeat?: number | undefined; penalty_freq?: number | undefined; penalty_present?: number | undefined; dynatemp_range?: number | undefined; dynatemp_exponent?: number | undefined; grammar?: string; n_prev?: number | undefined; n_probs?: number | undefined; min_p?: number | undefined; typ_p?: number | undefined; typical_p?: number | undefined; logit_bias?: { token: number; bias: number; }[] | undefined; ignore_eos?: boolean | undefined; } export interface StreamParams { stream: true; onData: (data: T) => void; } export declare enum LogLevel { DEBUG = 1, INFO = 2, WARN = 3, ERROR = 4 }