llama-cpp-hs

Index

abort_callbackLlama.Internal.Types.Params
abort_callback_dataLlama.Internal.Types.Params
acceptLlama.Internal.Types
acceptTokenWithSamplerLlama.Sampler
AdapterLora 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
AddBosLlama.Internal.Types
addSamplerToChainLlama.Sampler
allowRequantizeLlama.Internal.Types.Params
AlwaysLlama.Internal.Types
applyLlama.Internal.Types
applyAdapterCVecLlama.Adapter
applySamplerLlama.Sampler
areEmbeddingsEnabledLlama.Decode
attention_typeLlama.Internal.Types.Params
Batch 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
batchGetOneLlama.Decode
batchInitLlama.Decode
biasLlama.Internal.Types
cb_evalLlama.Internal.Types.Params
cb_eval_user_dataLlama.Internal.Types.Params
cellsLlama.Internal.Types
cells_sequencesLlama.Internal.Types
chatApplyTemplateLlama.ChatTemplate
chatContentLlama.ChatTemplate
chatGetBuiltinTemplatesLlama.ChatTemplate
ChatMessage 
1 (Type/Class)Llama.ChatTemplate
2 (Data Constructor)Llama.ChatTemplate
chatRoleLlama.ChatTemplate
checkTensorsLlama.Internal.Types.Params
clearAdapterLoraLlama.Adapter
CLlamaAdapterLora 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
CLlamaContext 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
CLlamaContextParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
CLlamaKVCache 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
CLlamaModel 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
CLlamaModelParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
CLlamaModelQuantizeParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
CLlamaSamplerChainParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
CLlamaVocab 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
cloneLlama.Internal.Types
cloneSamplerLlama.Sampler
contentLlama.Internal.Types
Context 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
ContextParamsPtr 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
ctxLlama.Internal.Types
c_llama_adapter_lora_freeLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_adapter_lora_initLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_apply_adapter_cvecLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_backend_freeLlama.Internal.Foreign.Backend, Llama.Internal.Foreign
c_llama_backend_initLlama.Internal.Foreign.Backend, Llama.Internal.Foreign
c_llama_batch_free_wrapLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_batch_get_one_intoLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_batch_init_intoLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_chat_apply_templateLlama.Internal.Foreign.ChatTemplate, Llama.Internal.Foreign
c_llama_chat_builtin_templatesLlama.Internal.Foreign.ChatTemplate, Llama.Internal.Foreign
c_llama_clear_adapter_loraLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_context_default_params_intoLlama.Internal.Foreign.Context, Llama.Internal.Foreign
c_llama_decode_wrapLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_detach_threadpoolLlama.Internal.Foreign.Context, Llama.Internal.Foreign
c_llama_detokenizeLlama.Internal.Foreign.Tokenize, Llama.Internal.Foreign
c_llama_encodeLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_freeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_get_embeddingsLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_get_embeddings_ithLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_get_embeddings_seqLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_get_kv_selfLlama.Internal.Foreign.Context, Llama.Internal.Foreign
c_llama_get_logitsLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_get_logits_ithLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_get_modelLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_init_from_model_wrapLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_kv_cache_view_freeLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_cache_view_init_intoLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_cache_view_updateLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_can_shiftLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_clearLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_defragLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_n_tokensLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_addLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_cpLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_divLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_keepLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_pos_maxLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_seq_rmLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_updateLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_kv_self_used_cellsLlama.Internal.Foreign.KVCache, Llama.Internal.Foreign
c_llama_log_setLlama.Internal.Foreign.Split, Llama.Internal.Foreign
c_llama_model_chat_templateLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_decoder_start_tokenLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_default_paramsLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_descLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_freeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_get_vocabLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_has_decoderLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_has_encoderLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_is_recurrentLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_load_from_file_wrapLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_load_from_splitsLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_meta_countLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_meta_key_by_indexLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_meta_val_strLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_meta_val_str_by_indexLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_ctx_trainLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_embdLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_headLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_head_kvLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_layerLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_n_paramsLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_quantizeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_quantize_default_paramsLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_rope_freq_scale_trainLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_rope_type_intoLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_model_sizeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
c_llama_n_threadsLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_n_threads_batchLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_n_vocabLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_perf_contextLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_perf_context_printLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_perf_context_resetLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_perf_samplerLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_perf_sampler_printLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_perf_sampler_resetLlama.Internal.Foreign.Performance, Llama.Internal.Foreign
c_llama_pooling_type_intoLlama.Internal.Foreign.Context, Llama.Internal.Foreign
c_llama_print_system_infoLlama.Internal.Foreign.Split, Llama.Internal.Foreign
c_llama_rm_adapter_loraLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_sampler_acceptLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_applyLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_addLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_default_params_intoLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_getLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_initLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_nLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_chain_removeLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_cloneLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_freeLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_get_seedLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_initLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_distLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_dryLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_grammarLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_grammar_lazy_patternsLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_greedyLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_infillLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_logit_biasLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_min_pLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_mirostatLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_mirostat_v2Llama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_penaltiesLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_tempLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_temp_extLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_top_kLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_top_n_sigmaLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_top_pLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_typicalLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_init_xtcLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_nameLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_resetLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_sampler_sampleLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
c_llama_set_abort_callbackLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_set_adapter_loraLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
c_llama_set_causal_attnLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_set_embeddingsLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_set_n_threadsLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_set_warmupLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_split_pathLlama.Internal.Foreign.Split, Llama.Internal.Foreign
c_llama_split_prefixLlama.Internal.Foreign.Split, Llama.Internal.Foreign
c_llama_state_get_dataLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_get_sizeLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_load_fileLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_save_fileLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_seq_get_dataLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_seq_get_sizeLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_seq_load_fileLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_seq_save_fileLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_seq_set_dataLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_state_set_dataLlama.Internal.Foreign.State, Llama.Internal.Foreign
c_llama_synchronizeLlama.Internal.Foreign.Decode, Llama.Internal.Foreign
c_llama_tokenizeLlama.Internal.Foreign.Tokenize, Llama.Internal.Foreign
c_llama_token_to_pieceLlama.Internal.Foreign.Tokenize, Llama.Internal.Foreign
c_llama_vocab_bosLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_eosLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_eotLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_midLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_padLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_preLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_repLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_sepLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_fim_sufLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_get_add_bosLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_get_add_eosLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_get_attrLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_get_scoreLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_get_textLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_is_controlLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_is_eogLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_nlLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_n_tokensLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_padLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_sepLlama.Internal.Foreign.Vocab, Llama.Internal.Foreign
c_llama_vocab_typeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
data_Llama.Internal.Types
decodeBatchLlama.Decode
defaultContextParamsLlama.Context
defaultModelParamsLlama.Model
defaultQuantizeParamsLlama.Model
defaultSamplerChainParamsLlama.Sampler
defrag_tholdLlama.Internal.Types.Params
detachThreadPoolLlama.Context
detokenizeLlama.Tokenize
devicesLlama.Internal.Types.Params
embdLlama.Internal.Types
embeddingsLlama.Internal.Types.Params
encodeBatchLlama.Decode
flash_attnLlama.Internal.Types.Params
freeBatchLlama.Decode
free_Llama.Internal.Types
fromLlamaRopePoolingTypeLlama.Internal.Types.Params
fromLlamaRopeTypeScalingLlama.Internal.Types.Params
fromLlamaRopeVocabTypeLlama.Internal.Types.Params
ftypeLlama.Internal.Types.Params
getBatchSizeLlama.Context
getBatchThreadCountLlama.Decode
getContextModelLlama.Model
getContextPerformanceLlama.Performance
getContextSizeLlama.Context
getMaxDevicesLlama.Context
getMaxSeqCountLlama.Context
getModelChatTemplateLlama.Model
getModelDecoderStartTokenLlama.Model
getModelDescriptionLlama.Model
getModelEmbeddingDimLlama.Model
getModelHasDecoderLlama.Model
getModelHasEncoderLlama.Model
getModelIsRecurrentLlama.Model
getModelMetaCountLlama.Model
getModelMetaKeyByIndexLlama.Model
getModelMetaValueLlama.Model
getModelMetaValueByIndexLlama.Model
getModelNumHeadsLlama.Model
getModelNumKVHeadsLlama.Model
getModelNumLayersLlama.Model
getModelNumParamsLlama.Model
getModelRoPEFreqScaleLlama.Model
getModelRopeTypeLlama.Model
getModelSizeLlama.Model
getModelTrainingContextSizeLlama.Model
getModelVocabLlama.Model
getPoolingTypeLlama.Context
getSamplerChainLengthLlama.Sampler
getSamplerFromChainLlama.Sampler
getSamplerNameLlama.Sampler
getSamplerPerformanceLlama.Performance
getSamplerSeedLlama.Sampler
getSequenceStateSizeLlama.State
getStateDataLlama.State
getStateSizeLlama.State
getThreadCountLlama.Decode
getTimeUsLlama.Context
getUnbatchedSizeLlama.Context
getVocabAddBOSTokenLlama.Vocab
getVocabAddEOSTokenLlama.Vocab
getVocabBosTokenLlama.Vocab
getVocabEosTokenLlama.Vocab
getVocabEotTokenLlama.Vocab
getVocabFIMMiddleTokenLlama.Vocab
getVocabFIMPADTokenLlama.Vocab
getVocabFIMPrefixTokenLlama.Vocab
getVocabFIMSeparatorTokenLlama.Vocab
getVocabFIMSuffixTokenLlama.Vocab
getVocabNlTokenLlama.Vocab
getVocabPadTokenLlama.Vocab
getVocabSepTokenLlama.Vocab
getVocabSizeLlama.Vocab
getVocabTokenAttrLlama.Vocab
getVocabTokenCountLlama.Vocab
getVocabTokenScoreLlama.Vocab
getVocabTokenTextLlama.Vocab
getVocabTypeLlama.Model
GgmlTypeLlama.Internal.Types.Params
GGML_TYPE_BF16Llama.Internal.Types.Params
GGML_TYPE_COUNTLlama.Internal.Types.Params
GGML_TYPE_F16Llama.Internal.Types.Params
GGML_TYPE_F32Llama.Internal.Types.Params
GGML_TYPE_F64Llama.Internal.Types.Params
GGML_TYPE_I16Llama.Internal.Types.Params
GGML_TYPE_I32Llama.Internal.Types.Params
GGML_TYPE_I64Llama.Internal.Types.Params
GGML_TYPE_I8Llama.Internal.Types.Params
GGML_TYPE_IQ1_MLlama.Internal.Types.Params
GGML_TYPE_IQ1_SLlama.Internal.Types.Params
GGML_TYPE_IQ2_SLlama.Internal.Types.Params
GGML_TYPE_IQ2_XSLlama.Internal.Types.Params
GGML_TYPE_IQ2_XXSLlama.Internal.Types.Params
GGML_TYPE_IQ3_SLlama.Internal.Types.Params
GGML_TYPE_IQ3_XXSLlama.Internal.Types.Params
GGML_TYPE_IQ4_NLLlama.Internal.Types.Params
GGML_TYPE_IQ4_XSLlama.Internal.Types.Params
GGML_TYPE_Q2_KLlama.Internal.Types.Params
GGML_TYPE_Q3_KLlama.Internal.Types.Params
GGML_TYPE_Q4_0Llama.Internal.Types.Params
GGML_TYPE_Q4_1Llama.Internal.Types.Params
GGML_TYPE_Q4_KLlama.Internal.Types.Params
GGML_TYPE_Q5_0Llama.Internal.Types.Params
GGML_TYPE_Q5_1Llama.Internal.Types.Params
GGML_TYPE_Q5_KLlama.Internal.Types.Params
GGML_TYPE_Q6_KLlama.Internal.Types.Params
GGML_TYPE_Q8_0Llama.Internal.Types.Params
GGML_TYPE_Q8_1Llama.Internal.Types.Params
GGML_TYPE_Q8_KLlama.Internal.Types.Params
GGML_TYPE_TQ1_0Llama.Internal.Types.Params
GGML_TYPE_TQ2_0Llama.Internal.Types.Params
idLlama.Internal.Types
ifaceLlama.Internal.Types
imatrixLlama.Internal.Types.Params
initAdapterLoraLlama.Adapter
initContextFromModelLlama.Model
initDistributedSamplerLlama.Sampler
initDrySamplerLlama.Sampler
initGrammarLazyPatternsSamplerLlama.Sampler
initGrammarSamplerLlama.Sampler
initGreedySamplerLlama.Sampler
initInfillSamplerLlama.Sampler
initLogitBiasSamplerLlama.Sampler
initMinPSamplerLlama.Sampler
initMirostatSamplerLlama.Sampler
initMirostatV2SamplerLlama.Sampler
initPenaltiesSamplerLlama.Sampler
initSamplerLlama.Sampler
initSamplerChainLlama.Sampler
initTempExtSamplerLlama.Sampler
initTempSamplerLlama.Sampler
initTopKSamplerLlama.Sampler
initTopNSigmaSamplerLlama.Sampler
initTopPSamplerLlama.Sampler
initTypicalSamplerLlama.Sampler
initXTCSamplerLlama.Sampler
isVocabTokenControlLlama.Vocab
isVocabTokenEogLlama.Vocab
keepSplitLlama.Internal.Types.Params
KVCache 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
kvCacheViewInitLlama.KVCache
kvCacheViewUpdateLlama.KVCache
kvOverridesLlama.Internal.Types.Params
kvOverridesQuantizeParamsLlama.Internal.Types.Params
kvSelfCanShiftLlama.KVCache
kvSelfClearLlama.KVCache
kvSelfDefragLlama.KVCache
kvSelfNumTokensLlama.KVCache
kvSelfSeqAddLlama.KVCache
kvSelfSeqCopyLlama.KVCache
kvSelfSeqDivLlama.KVCache
kvSelfSeqKeepLlama.KVCache
kvSelfSeqPosMaxLlama.KVCache
kvSelfSeqRemoveLlama.KVCache
kvSelfUpdateLlama.KVCache
kvSelfUsedCellsLlama.KVCache
LlamaAttentionTypeLlama.Internal.Types.Params
llamaBackendFreeLlama.Backend
llamaBackendInitLlama.Backend
LlamaBatch 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaChatMessage 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaContextParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
LlamaKvCacheView 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaLogitBias 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaModelParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
LlamaModelQuantizeParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
LlamaPerfContextData 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaPerfSamplerData 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaPoolingTypeLlama.Internal.Types.Params
LlamaPosLlama.Internal.Types
LlamaRopeTypeScalingLlama.Internal.Types.Params
LlamaSampler 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaSamplerChainParams 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
LlamaSamplerContextLlama.Internal.Types
LlamaSamplerI 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaSeqIdLlama.Internal.Types
LlamaSplitMode 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
LlamaTokenLlama.Internal.Types
LlamaTokenData 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaTokenDataArray 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
LlamaVocabTypeLlama.Internal.Types.Params
LLAMA_ATTENTION_TYPE_CAUSALLlama.Internal.Types.Params
LLAMA_ATTENTION_TYPE_NON_CAUSALLlama.Internal.Types.Params
LLAMA_ATTENTION_TYPE_UNSPECIFIEDLlama.Internal.Types.Params
llama_max_devicesLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_n_batchLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_n_ctxLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_n_seq_maxLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_n_ubatchLlama.Internal.Foreign.Context, Llama.Internal.Foreign
LLAMA_POOLING_TYPE_CLSLlama.Internal.Types.Params
LLAMA_POOLING_TYPE_LASTLlama.Internal.Types.Params
LLAMA_POOLING_TYPE_MEANLlama.Internal.Types.Params
LLAMA_POOLING_TYPE_NONELlama.Internal.Types.Params
LLAMA_POOLING_TYPE_RANKLlama.Internal.Types.Params
LLAMA_POOLING_TYPE_UNSPECIFIEDLlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_LINEARLlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_LONGROPELlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_MAX_VALUELlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_NONELlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_UNSPECIFIEDLlama.Internal.Types.Params
LLAMA_ROPE_SCALING_TYPE_YARNLlama.Internal.Types.Params
llama_supports_gpu_offloadLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_supports_mlockLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_supports_mmapLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_supports_rpcLlama.Internal.Foreign.Context, Llama.Internal.Foreign
llama_time_usLlama.Internal.Foreign.Context, Llama.Internal.Foreign
LLAMA_VOCAB_TYPE_BPELlama.Internal.Types.Params
LLAMA_VOCAB_TYPE_NONELlama.Internal.Types.Params
LLAMA_VOCAB_TYPE_RWKVLlama.Internal.Types.Params
LLAMA_VOCAB_TYPE_SPMLlama.Internal.Types.Params
LLAMA_VOCAB_TYPE_UGMLlama.Internal.Types.Params
LLAMA_VOCAB_TYPE_WPMLlama.Internal.Types.Params
loadModelFromFileLlama.Model
loadModelFromSplitsLlama.Model
loadSequenceStateFromFileLlama.State
loadStateFromFileLlama.State
logitLlama.Internal.Types
logitsLlama.Internal.Types
logits_allLlama.Internal.Types.Params
mainGpuLlama.Internal.Types.Params
max_contiguousLlama.Internal.Types
max_contiguous_idxLlama.Internal.Types
Model 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
ModelParamsPtr 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
ModelQuantizeParamsPtr 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
nameLlama.Internal.Types
NeverLlama.Internal.Types
nGpuLayersLlama.Internal.Types.Params
noPerfLlama.Internal.Types.Params
no_perfLlama.Internal.Types.Params
nthreadLlama.Internal.Types.Params
n_batchLlama.Internal.Types.Params
n_cellsLlama.Internal.Types
n_ctxLlama.Internal.Types.Params
n_evalLlama.Internal.Types
n_p_evalLlama.Internal.Types
n_sampleLlama.Internal.Types
n_seq_idLlama.Internal.Types
n_seq_max 
1 (Function)Llama.Internal.Types
2 (Function)Llama.Internal.Types.Params
n_threadsLlama.Internal.Types.Params
n_threads_batchLlama.Internal.Types.Params
n_tokensLlama.Internal.Types
n_ubatchLlama.Internal.Types.Params
offload_kqvLlama.Internal.Types.Params
onlyCopyLlama.Internal.Types.Params
outputTensorTypeLlama.Internal.Types.Params
pLlama.Internal.Types
pooling_typeLlama.Internal.Types.Params
posLlama.Internal.Types
printContextPerformanceLlama.Performance
printSamplerPerformanceLlama.Performance
printSystemInfoLlama.Split
progressCallbackLlama.Internal.Types.Params
progressCallbackUserDataLlama.Internal.Types.Params
pure_Llama.Internal.Types.Params
p_llama_adapter_lora_freeLlama.Internal.Foreign.Adapter, Llama.Internal.Foreign
p_llama_freeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
p_llama_model_freeLlama.Internal.Foreign.Model, Llama.Internal.Foreign
p_llama_sampler_freeLlama.Internal.Foreign.Sampler, Llama.Internal.Foreign
quantizeModelLlama.Model
quantizeModelDefaultLlama.Model
quantizeOutputTensorLlama.Internal.Types.Params
removeSamplerFromChainLlama.Sampler
resetLlama.Internal.Types
resetContextPerformanceLlama.Performance
resetSamplerLlama.Sampler
resetSamplerPerformanceLlama.Performance
rmAdapterLoraLlama.Adapter
roleLlama.Internal.Types
rope_freq_baseLlama.Internal.Types.Params
rope_freq_scaleLlama.Internal.Types.Params
rope_scaling_typeLlama.Internal.Types.Params
Sampler 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
SamplerChainParamsPtr 
1 (Type/Class)Llama.Internal.Types.Params
2 (Data Constructor)Llama.Internal.Types.Params
sampleWithSamplerLlama.Sampler
saveSequenceStateToFileLlama.State
saveStateToFileLlama.State
selectedLlama.Internal.Types
seq_idLlama.Internal.Types
setAdapterLoraLlama.Adapter
setCausalAttentionLlama.Decode
setEmbeddingsEnabledLlama.Decode
setSequenceStateDataLlama.State
setStateDataLlama.State
setThreadCountLlama.Decode
setThreadCountsLlama.Decode
setWarmupModeLlama.Decode
size_Llama.Internal.Types
sortedLlama.Internal.Types
splitModeLlama.Internal.Types.Params
splitPathLlama.Split
splitPrefixLlama.Split
supportsGpuOffloadLlama.Context
supportsMLockLlama.Context
supportsMMapLlama.Context
supportsRpcLlama.Context
synchronizeContextLlama.Decode
tensorBuftOverridesLlama.Internal.Types.Params
tensorSplitLlama.Internal.Types.Params
tensorTypesLlama.Internal.Types.Params
toCLlamaChatMessageLlama.ChatTemplate
tokenLlama.Internal.Types
tokenEmbeddingTypeLlama.Internal.Types.Params
tokenizeLlama.Tokenize
tokenLogitBiasLlama.Internal.Types
tokenToPieceLlama.Tokenize
token_countLlama.Internal.Types
type_kLlama.Internal.Types.Params
type_vLlama.Internal.Types.Params
t_eval_msLlama.Internal.Types
t_load_msLlama.Internal.Types
t_p_eval_msLlama.Internal.Types
t_sample_msLlama.Internal.Types
t_start_msLlama.Internal.Types
used_cellsLlama.Internal.Types
useMlockLlama.Internal.Types.Params
useMmapLlama.Internal.Types.Params
Vocab 
1 (Type/Class)Llama.Internal.Types
2 (Data Constructor)Llama.Internal.Types
vocabOnlyLlama.Internal.Types.Params
yarn_attn_factorLlama.Internal.Types.Params
yarn_beta_fastLlama.Internal.Types.Params
yarn_beta_slowLlama.Internal.Types.Params
yarn_ext_factorLlama.Internal.Types.Params
yarn_orig_ctxLlama.Internal.Types.Params