LlamaController constructor
LlamaController({
- required String modelPath,
- bool? vocabOnly,
- bool? useMmap,
- bool? useMlock,
- bool? checkTensors,
- int? nCtx,
- int? nBatch,
- int? nUBatch,
- int? nSeqMax,
- int? nThreads,
- int? nThreadsBatch,
- RopeScalingType? ropeScalingType,
- PoolingType? poolingType,
- AttentionType? attentionType,
- double? ropeFrequencyBase,
- double? ropeFrequencyScale,
- double? yarnExtrapolationFactor,
- double? yarnAttenuationFactor,
- double? yarnBetaFast,
- double? yarnBetaSlow,
- int? yarnOriginalContext,
- double? defragmentationThreshold,
- GgmlType? typeK,
- GgmlType? typeV,
- bool? embeddings,
- bool? offloadKqv,
- bool? flashAttention,
- bool? noPerformance,
- bool? greedy,
- bool? infill,
- int? seed,
- int? topK,
- double? topP,
- int? minKeepTopP,
- double? minP,
- int? minKeepMinP,
- double? typicalP,
- int? minKeepTypicalP,
- double? temperature,
- double? temperatureDelta,
- double? temperatureExponent,
- double? xtcP,
- double? xtcT,
- int? minKeepXtc,
- int? xtcSeed,
- int? mirostatNVocab,
- int? mirostatSeed,
- double? mirostatTau,
- double? mirostatEta,
- int? mirostatM,
- int? mirostatV2Seed,
- double? mirostatV2Tau,
- double? mirostatV2Eta,
- String? grammarStr,
- String? grammarRoot,
- int? penaltiesLastN,
- double? penaltiesRepeat,
- double? penaltiesFrequency,
- double? penaltiesPresent,
- int? drySamplerNCtxTrain,
- double? drySamplerMultiplier,
- double? drySamplerDryBase,
- int? drySamplerAllowedLength,
})
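Creates a new instance of LlamaController. Only `modelPath` is required; every other parameter is optional and nullable. A null or omitted `nCtx` is stored as 0, and a null or omitted `greedy` or `infill` is stored as false; all remaining options are stored exactly as passed (null when omitted).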
Implementation
/// Creates a [LlamaController] for the model located at [modelPath].
///
/// [modelPath] is the only required argument. Every other named parameter
/// is optional and nullable, and is copied into the private field of the
/// same name (prefixed with an underscore).
///
/// Null handling performed here:
///  * [nCtx] is stored as `0` when null or omitted.
///  * [greedy] and [infill] are stored as `false` when null or omitted.
///  * All remaining options are stored exactly as passed, so an omitted
///    option stays null.
LlamaController({
  required String modelPath,
  bool? vocabOnly,
  bool? useMmap,
  bool? useMlock,
  bool? checkTensors,
  int? nCtx,
  int? nBatch,
  int? nUBatch,
  int? nSeqMax,
  int? nThreads,
  int? nThreadsBatch,
  RopeScalingType? ropeScalingType,
  PoolingType? poolingType,
  AttentionType? attentionType,
  double? ropeFrequencyBase,
  double? ropeFrequencyScale,
  double? yarnExtrapolationFactor,
  double? yarnAttenuationFactor,
  double? yarnBetaFast,
  double? yarnBetaSlow,
  int? yarnOriginalContext,
  double? defragmentationThreshold,
  GgmlType? typeK,
  GgmlType? typeV,
  bool? embeddings,
  bool? offloadKqv,
  bool? flashAttention,
  bool? noPerformance,
  bool? greedy,
  bool? infill,
  int? seed,
  int? topK,
  double? topP,
  int? minKeepTopP,
  double? minP,
  int? minKeepMinP,
  double? typicalP,
  int? minKeepTypicalP,
  double? temperature,
  double? temperatureDelta,
  double? temperatureExponent,
  double? xtcP,
  double? xtcT,
  int? minKeepXtc,
  int? xtcSeed,
  int? mirostatNVocab,
  int? mirostatSeed,
  double? mirostatTau,
  double? mirostatEta,
  int? mirostatM,
  int? mirostatV2Seed,
  double? mirostatV2Tau,
  double? mirostatV2Eta,
  String? grammarStr,
  String? grammarRoot,
  int? penaltiesLastN,
  double? penaltiesRepeat,
  double? penaltiesFrequency,
  double? penaltiesPresent,
  int? drySamplerNCtxTrain,
  double? drySamplerMultiplier,
  double? drySamplerDryBase,
  int? drySamplerAllowedLength,
})  : _modelPath = modelPath,
      _vocabOnly = vocabOnly,
      _useMmap = useMmap,
      _useMlock = useMlock,
      _checkTensors = checkTensors,
      // Null or omitted falls back to 0.
      _nCtx = nCtx ?? 0,
      _nBatch = nBatch,
      _nUBatch = nUBatch,
      _nSeqMax = nSeqMax,
      _nThreads = nThreads,
      _nThreadsBatch = nThreadsBatch,
      _ropeScalingType = ropeScalingType,
      _poolingType = poolingType,
      _attentionType = attentionType,
      _ropeFrequencyBase = ropeFrequencyBase,
      _ropeFrequencyScale = ropeFrequencyScale,
      _yarnExtrapolationFactor = yarnExtrapolationFactor,
      _yarnAttenuationFactor = yarnAttenuationFactor,
      _yarnBetaFast = yarnBetaFast,
      _yarnBetaSlow = yarnBetaSlow,
      _yarnOriginalContext = yarnOriginalContext,
      _defragmentationThreshold = defragmentationThreshold,
      _typeK = typeK,
      _typeV = typeV,
      _embeddings = embeddings,
      _offloadKqv = offloadKqv,
      _flashAttention = flashAttention,
      _noPerformance = noPerformance,
      // Null or omitted falls back to false for both flags below.
      _greedy = greedy ?? false,
      _infill = infill ?? false,
      _seed = seed,
      _topK = topK,
      _topP = topP,
      _minKeepTopP = minKeepTopP,
      _minP = minP,
      _minKeepMinP = minKeepMinP,
      _typicalP = typicalP,
      _minKeepTypicalP = minKeepTypicalP,
      _temperature = temperature,
      _temperatureDelta = temperatureDelta,
      _temperatureExponent = temperatureExponent,
      _xtcP = xtcP,
      _xtcT = xtcT,
      _minKeepXtc = minKeepXtc,
      _xtcSeed = xtcSeed,
      _mirostatNVocab = mirostatNVocab,
      _mirostatSeed = mirostatSeed,
      _mirostatTau = mirostatTau,
      _mirostatEta = mirostatEta,
      _mirostatM = mirostatM,
      _mirostatV2Seed = mirostatV2Seed,
      _mirostatV2Tau = mirostatV2Tau,
      _mirostatV2Eta = mirostatV2Eta,
      _grammarStr = grammarStr,
      _grammarRoot = grammarRoot,
      _penaltiesLastN = penaltiesLastN,
      _penaltiesRepeat = penaltiesRepeat,
      _penaltiesFrequency = penaltiesFrequency,
      _penaltiesPresent = penaltiesPresent,
      _drySamplerNCtxTrain = drySamplerNCtxTrain,
      _drySamplerMultiplier = drySamplerMultiplier,
      _drySamplerDryBase = drySamplerDryBase,
      _drySamplerAllowedLength = drySamplerAllowedLength;