Class OllamaOptions
Inheritance
OllamaOptions
Assembly: Glitch9.AIDevKit.Provider.Ollama.dll
Syntax
public sealed class OllamaOptions : ITextRequestOptions, IProviderRequestOptions
Properties
|
Edit this page
View Source
KeepAlive
Declaration
public bool? KeepAlive { get; set; }
Property Value
|
Edit this page
View Source
LowVram
Ollama only. Use VRAM-optimized loading.
Declaration
public bool? LowVram { get; set; }
Property Value
|
Edit this page
View Source
MainGpu
Ollama only. ID of the main GPU to prioritize.
Declaration
public int? MainGpu { get; set; }
Property Value
|
Edit this page
View Source
MinP
Minimum probability for token filtering (less common).
Range: 0.0-1.0
Declaration
public float? MinP { get; set; }
Property Value
|
Edit this page
View Source
Mirostat
Ollama only. Enables Mirostat sampling (0: off, 1 or 2: enabled).
Declaration
public int? Mirostat { get; set; }
Property Value
|
Edit this page
View Source
MirostatEta
Ollama only. Controls learning rate in Mirostat sampling.
Typical: 0.1
Declaration
public float? MirostatEta { get; set; }
Property Value
|
Edit this page
View Source
MirostatTau
Ollama only. Controls surprise level in Mirostat sampling.
Typical: 5.0
Declaration
public float? MirostatTau { get; set; }
Property Value
|
Edit this page
View Source
NumBatch
Number of tokens to process in a single batch.
Declaration
public int? NumBatch { get; set; }
Property Value
|
Edit this page
View Source
NumCtx
Ollama only. Number of context tokens (max sequence length).
Declaration
public int? NumCtx { get; set; }
Property Value
|
Edit this page
View Source
NumGpu
Ollama only. Number of GPUs to use.
Declaration
public int? NumGpu { get; set; }
Property Value
|
Edit this page
View Source
NumKeep
Ollama only. Number of initial tokens to keep from context when truncating.
Declaration
public int? NumKeep { get; set; }
Property Value
|
Edit this page
View Source
NumPredict
Ollama only. Maximum number of tokens to predict (like max_tokens).
Declaration
public int? NumPredict { get; set; }
Property Value
|
Edit this page
View Source
NumThread
Ollama only. Number of CPU threads to use for inference.
Typical: number of physical CPU cores.
Declaration
public int? NumThread { get; set; }
Property Value
|
Edit this page
View Source
Numa
Ollama only. Enable NUMA-aware optimization.
Declaration
public bool? Numa { get; set; }
Property Value
|
Edit this page
View Source
PenalizeNewline
Ollama only. Whether to apply penalties to newline tokens.
Declaration
public bool? PenalizeNewline { get; set; }
Property Value
|
Edit this page
View Source
RepeatLastN
Ollama only. Number of previous tokens to consider for repetition penalty.
Typical: 64-256
Declaration
public int? RepeatLastN { get; set; }
Property Value
|
Edit this page
View Source
RepeatPenalty
Penalizes repetition of recent tokens.
Range: 0.0-2.0 (typical: 1.1).
Declaration
public float? RepeatPenalty { get; set; }
Property Value
|
Edit this page
View Source
TypicalP
Ollama only. Typical sampling, alternative to top_p.
Range: 0.0-1.0
Declaration
public float? TypicalP { get; set; }
Property Value
|
Edit this page
View Source
UseMlock
Ollama only. Lock model in RAM.
Declaration
public bool? UseMlock { get; set; }
Property Value
|
Edit this page
View Source
UseMmap
Ollama only. Use memory-mapped files.
Declaration
public bool? UseMmap { get; set; }
Property Value
|
Edit this page
View Source
VocabOnly
Ollama only. Only load the vocabulary; do not load full model.
Declaration
public bool? VocabOnly { get; set; }
Property Value
Implements
Extension Methods