|
|
|
@ -169,7 +169,7 @@ var ( |
|
|
|
// NewEngine enables the new Ollama engine
|
|
|
|
NewEngine = Bool("OLLAMA_NEW_ENGINE") |
|
|
|
// ContextLength sets the default context length
|
|
|
|
ContextLength = Uint("OLLAMA_CONTEXT_LENGTH", 2048) |
|
|
|
ContextLength = Uint("OLLAMA_CONTEXT_LENGTH", 4096) |
|
|
|
) |
|
|
|
|
|
|
|
func String(s string) func() string { |
|
|
|
@ -255,7 +255,7 @@ func AsMap() map[string]EnvVar { |
|
|
|
"OLLAMA_ORIGINS": {"OLLAMA_ORIGINS", AllowedOrigins(), "A comma separated list of allowed origins"}, |
|
|
|
"OLLAMA_SCHED_SPREAD": {"OLLAMA_SCHED_SPREAD", SchedSpread(), "Always schedule model across all GPUs"}, |
|
|
|
"OLLAMA_MULTIUSER_CACHE": {"OLLAMA_MULTIUSER_CACHE", MultiUserCache(), "Optimize prompt caching for multi-user scenarios"}, |
|
|
|
"OLLAMA_CONTEXT_LENGTH": {"OLLAMA_CONTEXT_LENGTH", ContextLength(), "Context length to use unless otherwise specified (default: 2048)"}, |
|
|
|
"OLLAMA_CONTEXT_LENGTH": {"OLLAMA_CONTEXT_LENGTH", ContextLength(), "Context length to use unless otherwise specified (default: 4096)"}, |
|
|
|
"OLLAMA_NEW_ENGINE": {"OLLAMA_NEW_ENGINE", NewEngine(), "Enable the new Ollama engine"}, |
|
|
|
|
|
|
|
// Informational
|
|
|
|
|