summarylogtreecommitdiffstats
path: root/ollama.conf
blob: 2038e1f9407f94407386be2cfc69890710d474ad (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
# CUDA Environment Variables for Ollama Optimization
#
# Plain KEY=VALUE assignments, one per line. How this file gets loaded
# (systemd EnvironmentFile=, shell `source`, container env-file, ...) is not
# visible from here, so all notes are full-line comments: inline trailing
# comments are not handled the same way by every loader.

# Lists four device indices (0 through 3).
# NOTE(review): hard-coded; presumably has to match the GPUs actually present
# on the host -- confirm before deploying to a machine with a different count.
CUDA_VISIBLE_DEVICES=0,1,2,3
# Presumably makes the indices above follow PCI bus order rather than the
# driver's default ordering -- confirm against the CUDA documentation.
CUDA_DEVICE_ORDER=PCI_BUS_ID
# NOTE(review): 0 looks like the "disabled" setting (non-blocking launches);
# presumably spelled out only for explicitness -- confirm it matches the default.
CUDA_LAUNCH_BLOCKING=0
# Both module-loading knobs are set to LAZY.
# NOTE(review): presumably defers loading until first use to cut startup time
# and memory -- confirm the installed CUDA version honours both variables.
CUDA_MODULE_LOADING=LAZY
CUDA_MODULE_DATA_LOADING=LAZY
# 2147483648 = 2^31, i.e. 2 GiB if the unit is bytes -- TODO confirm the unit
# and the maximum the driver accepts.
CUDA_CACHE_MAXSIZE=2147483648
# NOTE(review): nothing in this file creates the two paths below or sets their
# ownership; the account the service runs as presumably needs write access to
# both -- verify against the unit file / packaging.
CUDA_CACHE_PATH=/var/cache/cuda
CUDA_LOG_FILE=/var/log/cuda.log

# Ollama Environment Variables
#
# NOTE(review): the first three values are wrapped in double quotes while the
# rest are bare. Whether the quotes are stripped or passed through literally
# depends on the loader (not visible from here) -- confirm the server does not
# receive the quote characters as part of the value.

# Loopback address and port 11434, with an explicit http:// scheme; this only
# names the local machine, not an external interface.
OLLAMA_HOST="http://127.0.0.1:11434"
# Both durations are five minutes ("5m").
# NOTE(review): presumably KEEP_ALIVE is how long an idle model stays loaded
# and LOAD_TIMEOUT is how long a model load may take -- confirm in Ollama docs.
OLLAMA_KEEP_ALIVE="5m"
OLLAMA_LOAD_TIMEOUT="5m"
# NOTE(review): presumably the default context window in tokens -- confirm.
OLLAMA_CONTEXT_LENGTH=4096
# NOTE(review): 0 presumably means "let Ollama choose automatically" rather
# than "load no models" -- confirm against the Ollama documentation.
OLLAMA_MAX_LOADED_MODELS=0
# NOTE(review): 0 presumably reserves no extra GPU memory per device -- confirm
# the unit (likely bytes) before changing.
OLLAMA_GPU_OVERHEAD=0
# Queue limit of 512 and a parallelism of 1.
# NOTE(review): presumably 512 queued requests and one concurrent request per
# loaded model -- confirm the exact semantics.
OLLAMA_MAX_QUEUE=512
OLLAMA_NUM_PARALLEL=1
# Boolean switches. The three set to false are presumably left at their
# defaults and listed only so they are easy to flip -- confirm.
OLLAMA_NOHISTORY=false
OLLAMA_NOPRUNE=false
# The only boolean switch in this file that is turned on.
# NOTE(review): presumably needs GPU/model support to take effect -- confirm.
OLLAMA_FLASH_ATTENTION=true
OLLAMA_SCHED_SPREAD=false
# Debug switch set to 0; note it uses 0 rather than the true/false spelling
# used by the other switches above.
# NOTE(review): presumably both spellings are accepted -- confirm.
OLLAMA_DEBUG=0