chore(ollama): set ollama resource by env-vars
This commit is contained in:
@@ -8,7 +8,11 @@ export OLLAMA_GPU_TYPE := env("OLLAMA_GPU_TYPE", "nvidia")
|
|||||||
export OLLAMA_GPU_COUNT := env("OLLAMA_GPU_COUNT", "1")
|
export OLLAMA_GPU_COUNT := env("OLLAMA_GPU_COUNT", "1")
|
||||||
export OLLAMA_MODELS := env("OLLAMA_MODELS", "")
|
export OLLAMA_MODELS := env("OLLAMA_MODELS", "")
|
||||||
export OLLAMA_STORAGE_SIZE := env("OLLAMA_STORAGE_SIZE", "30Gi")
|
export OLLAMA_STORAGE_SIZE := env("OLLAMA_STORAGE_SIZE", "30Gi")
|
||||||
export OLLAMA_HELM_TIMEOUT := env("OLLAMA_HELM_TIMEOUT", "10m")
|
export OLLAMA_HELM_TIMEOUT := env("OLLAMA_HELM_TIMEOUT", "60m")
|
||||||
|
export OLLAMA_MEMORY_REQUEST := env("OLLAMA_MEMORY_REQUEST", "2Gi")
|
||||||
|
export OLLAMA_MEMORY_LIMIT := env("OLLAMA_MEMORY_LIMIT", "12Gi")
|
||||||
|
export OLLAMA_CPU_REQUEST := env("OLLAMA_CPU_REQUEST", "25m")
|
||||||
|
export OLLAMA_CPU_LIMIT := env("OLLAMA_CPU_LIMIT", "100m")
|
||||||
|
|
||||||
[private]
|
[private]
|
||||||
default:
|
default:
|
||||||
|
|||||||
@@ -36,11 +36,11 @@ securityContext:
|
|||||||
|
|
||||||
resources:
|
resources:
|
||||||
requests:
|
requests:
|
||||||
cpu: 25m
|
cpu: {{ .Env.OLLAMA_CPU_REQUEST }}
|
||||||
memory: 2Gi
|
memory: {{ .Env.OLLAMA_MEMORY_REQUEST }}
|
||||||
limits:
|
limits:
|
||||||
cpu: 100m
|
cpu: {{ .Env.OLLAMA_CPU_LIMIT }}
|
||||||
memory: 8Gi
|
memory: {{ .Env.OLLAMA_MEMORY_LIMIT }}
|
||||||
|
|
||||||
persistentVolume:
|
persistentVolume:
|
||||||
enabled: true
|
enabled: true
|
||||||
|
|||||||
Reference in New Issue
Block a user