mirror of
https://github.com/remsky/Kokoro-FastAPI.git
synced 2025-08-31 21:59:28 +00:00
Add example folder values files for Azure AKS and Nvidia GPU Operator
This commit is contained in:
parent
14bd6a8118
commit
3c8e1b9143
2 changed files with 57 additions and 1 deletions
|
@ -19,7 +19,7 @@
|
||||||
# --skip-gpu-driver-install
|
# --skip-gpu-driver-install
|
||||||
|
|
||||||
kokoroTTS:
|
kokoroTTS:
|
||||||
replicaCount: 2
|
replicaCount: 8
|
||||||
port: 8880
|
port: 8880
|
||||||
tag: v0.2.0
|
tag: v0.2.0
|
||||||
pullPolicy: IfNotPresent
|
pullPolicy: IfNotPresent
|
56
charts/kokoro-fastapi/examples/gpu-operator-values.yaml
Normal file
56
charts/kokoro-fastapi/examples/gpu-operator-values.yaml
Normal file
|
@ -0,0 +1,56 @@
|
||||||
|
# Follow the official NVIDIA GPU Operator documentation
|
||||||
|
# to install the GPU operator with these settings:
|
||||||
|
# https://docs.nvidia.com/datacenter/cloud-native/gpu-operator/latest/getting-started.html
|
||||||
|
#
|
||||||
|
# This example is for an NVIDIA T4 16 GB GPU node pool with only 1 GPU on each node on Azure AKS.
|
||||||
|
# It uses time-slicing to share the GPU and advertise to the system that 1 GPU is 4 GPUs.
|
||||||
|
# So each pod gets a share of the GPU, roughly 4 GB of memory each (note: time-slicing does not enforce a per-pod memory limit).
|
||||||
|
#
|
||||||
|
devicePlugin: # Remove this block if you don't want to use time-slicing
|
||||||
|
config:
|
||||||
|
create: true
|
||||||
|
name: "time-slicing-config"
|
||||||
|
default: "any"
|
||||||
|
data:
|
||||||
|
any: |-
|
||||||
|
version: v1
|
||||||
|
flags:
|
||||||
|
migStrategy: none
|
||||||
|
sharing:
|
||||||
|
timeSlicing:
|
||||||
|
resources:
|
||||||
|
- name: nvidia.com/gpu
|
||||||
|
replicas: 4
|
||||||
|
|
||||||
|
daemonsets:
|
||||||
|
tolerations:
|
||||||
|
- key: "sku"
|
||||||
|
operator: Equal
|
||||||
|
value: "gpu"
|
||||||
|
effect: NoSchedule
|
||||||
|
- key: "kubernetes.azure.com/scalesetpriority"
|
||||||
|
operator: Equal
|
||||||
|
value: "spot"
|
||||||
|
effect: NoSchedule
|
||||||
|
|
||||||
|
node-feature-discovery:
|
||||||
|
master:
|
||||||
|
tolerations:
|
||||||
|
- key: "sku"
|
||||||
|
operator: Equal
|
||||||
|
value: "gpu"
|
||||||
|
effect: NoSchedule
|
||||||
|
- key: "kubernetes.azure.com/scalesetpriority"
|
||||||
|
operator: Equal
|
||||||
|
value: "spot"
|
||||||
|
effect: NoSchedule
|
||||||
|
worker:
|
||||||
|
tolerations:
|
||||||
|
- key: "sku"
|
||||||
|
operator: Equal
|
||||||
|
value: "gpu"
|
||||||
|
effect: NoSchedule
|
||||||
|
- key: "kubernetes.azure.com/scalesetpriority"
|
||||||
|
operator: Equal
|
||||||
|
value: "spot"
|
||||||
|
effect: NoSchedule
|
Loading…
Add table
Reference in a new issue