mirror of
https://github.com/remsky/Kokoro-FastAPI.git
synced 2025-08-31 21:59:28 +00:00
Add example folder values files for Azure AKS and Nvidia GPU Operator
This commit is contained in:
parent
14bd6a8118
commit
3c8e1b9143
2 changed files with 57 additions and 1 deletions
|
@ -19,7 +19,7 @@
|
|||
# --skip-gpu-driver-install
|
||||
|
||||
kokoroTTS:
|
||||
replicaCount: 2
|
||||
replicaCount: 8
|
||||
port: 8880
|
||||
tag: v0.2.0
|
||||
pullPolicy: IfNotPresent
|
56
charts/kokoro-fastapi/examples/gpu-operator-values.yaml
Normal file
56
charts/kokoro-fastapi/examples/gpu-operator-values.yaml
Normal file
|
@ -0,0 +1,56 @@
|
|||
# Follow the official NVIDIA GPU Operator documentation
|
||||
# to install the GPU operator with these settings:
|
||||
# https://docs.nvidia.com/datacenter/cloud-native/gpu-operator/latest/getting-started.html
|
||||
#
|
||||
# This example is for an NVIDIA T4 16 GB GPU node pool with only 1 GPU on each node on Azure AKS.
|
||||
# It uses time-slicing to share the GPU and advertises each physical GPU to the cluster as 4 GPUs.
|
||||
# So up to 4 pods can share one GPU (roughly 4 GB of memory each if used evenly; time-slicing does not enforce memory isolation).
|
||||
#
|
||||
devicePlugin: # Remove this section if you don't want to use time-slicing
|
||||
config:
|
||||
create: true
|
||||
name: "time-slicing-config"
|
||||
default: "any"
|
||||
data:
|
||||
any: |-
|
||||
version: v1
|
||||
flags:
|
||||
migStrategy: none
|
||||
sharing:
|
||||
timeSlicing:
|
||||
resources:
|
||||
- name: nvidia.com/gpu
|
||||
replicas: 4
|
||||
|
||||
daemonsets:
|
||||
tolerations:
|
||||
- key: "sku"
|
||||
operator: Equal
|
||||
value: "gpu"
|
||||
effect: NoSchedule
|
||||
- key: "kubernetes.azure.com/scalesetpriority"
|
||||
operator: Equal
|
||||
value: "spot"
|
||||
effect: NoSchedule
|
||||
|
||||
node-feature-discovery:
|
||||
master:
|
||||
tolerations:
|
||||
- key: "sku"
|
||||
operator: Equal
|
||||
value: "gpu"
|
||||
effect: NoSchedule
|
||||
- key: "kubernetes.azure.com/scalesetpriority"
|
||||
operator: Equal
|
||||
value: "spot"
|
||||
effect: NoSchedule
|
||||
worker:
|
||||
tolerations:
|
||||
- key: "sku"
|
||||
operator: Equal
|
||||
value: "gpu"
|
||||
effect: NoSchedule
|
||||
- key: "kubernetes.azure.com/scalesetpriority"
|
||||
operator: Equal
|
||||
value: "spot"
|
||||
effect: NoSchedule
|
Loading…
Add table
Reference in a new issue