---
# Deployment "fast-whisper" in namespace "api-ns".
# Runs a single replica of the fedirz/faster-whisper-server CUDA image,
# listening on container port 8000 and limited to one NVIDIA GPU.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: fast-whisper
  namespace: api-ns
  labels:
    app: fast-whisper
spec:
  replicas: 1
  # The selector must match the pod template labels below.
  selector:
    matchLabels:
      app: fast-whisper
  template:
    metadata:
      labels:
        app: fast-whisper
    spec:
      # Run the pod with the RuntimeClass named "nvidia"; that RuntimeClass
      # must already exist in the cluster.
      runtimeClassName: nvidia
      containers:
        - name: fast-whisper
          # NOTE(review): "latest-cuda" is a mutable tag; consider pinning a
          # specific version or digest for reproducible rollouts.
          image: fedirz/faster-whisper-server:latest-cuda
          ports:
            - containerPort: 8000
          resources:
            limits:
              # Extended resources such as GPUs are specified under limits.
              nvidia.com/gpu: 1
          env:
            # Env values must be strings, so the number stays quoted.
            # NOTE(review): presumably a no-data timeout in seconds for the
            # server; confirm against the faster-whisper-server docs.
            - name: MAX_NO_DATA_SECONDS
              value: "100.0"