# k8s/ai/tei/deploy.yaml
# Deployment: runs a single replica of the Hugging Face Text Embeddings
# Inference (TEI) CPU image in the `ml` namespace, serving the model named
# by MODEL_ID on container port 80.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: tei
  namespace: ml
spec:
  replicas: 1
  selector:
    matchLabels:
      app: tei
  template:
    metadata:
      labels:
        app: tei
    spec:
      containers:
        - name: tei
          # NOTE(review): `cpu-latest` is a mutable tag. Kubernetes only
          # defaults imagePullPolicy to Always for the exact tag `latest`,
          # so nodes may keep running whatever build they cached first.
          # Consider pinning a versioned tag or digest.
          image: ghcr.io/huggingface/text-embeddings-inference:cpu-latest
          env:
            - name: MODEL_ID
              value: "mixedbread-ai/mxbai-embed-large-v1"
          ports:
            - containerPort: 80
          # Keep the pod out of the Service endpoints until the server
          # answers its health route, so requests are not routed to a
          # container that is still starting up.
          readinessProbe:
            httpGet:
              path: /health
              port: 80
            periodSeconds: 10
            failureThreshold: 3
---
# Service: exposes pods labelled `app: tei` in the `ml` namespace on port 80,
# forwarding to container port 80. No `type` is set, so the cluster default
# Service type applies.
apiVersion: v1
kind: Service
metadata:
  name: tei
  namespace: ml
spec:
  selector:
    app: tei
  ports:
    - port: 80
      targetPort: 80
---
# Ingress: routes every path under embeddings.betelgeusebytes.io to the `tei`
# Service on port 80 through the `nginx` ingress class. TLS uses the
# `tei-tls` secret; the cert-manager annotation names the
# `letsencrypt-prod` cluster issuer.
# NOTE(review): no authentication or allow-list annotation is visible here —
# confirm the embeddings API is meant to be reachable without credentials.
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
  name: tei
  namespace: ml
  annotations:
    cert-manager.io/cluster-issuer: letsencrypt-prod
spec:
  ingressClassName: nginx
  tls:
    - hosts:
        - embeddings.betelgeusebytes.io
      secretName: tei-tls
  rules:
    - host: embeddings.betelgeusebytes.io
      http:
        paths:
          - path: /
            pathType: Prefix
            backend:
              service:
                name: tei
                port:
                  number: 80