# application-serve-mistral-7b.yaml
---
# Argo CD Application "serve-mistral-7b", registered in the openshift-gitops
# namespace. It points Argo CD at the Helm source under gitops/model of the
# model-serving-utils repository (branch main) and passes the inline values
# below to it.
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  labels:
    app: serve-mistral-7b
  name: serve-mistral-7b
  namespace: openshift-gitops
spec:
  destination:
    # In-cluster API server. No destination namespace is declared here.
    # NOTE(review): CreateNamespace=true (see syncOptions) acts on
    # spec.destination.namespace; with none set, presumably the chart creates
    # its own namespace from dataScienceProjectNamespace - confirm.
    server: 'https://kubernetes.default.svc'
  project: default
  source:
    path: gitops/model
    repoURL: https://github.com/alvarolop/model-serving-utils.git
    targetRevision: main
    helm:
      # Inline Helm values, handed to the chart as one literal string.
      # NOTE(review): the nesting of runtime / image / accelerator inside
      # `model` was reconstructed from key order - verify against the chart's
      # values.yaml before relying on it.
      values: |
        dataScienceProjectDisplayName: mistral-7b
        dataScienceProjectNamespace: mistral-7b
        instanceName: mistral-7b
        model:
          root: mistralai
          id: Mistral-7B-Instruct-v0.2
          name: mistral-7b
          displayName: Mistral 7b
          # additionalLabels:
          #   networking.knative.dev/visibility: cluster-local
          toolCallParser: mistral
          maxModelLen: '6144'
          runtime:
            resources:
              limits:
                cpu: '8'
                memory: 24Gi
              requests:
                cpu: '6'
                memory: 24Gi
            image: quay.io/modh/vllm@sha256:c86ff1e89c86bc9821b75d7f2bbc170b3c13e3ccf538bf543b1110f23e056316
          accelerator:
            productName: NVIDIA-A10G-SHARED
  syncPolicy:
    # Automated sync is enabled, but pruning of removed resources and
    # self-healing of live drift are both switched off.
    automated:
      prune: false
      selfHeal: false
    syncOptions:
      - CreateNamespace=true