first commit

This commit is contained in:
2026-05-28 07:21:15 +00:00
commit 6465520041
57 changed files with 942 additions and 0 deletions

View File

@ -0,0 +1,19 @@
# JSON Patch (RFC 6902) operations against the first container (index 0) of a
# pod template: two positional argument overrides followed by CPU/memory
# requests and limits.
#
# NOTE(review): container args are addressed by list position, so indices 5 and
# 7 must line up with the argument order of the manifest being patched.
# Re-check them whenever the base args change; "replace" also requires that
# every target path already exists.

# Presumably the model identifier passed to the server — TODO confirm which
# flag precedes args/5 in the base manifest.
- op: replace
  path: /spec/template/spec/containers/0/args/5
  value: Qwen/Qwen2.5-7B-Instruct
# Presumably the name the model is served under — TODO confirm against base.
- op: replace
  path: /spec/template/spec/containers/0/args/7
  value: qwen2-5-7b

# Resource requests. CPU counts are quoted so they stay strings.
- op: replace
  path: /spec/template/spec/containers/0/resources/requests/cpu
  value: "4"
- op: replace
  path: /spec/template/spec/containers/0/resources/requests/memory
  value: 24Gi

# Resource limits (twice the requested CPU and memory).
- op: replace
  path: /spec/template/spec/containers/0/resources/limits/cpu
  value: "8"
- op: replace
  path: /spec/template/spec/containers/0/resources/limits/memory
  value: 48Gi

View File

@ -0,0 +1,12 @@
# Opaque Secret named "vllm-secrets" carrying a single key, hfToken.
apiVersion: v1
kind: Secret
metadata:
  name: vllm-secrets
  labels:
    app.kubernetes.io/name: vllm-server
    app.kubernetes.io/component: auth
    app.kubernetes.io/part-of: ocdp-workload
type: Opaque
# stringData takes plain (non-base64) values.
stringData:
  # NOTE(review): intentionally empty placeholder as committed. Presumably the
  # real token is injected by a generation step outside version control —
  # confirm, and never commit a populated value here.
  hfToken: ""

View File

@ -0,0 +1,22 @@
# Kustomize overlay: builds the vllm-server base plus a local secret manifest,
# layers three components on top, and applies two patch files.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization

# Every resource is placed in this namespace and gets "-test" appended to its
# name.
namespace: ocdp-workload-test
# Quoted because the value begins with "-", a YAML indicator character.
nameSuffix: "-test"

resources:
  - ../../../apps/vllm-server/base
  - generated-secret.yaml

components:
  - ../../../apps/vllm-server/components/gpu-nvidia
  - ../../../apps/vllm-server/components/pvc-cache
  - ../../../apps/vllm-server/components/service-loadbalancer

patches:
  # Applied to the apps/v1 Deployment named "vllm-server".
  - path: deployment-patch.yaml
    target:
      group: apps
      version: v1
      kind: Deployment
      name: vllm-server
  # Applied to the PersistentVolumeClaim named "vllm-cache".
  - path: pvc-patch.yaml
    target:
      kind: PersistentVolumeClaim
      name: vllm-cache

View File

@ -0,0 +1,4 @@
# JSON Patch (RFC 6902): sets the requested storage size to 200Gi.
# "replace" requires /spec/resources/requests/storage to already exist on the
# resource being patched.
- op: replace
  path: /spec/resources/requests/storage
  value: 200Gi