Reorganized for new stable/waypoint versioning design.

This commit is contained in:
2026-05-24 18:28:47 +00:00
parent 945d2225a2
commit bc7a168851
352 changed files with 1264 additions and 294 deletions

View File

@@ -0,0 +1,15 @@
# App manifest: release version, dependencies, default configuration values,
# and default secrets.
# NOTE(review): version looks like <upstream version>-<packaging revision>;
# confirm. Quoted so it is always read as a string.
version: '0.5.4-1'
# Empty list: nothing is declared as required.
requires: []
# Default settings. The keys below are nested so that defaultConfig is a
# mapping; a bare `defaultConfig:` with nothing indented under it parses as
# null and would leave these settings as unrelated top-level keys.
defaultConfig:
  namespace: llm
  model: Qwen/Qwen2.5-7B-Instruct
  # presumably the maximum context length in tokens; confirm against consumer
  maxModelLen: 8192
  # presumably the fraction of GPU memory the server may use; confirm
  gpuMemoryUtilization: 0.9
  gpuProduct: RTX 4090
  # CPU values are quoted so they stay strings rather than integers.
  cpuRequest: '4'
  cpuLimit: '8'
  memoryRequest: 16Gi
  memoryLimit: 24Gi
  gpuCount: 1
  # Templated value; quoted so the rendered result is always a YAML string.
  domain: 'vllm.{{ .cloud.domain }}'
# Empty list: no default secrets are declared.
defaultSecrets: []