---
# Service "vllm": a cluster-internal endpoint in front of the pods labelled
# `component: inference`.
apiVersion: v1
kind: Service
metadata:
  name: vllm
spec:
  # ClusterIP allocates a virtual IP that is reachable only inside the cluster.
  type: ClusterIP
  # Traffic is routed to pods carrying this label.
  selector:
    component: inference
  ports:
    - name: http
      # Port exposed on the Service itself.
      port: 8000
      # Named target port: resolved against the container port called "http"
      # on each selected pod, so the pod spec must declare a port of that name.
      targetPort: http