NOTE(review): hunk indentation below was reconstructed from a whitespace-collapsed copy; confirm it against hr.yaml before applying.
diff --git a/kube/deploy/apps/mlc-llm/app/hr.yaml b/kube/deploy/apps/mlc-llm/app/hr.yaml
index 366a69a0..6fcc0b7a 100644
--- a/kube/deploy/apps/mlc-llm/app/hr.yaml
+++ b/kube/deploy/apps/mlc-llm/app/hr.yaml
@@ -75,6 +75,7 @@ spec:
               limits:
                 cpu: "1000m"
                 memory: "2Gi"
+                gpu.intel.com/i915: "1"
     service:
       mlc-llm:
         controller: mlc-llm