# GPU assignment overrides for four components: nim-llm, vss, nemo-embedding
# and nemo-rerank (presumably Helm sub-chart values -- confirm against the
# consuming chart).
#
# Each component is given a disjoint set of GPU indices through the
# NVIDIA_VISIBLE_DEVICES environment variable:
#   nim-llm         0,1,2,3
#   vss             4,5
#   nemo-embedding  6
#   nemo-rerank     7
# Every nvidia.com/gpu limit is set to 0 ("no limit" per the original author).
#
# NOTE(review): this file was reconstructed from a whitespace-collapsed copy.
# For vss, nemo-embedding and nemo-rerank the `resources` key is placed as a
# sibling of `applicationSpecs`; verify that nesting against the chart schema.

nim-llm:
  env:
    - name: NVIDIA_VISIBLE_DEVICES
      value: "0,1,2,3"
  resources:
    limits:
      nvidia.com/gpu: 0  # no limit

vss:
  applicationSpecs:
    vss-deployment:
      containers:
        vss:
          env:
            - name: VLM_MODEL_TO_USE
              value: vila-1.5
            - name: MODEL_PATH
              value: "ngc:nim/nvidia/vila-1.5-40b:vila-yi-34b-siglip-stage3_1003_video_v8"
            - name: NVIDIA_VISIBLE_DEVICES
              value: "4,5"
            # Quoted so the value stays the string "true", not a YAML boolean.
            - name: DISABLE_GUARDRAILS
              value: "true"
  resources:
    limits:
      nvidia.com/gpu: 0  # no limit

nemo-embedding:
  applicationSpecs:
    embedding-deployment:
      containers:
        embedding-container:
          env:
            # Read from the ngc-api-key-secret secret rather than inlined here.
            - name: NGC_API_KEY
              valueFrom:
                secretKeyRef:
                  key: NGC_API_KEY
                  name: ngc-api-key-secret
            # Quoted so the GPU index is passed as a string, not an integer.
            - name: NVIDIA_VISIBLE_DEVICES
              value: "6"
  resources:
    limits:
      nvidia.com/gpu: 0  # no limit

nemo-rerank:
  applicationSpecs:
    ranking-deployment:
      containers:
        ranking-container:
          env:
            # Read from the ngc-api-key-secret secret rather than inlined here.
            - name: NGC_API_KEY
              valueFrom:
                secretKeyRef:
                  key: NGC_API_KEY
                  name: ngc-api-key-secret
            # Quoted so the GPU index is passed as a string, not an integer.
            - name: NVIDIA_VISIBLE_DEVICES
              value: "7"
  resources:
    limits:
      nvidia.com/gpu: 0  # no limit