# File size: 497 Bytes (revision 2c59142)
import os
from chutes.chute import NodeSelector
from chutes.chute.template.vllm import build_vllm_chute
# Exclude loopback addresses from proxying (standard NO_PROXY convention).
# NOTE(review): presumably needed so in-container calls to the local server
# bypass any configured proxy -- confirm against the deployment environment.
os.environ["NO_PROXY"] = "localhost,127.0.0.1"

# Single repository identifier, passed as both the model name and the README
# reference below (the original used the same literal for both).
_MODEL_REPO = "ronx-labs/affine-081410"

# Hardware request handed to the chute builder: 8 GPUs, each with at least
# 24 GB of VRAM, as expressed by the keyword names.
_NODE_SELECTOR = NodeSelector(
    gpu_count=8,
    min_vram_gb_per_gpu=24,
)

# Chute definition built from the vLLM template. `revision` is a full commit
# hash -- presumably pinning the exact model snapshot; verify against the
# template's documentation.
chute = build_vllm_chute(
    username="achoji",
    model_name=_MODEL_REPO,
    readme=_MODEL_REPO,
    revision="606d2f4e4f62a2d549de4daa8c602930dcae3e51",
    image="chutes/vllm_gptoss:0.10.1.dev5",
    concurrency=16,
    node_selector=_NODE_SELECTOR,
)
|