"""Chute definition that serves ``ronx-labs/affine-081410`` via the vLLM template.

Importing this module builds the module-level ``chute`` object by calling
``build_vllm_chute``; it also sets ``NO_PROXY`` in the process environment.
"""

import os

from chutes.chute import NodeSelector
from chutes.chute.template.vllm import build_vllm_chute

# Set before the chute is built. Presumably this keeps requests to the local
# host from being routed through a configured HTTP proxy -- confirm against
# the deployment environment.
os.environ["NO_PROXY"] = "localhost,127.0.0.1"

chute = build_vllm_chute(
    username="achoji",
    # The readme field carries the same repository identifier as model_name.
    readme="ronx-labs/affine-081410",
    model_name="ronx-labs/affine-081410",
    image="chutes/vllm_gptoss:0.10.1.dev5",
    concurrency=16,
    # Looks like a full 40-character commit hash pinning the model revision
    # -- verify against the model repository.
    revision="606d2f4e4f62a2d549de4daa8c602930dcae3e51",
    # Hardware request; going by the parameter names, 8 GPUs with at least
    # 24 GB of VRAM each.
    node_selector=NodeSelector(
        gpu_count=8,
        min_vram_gb_per_gpu=24,
    ),
)