vLLM Backend
case "vllm":
self.llms.append(OpenAI(
base_url=config.hostname,
api_key="sk-1234" # Dummy API key
))
case "sglang":
self.llms.append(OpenAI(
base_url=config.hostname,
api_key="sk-1234" # Dummy API key
))

completed_response = model.chat.completions.create(
model=model_name,
**completion_kwargs
)
return completed_response.choices[0].message.content, True

Last updated