Version: v0.4.0

remote::vllm

Description

Remote vLLM inference provider for connecting to vLLM servers.

Configuration

| Field | Type | Required | Default | Description |
|-------|------|----------|---------|-------------|
| `allowed_models` | `list[str] \| None` | No | | List of models that should be registered with the model registry. If `None`, all models are allowed. |
| `refresh_models` | `bool` | No | `False` | Whether to refresh models periodically from the provider. |
| `api_token` | `SecretStr \| None` | No | | The API token. |
| `base_url` | `HttpUrl \| None` | No | | The URL for the vLLM model serving endpoint. |
| `max_tokens` | `int` | No | `4096` | Maximum number of tokens to generate. |
| `tls_verify` | `bool \| str` | No | `True` | Whether to verify TLS certificates. Can be a boolean or a path to a CA certificate file. |

Sample Configuration

```yaml
base_url: ${env.VLLM_URL:=}
max_tokens: ${env.VLLM_MAX_TOKENS:=4096}
api_token: ${env.VLLM_API_TOKEN:=fake}
tls_verify: ${env.VLLM_TLS_VERIFY:=true}
```
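In the sample above, `${env.VAR:=default}` substitutes the value of an environment variable, falling back to the default after `:=` when the variable is unset. A minimal sketch of exporting these variables before starting the stack; the URL and token values are illustrative placeholders, not values prescribed by this provider:

```shell
# Illustrative values only; point VLLM_URL at your own vLLM server's
# OpenAI-compatible endpoint (vLLM typically serves it under /v1).
export VLLM_URL=http://localhost:8000/v1
export VLLM_MAX_TOKENS=4096
# A placeholder token; only meaningful if the vLLM server enforces one.
export VLLM_API_TOKEN=fake
export VLLM_TLS_VERIFY=true
```

Any variable left unset simply falls back to the default shown in the sample configuration (for example, `max_tokens` falls back to `4096`).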