qwen3_vl
A runnable Python SDK example for the Qwen3-VL model (`qwen3_vl`).
from mistralrs import Runner, Which, ChatCompletionRequest, MultimodalArchitecture
# Hugging Face-style model identifier passed to the runner below.
MODEL_ID = "Qwen/Qwen3-VL-4B-Thinking"

# Build the runner from a plain multimodal model selection that uses the
# Qwen3VL architecture.
runner = Runner(
    which=Which.MultimodalPlain(
        model_id=MODEL_ID,
        arch=MultimodalArchitecture.Qwen3VL,
    ),
)
# Send one chat completion request whose single user message carries two
# content parts: an image (referenced by URL) and a text question about it.
res = runner.send_chat_completion_request(
    ChatCompletionRequest(
        model="default",
        messages=[
            {
                "role": "user",
                "content": [
                    {
                        "type": "image_url",
                        "image_url": {
                            "url": "https://www.garden-treasures.com/cdn/shop/products/IMG_6245.jpg"
                        },
                    },
                    {
                        "type": "text",
                        "text": "What type of flower is this? Give some fun facts.",
                    },
                ],
            }
        ],
        # Generation limit and sampling settings for this request.
        max_tokens=256,
        presence_penalty=1.0,
        top_p=0.1,
        temperature=0.1,
    )
)

# Print the text of the first returned choice, then the usage object
# reported on the response.
print(res.choices[0].message.content)
print(res.usage)

# Source: examples/python/qwen3_vl.py