phi4mm
Runnable HTTP server example for phi4mm.
from openai import OpenAIimport httpximport textwrapimport json
def log_response(response: httpx.Response) -> None:
    """Print a redacted summary of an HTTP request/response pair to stdout.

    Shaped to be usable as an httpx ``response`` event hook. The request's
    method, URL, headers and body are printed first, followed by the
    response's status code and headers.

    Sensitive header values are masked before printing:

    * ``Authorization`` (request) is replaced with ``[...]``.
    * ``Cookie`` (request) and ``Set-Cookie`` (response) keep only the text
      before the first ``=``, followed by ``=...``.

    The request body is pretty-printed as JSON when it parses as JSON.
    Otherwise it is printed as text, with undecodable bytes replaced so that
    a binary body cannot make the logging hook raise.

    Args:
        response: The response to describe; its ``request`` attribute
            supplies the request half of the exchange.
    """
    request = response.request

    print(f"Request: {request.method} {request.url}")
    print(" Headers:")
    for key, value in request.headers.items():
        lowered = key.lower()
        if lowered == "authorization":
            value = "[...]"
        if lowered == "cookie":
            value = value.split("=")[0] + "=..."
        print(f" {key}: {value}")

    print(" Body:")
    raw_body = request.content
    try:
        body_text = json.dumps(json.loads(raw_body), indent=2)
    except (json.JSONDecodeError, UnicodeDecodeError):
        # json.loads raises UnicodeDecodeError (not JSONDecodeError) when the
        # bytes are not valid text, so both must be caught; decode leniently
        # so the fallback itself cannot fail on the same bytes.
        body_text = raw_body.decode(errors="replace")
    print(textwrap.indent(body_text, " "))

    print(f"Response: status_code={response.status_code}")
    print(" Headers:")
    for key, value in response.headers.items():
        if key.lower() == "set-cookie":
            value = value.split("=")[0] + "=..."
        print(f" {key}: {value}")
# Client pointed at the server on localhost:1234; the API key is the dummy
# string "foobar".
client = OpenAI(
    api_key="foobar",
    base_url="http://localhost:1234/v1/",
)

# Enable this to log requests and responses
# client._client = httpx.Client(
#     event_hooks={"request": [print], "response": [log_response]}
# )

# A single user turn: the image (referenced by URL) first, then the text
# prompt asking about it.
user_content = [
    {
        "type": "image_url",
        "image_url": {
            "url": "https://www.nhmagazine.com/content/uploads/2019/05/mtwashingtonFranconia-2-19-18-108-Edit-Edit.jpg"
        },
    },
    {
        "type": "text",
        "text": "What is shown in this image? Write a detailed response analyzing the scene.",
    },
]

completion = client.chat.completions.create(
    model="default",
    messages=[{"role": "user", "content": user_content}],
    max_tokens=256,
    frequency_penalty=1.0,
    top_p=0.1,
    temperature=0,
)

# Print the text of the first returned choice.
resp = completion.choices[0].message.content
print(resp)

# Source: examples/server/phi4mm.py