@_j I think you misunderstood the problem, my regression is about passing images as part of “function” or “system” type of messages. Your example is using “user” type of messages which do not have any problem.
Example:
{
"model": "gpt-4o",
"temperature": 0,
"top_p": 1,
"frequency_penalty": 0,
"presence_penalty": 0,
"max_tokens": 4096,
"n": 1,
"stream": false,
"tools": [
{
"type": "function",
"function": {
"name": "navigate-to-website",
"description": "useful for when you need to find something on or summarize a webpage.",
"parameters": {
"type": "object",
"properties": {
"url": {
"type": "string",
"description": "The url to navigate to."
},
"keywords": {
"type": "array",
"items": {
"type": "string"
},
"description": "keywords representing what you want to find."
},
"searchDescription": {
"type": "string",
"description": "a long and detailed description of what do expect to find in the page."
}
},
"required": [
"url",
"keywords",
"searchDescription"
],
"additionalProperties": false,
"$schema": "http://json-schema.org/draft-07/schema#"
}
}
}
],
"messages": [
{
"role": "user",
"content": [
{
"type": "text",
"text": "Navigate to google.com website."
}
]
},
{
"role": "assistant",
"content": "",
"function_call": {
"name": "navigate-to-website",
"arguments": "{\"url\":\"https://www.google.com\",\"keywords\":[]}"
}
},
{
"role": "function",
"content": [
{
"type": "image_url",
"image_url": {
"url": "data:image/png;base64,.....",
"detail": "high"
}
}
],
"name": "navigate-to-website"
}
]
}
This same request used to work on the gpt-4-turbo model.