Hi, I am sending the following request:
{
"model": "gpt-3.5-turbo-1106",
"messages": [
{
"role": "user",
"content": [
{
"type": "text",
"text": "What is the time now?"
}
]
}
],
"temperature": 0.0,
"tools": [
{
"type": "function",
"function": {
"name": "check_watch",
"description": "returns current time",
"parameters": {
"type": "object",
"properties": {},
"required": []
}
}
}
]
}
And getting two different completion_tokens
calculations for the same responses. Sometimes it is 10, sometimes 27:
{
"id": "chatcmpl-8T4fbHQI5v8fhQEgm4uY6UDzzrFgg",
"object": "chat.completion",
"created": 1701940155,
"model": "gpt-3.5-turbo-1106",
"choices": [
{
"index": 0,
"message": {
"role": "assistant",
"content": null,
"tool_calls": [
{
"id": "call_2b39dQtuHVAX17Yx610fFpSe",
"type": "function",
"function": {
"name": "check_watch",
"arguments": "{}"
}
}
]
},
"finish_reason": "tool_calls"
}
],
"usage": {
"prompt_tokens": 42,
"completion_tokens": 10,
"total_tokens": 52
},
"system_fingerprint": "fp_eeff13170a"
}
{
"id": "chatcmpl-8T4fssaSPN74eSQQO7gZ47gPw0XvF",
"object": "chat.completion",
"created": 1701940172,
"model": "gpt-3.5-turbo-1106",
"choices": [
{
"index": 0,
"message": {
"role": "assistant",
"content": null,
"tool_calls": [
{
"id": "call_dQQJHC4zaBj8DwHUtEwtNHzs",
"type": "function",
"function": {
"name": "check_watch",
"arguments": "{}"
}
}
]
},
"finish_reason": "tool_calls"
}
],
"usage": {
"prompt_tokens": 42,
"completion_tokens": 27,
"total_tokens": 69
},
"system_fingerprint": "fp_eeff13170a"
}