# Chat-completion request to the nscale inference endpoint.
#
# Sends one user message ("What is the weather in Paris?") to the
# meta-llama/Llama-3.1-8B-Instruct model and declares a single function tool,
# get_weather, which takes one required string parameter, "city".
#
# <token> looks like a placeholder for a real API token -- substitute your own
# before running.
#
# The payload is single-quoted, so the shell passes it to curl untouched: the
# backslash-n in "stop" reaches the server as a JSON escape sequence rather
# than as a literal line break.
curl -X POST \
  -H 'Authorization: Bearer <token>' \
  -H 'Content-Type: application/json; charset=utf-8' \
  -d '{
"frequency_penalty": 0,
"logit_bias": null,
"logprobs": false,
"max_completion_tokens": 100,
"max_tokens": 100,
"messages": [
{
"content": "What is the weather in Paris?",
"role": "user"
}
],
"model": "meta-llama/Llama-3.1-8B-Instruct",
"n": 1,
"presence_penalty": 0,
"seed": 42,
"stop": "\n",
"stream": false,
"stream_options": null,
"temperature": 1,
"tool_choice": "auto",
"tools": [
{
"function": {
"description": "Get the weather for a city",
"name": "get_weather",
"parameters": {
"properties": {
"city": {
"description": "City name",
"type": "string"
}
},
"required": [
"city"
],
"type": "object"
}
},
"type": "function"
}
],
"top_logprobs": 0,
"top_p": 1
}' \
  https://inference.api.nscale.com/v1/chat/completions