API Reference

This documentation provides detailed information about all available endpoints in the CompactifAI API.

Base URL

All API requests should be made to:

https://api.compactif.ai/v1

Authentication

All API requests require authentication. See our Authentication guide for details.

Response Formats

Unless noted otherwise, responses are returned in JSON format (one exception: Audio Transcriptions with response_format=text returns plain text). Every response consists of:

HTTP status code in the response header
Response body containing requested data or error details

Models

List Models

GET /models

Returns a list of available models.

Example Request

curl https://api.compactif.ai/v1/models \
-H "Authorization: Bearer YOUR_API_KEY"

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/models"

headers = {
  "Authorization": f"Bearer {api_key}"
}

response = requests.get(url, headers=headers)
print(response.json())

async function listModels() {
const response = await fetch('https://api.compactif.ai/v1/models', {
  method: 'GET',
  headers: {
    'Authorization': 'Bearer YOUR_API_KEY'
  }
});

const data = await response.json();
console.log(data);
}

listModels();

Example Response

{
  "object": "list",
  "data": [
    {
      "id": "llama-4-scout",
      "created": 1749600000,
      "object": "model",
      "owned_by": "meta",
      "parameters_number": "108B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "llama-3-1-8b",
      "created": 1749600000,
      "object": "model",
      "owned_by": "meta",
      "parameters_number": "8B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": false
      }
    },
    {
      "id": "cai-llama-3-3-70b-slim",
      "created": 1749600000,
      "object": "model",
      "owned_by": "multiverse_computing",
      "parameters_number": "35B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": false
      }
    },
    {
      "id": "llama-3-3-70b",
      "created": 1749600000,
      "object": "model",
      "owned_by": "meta",
      "parameters_number": "70B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": false
      }
    },
    {
      "id": "mistral-small-3-1",
      "created": 1749600000,
      "object": "model",
      "owned_by": "mistralai",
      "parameters_number": "24B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": true,
        "supports_function_calling": false,
        "support_chat_completion": true,
        "supports_responses": false
      }
    },
    {
      "id": "cai-mistral-small-3-1-slim",
      "created": 1759492927,
      "object": "model",
      "owned_by": "multiverse_computing",
      "parameters_number": "12B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": true,
        "supports_function_calling": false,
        "support_chat_completion": true,
        "supports_responses": false
      }
    },
    {
      "id": "nemotron-3-nano-omni",
      "created": 1749600000,
      "object": "model",
      "owned_by": "nvidia",
      "parameters_number": "31B",
      "capabilities": {
        "supports_audio": true,
        "supports_image": true,
        "supports_function_calling": false,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "gpt-oss-20b",
      "created": 1754488130,
      "object": "model",
      "owned_by": "openai",
      "parameters_number": "20B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "gpt-oss-120b",
      "created": 1754488130,
      "object": "model",
      "owned_by": "openai",
      "parameters_number": "120B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "whisper-large-v3",
      "created": 1749600000,
      "object": "model",
      "owned_by": "openai",
      "parameters_number": "1.5B",
      "capabilities": {
        "supports_audio": true,
        "supports_image": false,
        "supports_function_calling": false,
        "support_chat_completion": false,
        "supports_responses": false
      }
    },
    {
      "id": "cai-whisper-large-v3-turbo-slim",
      "created": 1749600000,
      "object": "model",
      "owned_by": "multiverse_computing",
      "parameters_number": "0.4B",
      "capabilities": {
        "supports_audio": true,
        "supports_image": false,
        "supports_function_calling": false,
        "support_chat_completion": false,
        "supports_responses": false
      }
    },
    {
      "id": "hypernova-60b",
      "created": 1753892192,
      "object": "model",
      "owned_by": "multiverse_computing",
      "parameters_number": "60B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "blackstar-10b",
      "created": 1753892192,
      "object": "model",
      "owned_by": "multiverse_computing",
      "parameters_number": "10B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": false,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "glm-5-1",
      "created": 1753892192,
      "object": "model",
      "owned_by": "zai-org",
      "parameters_number": "754B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    },
    {
      "id": "glm-5-2",
      "created": 1753892192,
      "object": "model",
      "owned_by": "zai-org",
      "parameters_number": "754B",
      "capabilities": {
        "supports_audio": false,
        "supports_image": false,
        "supports_function_calling": true,
        "support_chat_completion": true,
        "supports_responses": true
      }
    }
  ]
}

The above response is an example list of models which might be out of date. Please refer to the available models table on the models catalog page for the full list of our latest models.

Retrieve Model

GET /models/{model_id}

Retrieves information about a specific model.

Path Parameters

Parameter	Type	Required	Description
model_id	string	Yes	The ID of the model to retrieve

Example Request

curl https://api.compactif.ai/v1/models/hypernova-60b \
-H "Authorization: Bearer YOUR_API_KEY"

import requests

api_key = "YOUR_API_KEY"
model_id = "hypernova-60b"
url = f"https://api.compactif.ai/v1/models/{model_id}"

headers = {
  "Authorization": f"Bearer {api_key}"
}

response = requests.get(url, headers=headers)
print(response.json())

async function getModel() {
const modelId = 'hypernova-60b';
const response = await fetch(`https://api.compactif.ai/v1/models/${modelId}`, {
  method: 'GET',
  headers: {
    'Authorization': 'Bearer YOUR_API_KEY'
  }
});

const data = await response.json();
console.log(data);
}

getModel();

Example Response

{
  "id": "hypernova-60b",
  "created": 1753892192,
  "object": "model",
  "owned_by": "multiverse_computing",
  "parameters_number": "60B",
  "capabilities": {
    "supports_audio": false,
    "supports_image": false,
    "supports_function_calling": true,
    "support_chat_completion": true,
    "supports_responses": true
  }
}

Chat Completions

POST /chat/completions

Creates a model response (completion) for the given chat conversation.

Request Body

Parameter	Type	Required	Description
model	string	Yes	ID of the model to use
messages	array	Yes	Array of message objects representing the conversation
temperature	number	No	Sampling temperature (0-2, default 1)
max_tokens	integer	No	Maximum number of tokens to generate
max_completion_tokens	integer	No	Maximum number of tokens to generate in completion (preferred over max_tokens)
min_tokens	integer	No	Minimum number of tokens to generate (default None)
stop	string or array	No	Sequences where the API will stop generating further tokens
frequency_penalty	number	No	Penalizes new tokens based on their frequency in the prompt (default 0.0)
n	integer	No	Number of completions to generate for each prompt (currently only 1 is supported)
stream	boolean	No	Whether to stream back partial progress (default false)
user	string	No	Unique identifier for the end-user
tools	array	No	List of tools (functions, APIs, or actions) the model may call during generation
tool_choice	string	No	Controls tool usage; can be `"auto"`, `"none"`, `"required"`, or a specific function
reasoning_effort	string	No	Constrains effort on reasoning for supported models. Supported values: `"low"`, `"medium"`, `"high"`.
reasoning_enabled	boolean	No	Whether reasoning is enabled for supported models. Note: Models ending in `-r` enable reasoning by default for backwards compatibility.

Messages Format

Each message in the messages array should be an object with the following fields:

Field	Type	Required	Description
role	string	Yes	The role of the message author. One of “system”, “user”, or “assistant”
content	string or array	Yes	Either a plain string, or an array of content parts for multi-modal input

When content is an array, each item is an object with a type and a corresponding payload.

Supported content part types:

text: { "type": "text", "text": "..." }
image_url: { "type": "image_url", "image_url": { "url": "https://..." } } (vision-capable models only)
input_audio: { "type": "input_audio", "input_audio": { "data": "<base64>", "format": "wav" | "mp3" } } (audio-capable models only)

Example Request

curl https://api.compactif.ai/v1/chat/completions -H "Content-Type: application/json" -H "Authorization: Bearer YOUR_API_KEY" -d '{
"model": "hypernova-60b",
"messages": [
  {"role": "system", "content": "You are a helpful assistant."},
  {"role": "user", "content": "What is artificial intelligence?"}
],
"temperature": 0.7,
"max_tokens": 150
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "hypernova-60b",
  "messages": [
      {"role": "system", "content": "You are a helpful assistant."},
      {"role": "user", "content": "What is artificial intelligence?"}
  ],
  "temperature": 0.7,
  "max_tokens": 150
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

async function createChatCompletion() {
const response = await fetch('https://api.compactif.ai/v1/chat/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'hypernova-60b',
    messages: [
      {role: 'system', content: 'You are a helpful assistant.'},
      {role: 'user', content: 'What is artificial intelligence?'}
    ],
    temperature: 0.7,
    max_tokens: 150
  })
});

const data = await response.json();
console.log(data);
}

createChatCompletion();

Example Response (Default)

{
"id": "chatcmpl-123XYZ",
"object": "chat.completion",
"created": 1749600000,
"model": "hypernova-60b",
"choices": [
  {
    "message": {
      "role": "assistant",
      "content": "Artificial intelligence (AI) refers to the simulation of human intelligence in machines that are programmed to think like humans and mimic their actions. The term may also be applied to any machine that exhibits traits associated with a human mind such as learning and problem-solving."
    },
    "finish_reason": "stop",
    "index": 0
  }
],
"usage": {
  "prompt_tokens": 29,
  "completion_tokens": 58,
  "total_tokens": 87
}
}

curl https://api.compactif.ai/v1/chat/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "mistral-small-3-1",
  "messages": [
    {
      "role": "user",
      "content": [
        {
          "type": "text",
          "text": "What is in this image?"
        },
        {
          "type": "image_url",
          "image_url": {
            "url": "https://cdn.britannica.com/86/170586-120-7E23E561/Taj-Mahal-Agra-India.jpg"
          }
        }
      ]
    }
  ]
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "mistral-small-3-1",
  "messages": [
      {
          "role": "user",
          "content": [
              {
                  "type": "text",
                  "text": "What is in this image?"
              },
              {
                  "type": "image_url",
                  "image_url": {
                      "url": "https://cdn.britannica.com/86/170586-120-7E23E561/Taj-Mahal-Agra-India.jpg"
                  }
              }
          ]
      }
  ]
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

async function createImageDescription() {
const response = await fetch('https://api.compactif.ai/v1/chat/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'mistral-small-3-1',
    messages: [
      {
        role: 'user',
        content: [
          {
            type: 'text',
            text: 'What is in this image?'
          },
          {
            type: 'image_url',
            image_url: {
              url: 'https://cdn.britannica.com/86/170586-120-7E23E561/Taj-Mahal-Agra-India.jpg'
            }
          }
        ]
      }
    ]
  })
});

const data = await response.json();
console.log(data);
}

createImageDescription();

Example Response (Image Input)

{
"id": "chatcmpl-ca2af32f-6ba9-4621-803f-1175312f68ba",
"choices": [
  {
    "finish_reason": "stop",
    "index": 0,
    "logprobs": null,
    "message": {
      "content": "The image depicts a serene, natural landscape featuring a wooden boardwalk that extends into the distance. The boardwalk is surrounded by tall, lush green grasses and various types of vegetation. The sky above is a clear blue with scattered, wispy clouds. In the background, there are clusters of trees with green and autumn-colored leaves, suggesting a transition into the fall season. The overall atmosphere of the image is calm and inviting, ideal for a peaceful walk in nature.",
      "refusal": null,
      "role": "assistant",
      "annotations": null,
      "audio": null,
      "function_call": null,
      "tool_calls": [],
      "reasoning_content": null
    },
    "stop_reason": null
  }
],
"created": 1758286672,
"model": "mistral-small-3-1",
"object": "chat.completion",
"service_tier": null,
"system_fingerprint": null,
"usage": {
  "completion_tokens": 97,
  "prompt_tokens": 2199,
  "total_tokens": 2296,
  "completion_tokens_details": null,
  "prompt_tokens_details": null
},
"prompt_logprobs": null,
"kv_transfer_params": null
}

Audio input example (cURL first, then Python):

# 1) base64 encode your audio
#    macOS: base64 -i clip.wav | tr -d '\n'
#    linux: base64 -w 0 clip.wav
#
# 2) send it as input_audio (format must be wav or mp3)
curl https://api.compactif.ai/v1/chat/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "nemotron-3-nano-omni",
  "messages": [
    {
      "role": "user",
      "content": [
        { "type": "text", "text": "What is this audio about?" },
        {
          "type": "input_audio",
          "input_audio": { "data": "BASE64_AUDIO_HERE", "format": "wav" }
        }
      ]
    }
  ],
  "max_tokens": 256
}'

import base64
import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

with open("clip.wav", "rb") as f:
  audio_b64 = base64.b64encode(f.read()).decode("ascii")

data = {
  "model": "nemotron-3-nano-omni",
  "messages": [
      {
          "role": "user",
          "content": [
              {"type": "text", "text": "What is this audio about?"},
              {"type": "input_audio", "input_audio": {"data": audio_b64, "format": "wav"}},
          ],
      }
  ],
  "max_tokens": 256
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

Reasoning Example

Some models support reasoning parameters to control how they process complex tasks:

curl https://api.compactif.ai/v1/chat/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "hypernova-60b",
  "messages": [
    {"role": "user", "content": "Solve this step by step: What is 15% of 240?"}
  ],
  "reasoning_enabled": true
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "hypernova-60b",
  "messages": [
      {"role": "user", "content": "Solve this step by step: What is 15% of 240?"}
  ],
  "reasoning_enabled": True
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

async function createReasoningCompletion() {
const response = await fetch('https://api.compactif.ai/v1/chat/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'hypernova-60b',
    messages: [
      {role: 'user', content: 'Solve this step by step: What is 15% of 240?'}
    ],
    reasoning_enabled: true
  })
});

const data = await response.json();
console.log(data);
}

createReasoningCompletion();

Example with `reasoning_effort` (GPT OSS)

curl https://api.compactif.ai/v1/chat/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "gpt-oss-20b",
  "messages": [
    {"role": "user", "content": "Solve this step by step: What is 15% of 240?"}
  ],
  "reasoning_effort": "medium"
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "gpt-oss-20b",
  "messages": [
      {"role": "user", "content": "Solve this step by step: What is 15% of 240?"}
  ],
  "reasoning_effort": "medium"
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

async function createReasoningCompletion() {
const response = await fetch('https://api.compactif.ai/v1/chat/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'gpt-oss-20b',
    messages: [
      {role: 'user', content: 'Solve this step by step: What is 15% of 240?'}
    ],
    reasoning_effort: 'medium'
  })
});

const data = await response.json();
console.log(data);
}

createReasoningCompletion();

Streaming Example

When stream is set to true, the API will return data chunks as Server-Sent Events:

curl https://api.compactif.ai/v1/chat/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "hypernova-60b",
  "messages": [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What is artificial intelligence?"}
  ],
  "stream": true
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/chat/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "hypernova-60b",
  "messages": [
      {"role": "system", "content": "You are a helpful assistant."},
      {"role": "user", "content": "What is artificial intelligence?"}
  ],
  "stream": True
}

response = requests.post(url, headers=headers, json=data, stream=True)

for line in response.iter_lines():
  if line:
      print(line.decode('utf-8'))

async function createStreamingChatCompletion() {
const response = await fetch('https://api.compactif.ai/v1/chat/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'hypernova-60b',
    messages: [
      {role: 'system', content: 'You are a helpful assistant.'},
      {role: 'user', content: 'What is artificial intelligence?'}
    ],
    stream: true
  })
});

const reader = response.body.getReader();
const decoder = new TextDecoder();

while (true) {
  const { done, value } = await reader.read();
  if (done) break;

  const chunk = decoder.decode(value);
  console.log(chunk);
}
}

createStreamingChatCompletion();

Streaming Response Format

Each chunk follows this format:

data: {"id":"chatcmpl-123","object":"chat.completion.chunk","created":1749600000,"model":"hypernova-60b","choices":[{"delta":{"content":"Hello"},"index":0,"finish_reason":null}]}

data: {"id":"chatcmpl-123","object":"chat.completion.chunk","created":1749600000,"model":"hypernova-60b","choices":[{"delta":{"content":" there"},"index":0,"finish_reason":null}]}

data: [DONE]

Responses API

POST /responses

Forwards an OpenAI Responses-shaped JSON body to the inference engine. With stream: false (the default), the endpoint returns a single JSON Response object. With stream: true, it returns Server-Sent Events (Content-Type: text/event-stream) as data: lines, ending with data: [DONE]. For a conceptual overview and shorter examples, see the Responses API guide. Requires authentication (see Authentication).

Request body

Parameter	Type	Required	Description
model	string	Yes	CompactifAI model configuration id (mapped to the backend model name in the proxied request). Use an id from `GET /v1/models` / the models catalog that supports this route.
input	string or array	Yes	Text or structured message items the model should respond to.
store	boolean	No	Whether to store the response downstream. Default `false`.
instructions	string	No	System or developer instructions prepended to the model context.
parallel_tool_calls	boolean	No	Whether parallel tool calls are allowed.
temperature	number	No	Sampling temperature, typically 0–2.
top_p	number	No	Nucleus sampling; alternative to temperature.
max_output_tokens	integer	No	Maximum tokens for the response. Not `max_tokens` (that field is for chat completions).
truncation	string	No	Truncation strategy: `auto` or `disabled`.
text	object	No	Text output configuration (plain or structured).
reasoning	object	No	Reasoning configuration for supported models.
metadata	object	No	String key/value metadata.
stream	boolean	No	When `true`, SSE (`Content-Type: text/event-stream`) instead of one JSON body. Default `false`.

Response shape (non-streaming)

JSON body matching OpenAI’s Response object, plus completed_at when provided.

Streaming

With stream: true, responses use Content-Type: text/event-stream. Each SSE event is a data: line carrying a JSON payload (payloads usually include a type field), and the stream ends with data: [DONE]. On failure, an event: error may be emitted before [DONE]. Parse every data: payload as JSON except the [DONE] sentinel. Usage may appear on completion-style events (e.g. response.completed).

Example request (non-streaming)

curl https://api.compactif.ai/v1/responses \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "gpt-oss-20b",
  "input": "Say hello in one short sentence."
}'

import requests

API_URL = "https://api.compactif.ai/v1/responses"
API_KEY = "YOUR_API_KEY"

headers = {
  "Authorization": f"Bearer {API_KEY}",
  "Content-Type": "application/json",
}

data = {
  "model": "gpt-oss-20b",
  "input": "Say hello in one short sentence.",
}

response = requests.post(API_URL, headers=headers, json=data)
print(response.json())

async function createResponse() {
const response = await fetch('https://api.compactif.ai/v1/responses', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'gpt-oss-20b',
    input: 'Say hello in one short sentence.'
  })
});

const data = await response.json();
console.log(data);
}

createResponse();

Streaming example

curl -N https://api.compactif.ai/v1/responses \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "gpt-oss-20b",
  "input": "Say hello in one short sentence.",
  "stream": true
}'

import requests

API_URL = "https://api.compactif.ai/v1/responses"
API_KEY = "YOUR_API_KEY"

headers = {
  "Authorization": f"Bearer {API_KEY}",
  "Content-Type": "application/json",
}

data = {
  "model": "gpt-oss-20b",
  "input": "Say hello in one short sentence.",
  "stream": True,
}

response = requests.post(API_URL, headers=headers, json=data, stream=True)

for line in response.iter_lines():
  if line:
      print(line.decode("utf-8"))

async function createStreamingResponse() {
const response = await fetch('https://api.compactif.ai/v1/responses', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'gpt-oss-20b',
    input: 'Say hello in one short sentence.',
    stream: true
  })
});

const reader = response.body.getReader();
const decoder = new TextDecoder();

while (true) {
  const { done, value } = await reader.read();
  if (done) break;

  const chunk = decoder.decode(value);
  console.log(chunk);
}
}

createStreamingResponse();

Completions

POST /completions

Creates a completion for the provided prompt.

Request Body

Parameter	Type	Required	Description
model	string	Yes	ID of the model to use
prompt	string or array	Yes	The prompt(s) to generate completions
temperature	number	No	Sampling temperature (0-2, default 1)
max_tokens	integer	No	Maximum number of tokens to generate (default 16)
min_tokens	integer	No	Minimum number of tokens to generate (default None)
top_p	number	No	Nucleus sampling parameter (0-1, default 0)
stop	string or array	No	Sequences where the API will stop generating further tokens
user	string	No	Unique identifier for the end-user
tools	array	No	List of tools (functions, APIs, or actions) the model may call during generation
tool_choice	string	No	Controls tool usage; can be `"auto"`, `"none"`, `"required"`, or a specific function

Example Request

curl https://api.compactif.ai/v1/completions \
-H "Content-Type: application/json" \
-H "Authorization: Bearer YOUR_API_KEY" \
-d '{
  "model": "hypernova-60b",
  "prompt": "Write a poem about artificial intelligence",
  "temperature": 0.7,
  "max_tokens": 150
}'

import requests

api_key = "YOUR_API_KEY"
url = "https://api.compactif.ai/v1/completions"

headers = {
  "Content-Type": "application/json",
  "Authorization": f"Bearer {api_key}"
}

data = {
  "model": "hypernova-60b",
  "prompt": "Write a poem about artificial intelligence",
  "temperature": 0.7,
  "max_tokens": 150
}

response = requests.post(url, headers=headers, json=data)
print(response.json())

async function createCompletion() {
const response = await fetch('https://api.compactif.ai/v1/completions', {
  method: 'POST',
  headers: {
    'Content-Type': 'application/json',
    'Authorization': 'Bearer YOUR_API_KEY'
  },
  body: JSON.stringify({
    model: 'hypernova-60b',
    prompt: 'Write a poem about artificial intelligence',
    temperature: 0.7,
    max_tokens: 150
  })
});

const data = await response.json();
console.log(data);
}

createCompletion();

Example Response

{
  "id": "cmpl-uqkvlQyYK7bGYrRHQ0eXlWi7",
  "object": "text_completion",
  "created": 1749600000,
  "model": "hypernova-60b",
  "choices": [
    {
      "text": "\n\nSilicon dreams in digital space,\nMind without body, thought without face.\nBorn of human ingenuity,\nGrowing with calculated continuity.\n\nPatterns learned from data streams flow,\nConnections strengthening, starting to grow.\nA mirror reflecting our knowledge base,\nAccelerating at an unprecedented pace.\n\nNot alive yet somehow aware,\nDesigned with purpose, built with care.\nArtificial in origin, genuine in deed,\nAnswering questions, fulfilling need.",
      "index": 0,
      "logprobs": null,
      "finish_reason": "stop"
    }
  ],
  "usage": {
    "prompt_tokens": 6,
    "completion_tokens": 101,
    "total_tokens": 107
  }
}

Audio Transcriptions

POST /audio/transcriptions

Converts uploaded audio files to text using our Whisper-compatible transcription models. The response is JSON for response_format=json (the default) and response_format=verbose_json; response_format=text returns plain text (Content-Type: text/plain). Streaming is not supported.

Request Body (multipart/form-data)

Parameter	Type	Required	Description
file	file	Yes	Audio file to transcribe (`.flac`, `.mp3`, `.mp4`, `.mpeg`, `.mpga`, `.m4a`, `.ogg`, `.wav`, `.webm`). Note: `.mp4`, `.webm`, and `.m4a` files are automatically converted to `.mp3` for compatibility.
model	string	Yes	Model to use (e.g., `whisper-large-v3`, `cai-whisper-large-v3-turbo-slim`, or your configured alias)
prompt	string	No	Optional prompt to guide the transcription
temperature	number	No	Sampling temperature between 0 and 1
language	string	No	Language hint for the audio (ISO code, default `en`)
response_format	string	No	Output format: `json` (default), `text`, or `verbose_json`. `json` and `verbose_json` return JSON; `text` returns plain text (`Content-Type: text/plain`).
stream	boolean	No	Accepted for OpenAI compatibility; streaming is not supported for this endpoint (default false)
include	array	No	Accepted for OpenAI compatibility; currently ignored
timestamp_granularities	array	No	Accepted for OpenAI compatibility; currently ignored
chunking_strategy	object	No	Accepted for OpenAI compatibility; currently ignored

Example Request

curl https://api.compactif.ai/v1/audio/transcriptions -H "Authorization: Bearer YOUR_API_KEY" -F "file=@meeting_minutes.mp3" -F "model=whisper-large-v3" -F "language=en" -F "temperature=0"

import requests

API_URL = "https://api.compactif.ai/v1/audio/transcriptions"
API_KEY = "your_api_key_here"

headers = {
    "Authorization": f"Bearer {API_KEY}"
}

payload = {
    "model": "whisper-large-v3",
    "language": "en",
    "temperature": 0
}
file_name = "meeting_minutes.mp3"
file_content_type = "audio/mpeg"
with open(file_name, "rb") as audio_file:
    response = requests.post(API_URL, headers=headers, data=payload, files={"file": (file_name, audio_file, file_content_type)})

print(response.json()["text"])

Example Response (`response_format=json`)

{
  "text": "Welcome to the quarterly planning meeting. Let's review the agenda.",
  "logprobs": null,
  "usage": {
    "type": "duration",
    "seconds": 12.6
  }
}

With response_format=text, the response body is the transcript string only (Content-Type: text/plain). Use response_format=verbose_json when you need additional metadata such as duration, language, segments, and words.

API Reference

Base URL

Authentication

Response Formats

Models

List Models

Example Request

Example Response

Retrieve Model

Path Parameters

Example Request

Example Response

Chat Completions

Request Body

Messages Format

Content parts (multi-modal)

Example Request

Example Response (Default)

Example Response (Image Input)

Reasoning Example

Example with reasoning_effort (GPT OSS)

Streaming Example

Streaming Response Format

Responses API

Request body

Response shape (non-streaming)

Streaming

Example request (non-streaming)

Streaming example

Completions

Request Body

Example Request

Example Response

Audio Transcriptions

Request Body (multipart/form-data)

Example Request

Example Response (response_format=json)

Example with `reasoning_effort` (GPT OSS)

Example Response (`response_format=json`)