baseurl: https://ai.megallm.io/v1
| model id | input price | output price | context | max tokens |
|---|---|---|---|---|
| gpt-4o-mini | $0.15/M | $0.60/M | 128,000 tokens | 4,096 tokens |
| gpt-4 | $30.00/M | $60.00/M | 32,768 tokens | 4,096 tokens |
| openai-gpt-oss-120b | $0.15/M | $0.60/M | 128,000 tokens | 128,000 tokens |
| gpt-4o | $2.50/M | $10.00/M | 128,000 tokens | 16,384 tokens |
| gpt-5 | $1.25/M | $10.00/M | 128,000 tokens | 64,000 tokens |
| gpt-4 | $30.00/M | $60.00/M | 32,768 tokens | 4,096 tokens |
| gpt-3.5-turbo-0613 | $1.50/M | $2.00/M | 16,384 tokens | 4,096 tokens |
| gemini-2.5-pro | $1.25/M | $10.00/M | 128,000 tokens | 64,000 tokens |
| gpt-4.1-2025-04-14 | $2.00/M | $8.00/M | 128,000 tokens | 16,384 tokens |
| gpt-4.1 | $2.00/M | $8.00/M | 128,000 tokens | 16,384 tokens |
| gpt-5-mini | $0.25/M | $2.50/M | 128,000 tokens | 64,000 tokens |
| gpt-4o | $2.50/M | $10.00/M | 128,000 tokens | 16,384 tokens |
| gpt-4o-2024-08-06 | $2.50/M | $10.00/M | 128,000 tokens | 16,384 tokens |
| claude-opus-4.1-20250805 | $15.00/M | $75.00/M | 80,000 tokens | 32,000 tokens |
| claude-sonnet-4-20250614 | $3.00/M | $15.00/M | 128,000 tokens | 64,000 tokens |
| Qwen3 32B | $0.15/M | $0.60/M | 131,072 tokens | 16,384 tokens |
| gpt-4o-mini | $0.15/M | $0.60/M | 128,000 tokens | 4,096 tokens |
| gpt-4o | $5.00/M | $15.00/M | 128,000 tokens | 4,096 tokens |
| claude-sonnet-4.5-20250929 | $3.00/M | $15.00/M | 128,000 tokens | 64,000 tokens |
| llama3.3-70b-instruct | $0.12/M | $0.75/M | 131,072 tokens | 131,072 tokens |
| deepseek-r1-distill-llama-70b | $0.75/M | $0.99/M | 128,000 tokens | 128,000 tokens |
| claude-opus-4 | $15.00/M | $75.00/M | 80,000 tokens | 32,000 tokens |
| llama-3.1-8b-instruct | $0.30/M | $0.60/M | 8,192 tokens | 8,192 tokens |
| claude-haiku-4.5 | $1.00/M | $5.00/M | 128,000 tokens | 32,000 tokens |
| moonshotai/kimi-k2-instruct-0905 | $1.00/M | $1.00/M | 256,000 tokens | 56,000 tokens |
| deepseek-ai/deepseek-v3.1-terminus | $1.00/M | $1.00/M | 163,840 tokens | 56,000 tokens |
| qwen/qwen3-next-80b-a3b-instruct | $1.00/M | $1.00/M | 262,144 tokens | 16,384 tokens |
| deepseek-ai/deepseek-v3.1 | $1.00/M | $1.00/M | 128,000 tokens | 16,384 tokens |
| mistralai/mistral-nemotron | $1.00/M | $1.00/M | 128,000 tokens | 16,384 tokens |
| glm-4.6 | $1.00/M | $1.00/M | 196,000 tokens | 32,000 tokens |
| gemini-2.5-flash | $1.00/M | $1.00/M | 196,000 tokens | 32,000 tokens |
| minimaxai/minimax-m2 | $1.00/M | $1.00/M | 128,000 tokens | 32,000 tokens |
| text-embedding-3-small | $1.00/M | $1.00/M | 8,191 tokens | 1,536 tokens |
| GPT-5.1 | $1.25/M | $10.00/M | 128,000 tokens | 64,000 tokens |
Python
# Python example: send one chat-completion request through the `openai` client.
import os  # required for os.environ below; missing in the earlier version

from openai import OpenAI

# Target the https://ai.megallm.io/v1 endpoint. The API key is read from the
# MEGALLM_API_KEY environment variable (the same name the JavaScript example
# uses), so the key itself never appears in source.
client = OpenAI(
    base_url="https://ai.megallm.io/v1",
    api_key=os.environ.get("MEGALLM_API_KEY"),
)

# Single user message sent to the "gpt-5" model id.
response = client.chat.completions.create(
    model="gpt-5",
    messages=[
        {"role": "user", "content": "Hello, world!"},
    ],
)
cURL
# Chat-completion request with curl. The shell expands $MEGALLM_API_KEY, so
# export that environment variable (same name as the JavaScript example) first.
curl https://ai.megallm.io/v1/chat/completions \
  -H "Content-Type: application/json" \
  -H "Authorization: Bearer $MEGALLM_API_KEY" \
  -d '{
    "model": "gpt-5",
    "messages": [
      {"role": "user", "content": "Hello, world!"}
    ]
  }'
JavaScript
// JavaScript example: send one chat-completion request through the `openai` package.
import OpenAI from 'openai';

// Client settings: the https://ai.megallm.io/v1 endpoint, with the API key
// read from the MEGALLM_API_KEY environment variable.
const clientOptions = {
  baseURL: 'https://ai.megallm.io/v1',
  apiKey: process.env.MEGALLM_API_KEY,
};
const client = new OpenAI(clientOptions);

// Single user message sent to the 'gpt-5' model id.
const messages = [{ role: 'user', content: 'Hello, world!' }];
const response = await client.chat.completions.create({
  model: 'gpt-5',
  messages,
});