{"object":"viablelab.api_metadata","version":"2026-06-image-b64-asset-preview","base_url":"https://api.viablelab.org","agent_guide_url":"https://developers.viablelab.org/agents/viablelab-api.md","default_model":"gpt-4.1-nano","default_models_by_mode":{"chat":"gpt-4.1-nano","embedding":"nomic-embed-text-v1.5","image_generation":"flux.2-klein","audio_transcription":"whisper-large-v3","audio_speech":"gpt-4o-mini-tts"},"modes":{"chat":[{"id":"gpt-5.5","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.5 model configuration for advanced chat, reasoning, and multimodal workflows.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":5,"output_per_million":30,"cached_input_per_million":0.5,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard short-context public pricing, per 1M tokens: $5 input, $0.50 cached input, $30 output."}},{"id":"gpt-5.4-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.4 mini model configuration for balanced chat, reasoning, and multimodal workflows.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.75,"output_per_million":4.5,"cached_input_per_million":0.075,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard public pricing, per 1M tokens: $0.75 input, $0.075 cached input, $4.50 output."}},{"id":"gpt-5.4-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.4 nano model configuration for latency-sensitive chat and classification workflows.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.2,"output_per_million":1.25,"cached_input_per_million":0.02,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard public pricing, per 1M tokens: $0.20 input, $0.02 cached input, $1.25 output."}},{"id":"gpt-5","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5, the flagship model for coding, reasoning, and agentic tasks across domains.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":10,"cached_input_per_million":0.125,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 mini, a faster, more cost-efficient version of GPT-5 for well-defined tasks.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.25,"output_per_million":2,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 nano, the fastest, most cost-efficient version of GPT-5 for summarization and classification.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.05,"output_per_million":0.4,"cached_input_per_million":0.005,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-chat-latest","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 Chat, the snapshot currently used in ChatGPT.","owned_by":"openai","intelligence":"High","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":10,"cached_input_per_million":0.125,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1. Flagship OpenAI model for complex tasks. It is well suited for problem solving across domains.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2,"output_per_million":8,"cached_input_per_million":0.5,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1 mini, balancing intelligence, speed, and cost for many use cases.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.4,"output_per_million":1.6,"cached_input_per_million":0.1,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1 nano, the fastest, most cost-efficient version of GPT-4.1 for summarization and classification.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.1,"output_per_million":0.4,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4o","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4o. Fast, intelligent, flexible GPT model.","owned_by":"openai","intelligence":"High","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":128000,"max_output_tokens":16384,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2.5,"output_per_million":10,"cached_input_per_million":1.25,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4o-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4o mini.","owned_by":"openai","intelligence":"Average","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":128000,"max_output_tokens":16384,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.15,"output_per_million":0.6,"cached_input_per_million":0.075,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gemini-3.1-pro","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Gemini 3.1 Pro model configuration for advanced multimodal reasoning.","owned_by":"google","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2,"output_per_million":12,"cached_input_per_million":0.2,"image_per_unit":null,"audio_per_minute":null,"status":"short_context","note":"Gemini 3.1 Pro Preview paid-tier pricing for prompts <=200K tokens. Longer prompts are listed at $4/M input, $0.40/M cached input, and $18/M output."}},{"id":"gemini-3.5-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Gemini 3.5 Flash model configuration for fast multimodal generation.","owned_by":"google","intelligence":"High","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.5,"output_per_million":9,"cached_input_per_million":0.15,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"Gemini 3.5 Flash paid-tier pricing, per 1M tokens: $1.50 input, $0.15 cached input, $9 output."}},{"id":"gemini-2.5-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to Gemini 2.5 Flash. Optimized for speed and cost-effective multimodal generation.","owned_by":"google","intelligence":"High","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.3,"output_per_million":2.5,"cached_input_per_million":0.03,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"Gemini 2.5 Flash paid-tier text/image/video pricing, per 1M tokens: $0.30 input, $0.03 cached input, $2.50 output. Audio input is listed separately at $1/M."}},{"id":"gemini-2.0-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to Gemini 2.0 Flash. Optimized for speed and cost-effectiveness.","owned_by":"google","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.1,"output_per_million":0.4,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-oss-120b","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Open-weight 120B model for cost-efficient text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"High","speed":"Medium","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.06,"output_per_million":0.15,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-oss-20b","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Open-weight 20B model for low-cost text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"Average","speed":"Fast","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.03,"output_per_million":0.07,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"llama-3.1-8b-instruct","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Llama 3.1 8B Instruct model for lightweight text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"Average","speed":"Fast","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.22,"output_per_million":0.22,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"llama-3.1-70b-instruct","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Llama 3.1 70B Instruct model for stronger open-weight text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"High","speed":"Medium","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.4,"output_per_million":0.4,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}}],"embedding":[{"id":"nomic-embed-text-v1.5","object":"model","mode":"embedding","endpoint":"/v1/embeddings","description":"Text embedding model for semantic search, clustering, retrieval, and ranking workflows.","owned_by":"viable-lab","intelligence":"Embedding","speed":"Fast","input_modalities":["text"],"output_modalities":["embedding"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":false,"embeddings":true,"image_generation":false},"pricing":{"input_per_million":0.005,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"docs_inferred","note":"Derived from provider docs: 250,000 pages per dollar at approximately 800 tokens per page."}}],"image_generation":[{"id":"flux.2-klein","object":"model","mode":"image_generation","endpoint":"/v1/images/generations","description":"Image generation model for prompt-to-image workflows.","owned_by":"viable-lab","intelligence":"Image","speed":"Medium","input_modalities":["text"],"output_modalities":["image"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":false,"embeddings":false,"image_generation":true},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":0.014,"audio_per_minute":null,"status":"starts_at","note":"Provider docs list pricing from $0.014 per image; final cost varies by resolution/model variant."}}],"audio_transcription":[{"id":"whisper-large-v3","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"Speech-to-text model for audio transcription.","owned_by":"viable-lab","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"Provider docs list $0.006 per minute of input audio."}},{"id":"gpt-4o-transcribe","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI speech-to-text model exposed through the VIABLE Lab API.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2.5,"output_per_million":10,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"OpenAI transcription pricing: $2.50/M input tokens, $10/M output tokens, estimated $0.006/minute."}},{"id":"gpt-4o-mini-transcribe","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI speech-to-text model optimized for transcription workflows.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":5,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.003,"status":"documented","note":"OpenAI transcription pricing: $1.25/M input tokens, $5/M output tokens, estimated $0.003/minute."}},{"id":"whisper-1","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI Whisper transcription model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"OpenAI Whisper transcription pricing is listed as $0.006 per minute."}}],"audio_speech":[{"id":"kokoro","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"Text-to-speech model for generated speech audio.","owned_by":"viable-lab","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"default_voice":"af_heart","pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"Provider docs list $0.006 per minute of generated audio."}},{"id":"gpt-4o-mini-tts","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI text-to-speech model exposed through the VIABLE Lab API.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}},{"id":"tts-1","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI text-to-speech model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}},{"id":"tts-1-hd","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI high-definition text-to-speech model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}}]},"models":[{"id":"viable-1","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Recommended for complex evaluation and sophisticated text generation. Operates at a higher cost tier; mindful token usage is advised for long contexts.","owned_by":"viable-lab","intelligence":"High","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.4,"output_per_million":1.6,"cached_input_per_million":0.1,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"viable-2","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Optimized for efficiency in common tasks like classification, summarization, and standard text completion.","owned_by":"viable-lab","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.1,"output_per_million":0.4,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"viable-3","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"A balanced model for performance and cost, offering stable results. Recommended when specific output formatting is crucial.","owned_by":"viable-lab","intelligence":"Average","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":128000,"max_output_tokens":16384,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.15,"output_per_million":0.6,"cached_input_per_million":0.075,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"viable-4","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"High-performance viable access point for well-defined tasks with fast responses and strong reasoning on structured prompts.","owned_by":"viable-lab","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.25,"output_per_million":2,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"viable-5","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Cost-optimized viable access point tuned for fastest responses and high-throughput use cases like summarization and classification.","owned_by":"viable-lab","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.05,"output_per_million":0.4,"cached_input_per_million":0.005,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5.5","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.5 model configuration for advanced chat, reasoning, and multimodal workflows.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":5,"output_per_million":30,"cached_input_per_million":0.5,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard short-context public pricing, per 1M tokens: $5 input, $0.50 cached input, $30 output."}},{"id":"gpt-5.4-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.4 mini model configuration for balanced chat, reasoning, and multimodal workflows.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.75,"output_per_million":4.5,"cached_input_per_million":0.075,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard public pricing, per 1M tokens: $0.75 input, $0.075 cached input, $4.50 output."}},{"id":"gpt-5.4-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"GPT-5.4 nano model configuration for latency-sensitive chat and classification workflows.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.2,"output_per_million":1.25,"cached_input_per_million":0.02,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"OpenAI standard public pricing, per 1M tokens: $0.20 input, $0.02 cached input, $1.25 output."}},{"id":"gpt-5","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5, the flagship model for coding, reasoning, and agentic tasks across domains.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":10,"cached_input_per_million":0.125,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 mini, a faster, more cost-efficient version of GPT-5 for well-defined tasks.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.25,"output_per_million":2,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 nano, the fastest, most cost-efficient version of GPT-5 for summarization and classification.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.05,"output_per_million":0.4,"cached_input_per_million":0.005,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-5-chat-latest","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-5 Chat, the snapshot currently used in ChatGPT.","owned_by":"openai","intelligence":"High","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":400000,"max_output_tokens":128000,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":10,"cached_input_per_million":0.125,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1. Flagship OpenAI model for complex tasks. It is well suited for problem solving across domains.","owned_by":"openai","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2,"output_per_million":8,"cached_input_per_million":0.5,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1 mini, balancing intelligence, speed, and cost for many use cases.","owned_by":"openai","intelligence":"High","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.4,"output_per_million":1.6,"cached_input_per_million":0.1,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4.1-nano","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4.1 nano, the fastest, most cost-efficient version of GPT-4.1 for summarization and classification.","owned_by":"openai","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1047576,"max_output_tokens":32768,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.1,"output_per_million":0.4,"cached_input_per_million":0.025,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4o","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4o. Fast, intelligent, flexible GPT model.","owned_by":"openai","intelligence":"High","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":128000,"max_output_tokens":16384,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2.5,"output_per_million":10,"cached_input_per_million":1.25,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-4o-mini","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to GPT-4o mini.","owned_by":"openai","intelligence":"Average","speed":"Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":128000,"max_output_tokens":16384,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.15,"output_per_million":0.6,"cached_input_per_million":0.075,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gemini-3.1-pro","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Gemini 3.1 Pro model configuration for advanced multimodal reasoning.","owned_by":"google","intelligence":"Higher","speed":"Medium","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2,"output_per_million":12,"cached_input_per_million":0.2,"image_per_unit":null,"audio_per_minute":null,"status":"short_context","note":"Gemini 3.1 Pro Preview paid-tier pricing for prompts <=200K tokens. Longer prompts are listed at $4/M input, $0.40/M cached input, and $18/M output."}},{"id":"gemini-3.5-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Gemini 3.5 Flash model configuration for fast multimodal generation.","owned_by":"google","intelligence":"High","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.5,"output_per_million":9,"cached_input_per_million":0.15,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"Gemini 3.5 Flash paid-tier pricing, per 1M tokens: $1.50 input, $0.15 cached input, $9 output."}},{"id":"gemini-2.5-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to Gemini 2.5 Flash. Optimized for speed and cost-effective multimodal generation.","owned_by":"google","intelligence":"High","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.3,"output_per_million":2.5,"cached_input_per_million":0.03,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":"Gemini 2.5 Flash paid-tier text/image/video pricing, per 1M tokens: $0.30 input, $0.03 cached input, $2.50 output. Audio input is listed separately at $1/M."}},{"id":"gemini-2.0-flash","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Direct access to Gemini 2.0 Flash. Optimized for speed and cost-effectiveness.","owned_by":"google","intelligence":"Average","speed":"Very Fast","input_modalities":["text","image","file","pdf"],"output_modalities":["text"],"context_window":1048576,"max_output_tokens":8192,"supports_streaming":true,"capabilities":{"text":true,"images":true,"files":true,"pdf":true,"audio":false,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.1,"output_per_million":0.4,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"nomic-embed-text-v1.5","object":"model","mode":"embedding","endpoint":"/v1/embeddings","description":"Text embedding model for semantic search, clustering, retrieval, and ranking workflows.","owned_by":"viable-lab","intelligence":"Embedding","speed":"Fast","input_modalities":["text"],"output_modalities":["embedding"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":false,"embeddings":true,"image_generation":false},"pricing":{"input_per_million":0.005,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"docs_inferred","note":"Derived from provider docs: 250,000 pages per dollar at approximately 800 tokens per page."}},{"id":"flux.2-klein","object":"model","mode":"image_generation","endpoint":"/v1/images/generations","description":"Image generation model for prompt-to-image workflows.","owned_by":"viable-lab","intelligence":"Image","speed":"Medium","input_modalities":["text"],"output_modalities":["image"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":false,"embeddings":false,"image_generation":true},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":0.014,"audio_per_minute":null,"status":"starts_at","note":"Provider docs list pricing from $0.014 per image; final cost varies by resolution/model variant."}},{"id":"whisper-large-v3","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"Speech-to-text model for audio transcription.","owned_by":"viable-lab","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"Provider docs list $0.006 per minute of input audio."}},{"id":"gpt-4o-transcribe","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI speech-to-text model exposed through the VIABLE Lab API.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":2.5,"output_per_million":10,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"OpenAI transcription pricing: $2.50/M input tokens, $10/M output tokens, estimated $0.006/minute."}},{"id":"gpt-4o-mini-transcribe","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI speech-to-text model optimized for transcription workflows.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":1.25,"output_per_million":5,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.003,"status":"documented","note":"OpenAI transcription pricing: $1.25/M input tokens, $5/M output tokens, estimated $0.003/minute."}},{"id":"whisper-1","object":"model","mode":"audio_transcription","endpoint":"/v1/audio/transcriptions","description":"OpenAI Whisper transcription model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["audio","file"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":false,"images":false,"files":true,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"OpenAI Whisper transcription pricing is listed as $0.006 per minute."}},{"id":"kokoro","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"Text-to-speech model for generated speech audio.","owned_by":"viable-lab","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"default_voice":"af_heart","pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":0.006,"status":"documented","note":"Provider docs list $0.006 per minute of generated audio."}},{"id":"gpt-4o-mini-tts","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI text-to-speech model exposed through the VIABLE Lab API.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}},{"id":"tts-1","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI text-to-speech model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Fast","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}},{"id":"tts-1-hd","object":"model","mode":"audio_speech","endpoint":"/v1/audio/speech","description":"OpenAI high-definition text-to-speech model preserved for compatibility.","owned_by":"openai","intelligence":"Audio","speed":"Medium","input_modalities":["text"],"output_modalities":["audio"],"context_window":null,"max_output_tokens":null,"supports_streaming":false,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":true,"tools":false,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":null,"output_per_million":null,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"not_listed","note":null}},{"id":"gpt-oss-120b","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Open-weight 120B model for cost-efficient text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"High","speed":"Medium","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.06,"output_per_million":0.15,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"gpt-oss-20b","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Open-weight 20B model for low-cost text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"Average","speed":"Fast","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.03,"output_per_million":0.07,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"llama-3.1-8b-instruct","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Llama 3.1 8B Instruct model for lightweight text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"Average","speed":"Fast","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.22,"output_per_million":0.22,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}},{"id":"llama-3.1-70b-instruct","object":"model","mode":"chat","endpoint":"/v1/chat/completions","description":"Llama 3.1 70B Instruct model for stronger open-weight text generation through the VIABLE Lab API.","owned_by":"viable-lab","intelligence":"High","speed":"Medium","input_modalities":["text"],"output_modalities":["text"],"context_window":null,"max_output_tokens":null,"supports_streaming":true,"capabilities":{"text":true,"images":false,"files":false,"pdf":false,"audio":false,"tools":true,"embeddings":false,"image_generation":false},"pricing":{"input_per_million":0.4,"output_per_million":0.4,"cached_input_per_million":null,"image_per_unit":null,"audio_per_minute":null,"status":"documented","note":null}}],"endpoints":[{"method":"POST","path":"/v1/chat/completions","mode":"chat","request_format":"OpenAI Chat Completions JSON","streaming":true,"notes":["Send model plus messages. The API accepts supported aliases and model IDs while keeping routing details internal.","Text, image data URLs, files, and PDFs are accepted by compatible models."]},{"method":"POST","path":"/v1/chat/vetting","mode":"chat","request_format":"OpenAI Chat Completions JSON with vetting metadata","streaming":false,"notes":["Use the chat request shape when you want a vetted educational response.","The response preserves chat completion choices and adds vetting_info.","Uses the same chat model registry as /v1/chat/completions; non-chat models are rejected."]},{"method":"POST","path":"/v1/vetting/full","mode":"chat","request_format":"Full VETTING workflow JSON","streaming":false,"notes":["Use for structured educational verification against questions and answer keys.","chatModel and verificationModel can use different chat-capable providers.","This endpoint is intentionally non-streaming."]},{"method":"POST","path":"/v1/embeddings","mode":"embedding","request_format":"OpenAI Embeddings JSON","streaming":false,"notes":["Send input text or an array of strings. Default model is nomic-embed-text-v1.5."]},{"method":"POST","path":"/v1/images/generations","mode":"image_generation","request_format":"OpenAI Images JSON","streaming":false,"notes":["Send prompt, optional size/n/response_format. Default model is flux.2-klein.","response_format=url returns a public https://api.viablelab.org/v1/assets/... URL when the provider returns inline image data.","response_format=b64_json returns inline base64 to the caller; logs redact base64 and include an asset URL preview when asset storage is available."]},{"method":"GET","path":"/v1/assets/{key}","mode":"asset","request_format":"Generated asset URL","streaming":true,"notes":["Serves API-generated assets such as image outputs stored in private R2.","Only unguessable API-generated asset keys are accepted; upload and delete operations are not exposed."]},{"method":"POST","path":"/v1/audio/speech","mode":"audio_speech","request_format":"OpenAI Audio Speech JSON","streaming":false,"notes":["Send input, model, voice, and response_format. Binary audio is returned. OpenAI speech models and registered VIABLE Lab speech models are supported."]},{"method":"POST","path":"/v1/audio/transcriptions","mode":"audio_transcription","request_format":"multipart/form-data","streaming":false,"notes":["Send file and model. OpenAI transcription models and registered VIABLE Lab transcription models are supported. Optional duration_seconds/duration_minutes improves cost logging."]},{"method":"GET","path":"/v1/developer/me","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Returns the signed-in developer profile after Google Firebase sign-in."]},{"method":"GET/POST/PATCH/DELETE","path":"/v1/developer/api-keys","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Create, list, reveal, pause, resume, update, and revoke encrypted-at-rest VIABLE Lab API keys.","Optional allowedModels, request rate, daily token, and monthly cost limits are enforced for protected API calls when set."]},{"method":"GET","path":"/v1/developer/usage","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Returns daily request, token, error, and cost rollups for the signed-in developer."]},{"method":"GET","path":"/v1/developer/logs","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Returns paginated request log rows for the signed-in developer, filterable by API key, endpoint, platform, model, provider, status, operation, and date range."]},{"method":"GET","path":"/v1/developer/logs/export","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Exports the signed-in developer request logs as CSV by default or JSONL with format=jsonl. Payloads are omitted by default."]},{"method":"GET","path":"/v1/developer/logs/{request_id}","mode":"developer","request_format":"Firebase Bearer token","streaming":false,"notes":["Returns one developer-owned request log row by request_id with optional sanitized request/response payloads when include_payload=true. Legacy numeric log IDs remain accepted for existing links."]}],"quickstarts":{"chat":{"curl":"curl https://api.viablelab.org/v1/chat/completions -H \"Content-Type: application/json\" -d '{\"model\":\"viable-2\",\"messages\":[{\"role\":\"user\",\"content\":\"Write one sentence.\"}]}'"},"streaming_chat":{"curl":"curl -N https://api.viablelab.org/v1/chat/completions -H \"Content-Type: application/json\" -d '{\"model\":\"gpt-oss-120b\",\"stream\":true,\"messages\":[{\"role\":\"user\",\"content\":\"Stream one sentence.\"}]}'"},"embedding":{"curl":"curl https://api.viablelab.org/v1/embeddings -H \"Content-Type: application/json\" -d '{\"model\":\"nomic-embed-text-v1.5\",\"input\":\"Searchable text\"}'"},"image_generation":{"curl":"curl https://api.viablelab.org/v1/images/generations -H \"Content-Type: application/json\" -d '{\"model\":\"flux.2-klein\",\"prompt\":\"A clean classroom whiteboard UI mockup\",\"size\":\"1024x1024\",\"n\":1,\"response_format\":\"url\"}'"},"image_generation_b64":{"curl":"curl https://api.viablelab.org/v1/images/generations -H \"Content-Type: application/json\" -d '{\"model\":\"flux.2-klein\",\"prompt\":\"A clean classroom whiteboard UI mockup\",\"size\":\"1024x1024\",\"n\":1,\"response_format\":\"b64_json\"}'"},"speech":{"curl":"curl https://api.viablelab.org/v1/audio/speech -H \"Content-Type: application/json\" -d '{\"model\":\"gpt-4o-mini-tts\",\"input\":\"Hello from VIABLE Lab.\",\"voice\":\"alloy\",\"response_format\":\"mp3\"}' --output speech.mp3"},"transcription":{"curl":"curl https://api.viablelab.org/v1/audio/transcriptions -F model=whisper-large-v3 -F file=@sample.mp3"},"openai_transcription":{"curl":"curl https://api.viablelab.org/v1/audio/transcriptions -F model=gpt-4o-transcribe -F file=@sample.mp3"},"vetted_chat":{"curl":"curl https://api.viablelab.org/v1/chat/vetting -H \"Content-Type: application/json\" -d '{\"model\":\"gemini-2.5-flash\",\"messages\":[{\"role\":\"user\",\"content\":\"Explain photosynthesis without giving away a homework answer.\"}],\"vettingConfig\":{\"maxAttempts\":1}}'"},"full_vetting":{"curl":"curl https://api.viablelab.org/v1/vetting/full -H \"Content-Type: application/json\" -d '{\"mode\":\"vetting\",\"config\":{\"chatModel\":{\"modelId\":\"viable-2\"},\"verificationModel\":{\"modelId\":\"gemini-2.5-flash\"},\"maxVerificationAttempts\":1},\"prompts\":{\"chatSystemPrompt\":\"Guide the student without giving away the answer.\"},\"context\":{\"items\":[{\"question\":{\"text\":\"What is photosynthesis?\"},\"answerKey\":{\"correctAnswer\":\"Plants convert light, water, and carbon dioxide into glucose and oxygen.\"}}]},\"messages\":[{\"role\":\"user\",\"content\":\"What is photosynthesis?\"}]}'"}},"pricing_notes":["Token prices are registry-backed and logged when providers return token usage.","Image usage can have zero tokens and non-zero cost because it is priced per generated image rather than per token.","Image model pricing is currently documented as a starting price and may vary by resolution.","Audio pricing is per minute; cost is null unless duration is provided or returned by a provider.","Models without listed pricing are logged with null cost until pricing is added to the registry."],"cache":{"status":"hit","ttlSeconds":3600}}