{"openapi":"3.1.0","info":{"title":"FastAPI","version":"0.1.0"},"servers":[{"url":"/prod"}],"paths":{"/v1/tcp_warming":{"get":{"summary":"Tcp Warming","operationId":"tcp_warming_v1_tcp_warming_get","responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{}}}}}}},"/v1/chat/completions":{"post":{"summary":"Chat","operationId":"chat_v1_chat_completions_post","security":[{"HTTPBearer":[]}],"parameters":[{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}},{"name":"X-delay-time","in":"header","required":false,"schema":{"anyOf":[{"type":"number"},{"type":"null"}],"title":"X-Delay-Time"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/CreateChatCompletionResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}},"requestBody":{"required":true,"content":{"application/json":{"schema":{"$ref":"#/components/schemas/ChatCompletionRequest"}},"application/vnd.msgpack":{"schema":{"$ref":"#/components/schemas/ChatCompletionRequest"}},"application/x-msgpack":{"schema":{"$ref":"#/components/schemas/ChatCompletionRequest"}},"application/msgpack":{"schema":{"$ref":"#/components/schemas/ChatCompletionRequest"}}}}}},"/v1/completions":{"post":{"summary":"Completions","operationId":"completions_v1_completions_post","security":[{"HTTPBearer":[]}],"parameters":[{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}},{"name":"X-delay-time","in":"header","required":false,"schema":{"anyOf":[{"type":"number"},{"type":"null"}],"title":"X-Delay-Time"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/CreateCompletionResponse"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}},"requestBody":{"required":true,"content":{"application/json":{"schema":{"$ref":"#/components/schemas/CompletionRequest"}},"application/vnd.msgpack":{"schema":{"$ref":"#/components/schemas/CompletionRequest"}},"application/x-msgpack":{"schema":{"$ref":"#/components/schemas/CompletionRequest"}},"application/msgpack":{"schema":{"$ref":"#/components/schemas/CompletionRequest"}}}}}},"/v1/models":{"get":{"summary":"List Models","operationId":"list_models_v1_models_get","security":[{"HTTPBearer":[]}],"parameters":[{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/ModelMetadataList"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/v1/models/{model_id}":{"get":{"summary":"Get Model","operationId":"get_model_v1_models__model_id__get","security":[{"HTTPBearer":[]}],"parameters":[{"name":"model_id","in":"path","required":true,"schema":{"type":"string","title":"Model Id"}},{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"$ref":"#/components/schemas/ModelMetadata"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/public/v1/models":{"get":{"tags":["Public Models"],"summary":"List all available models","description":"List all publicly available models (modelVisibility='PUBLIC' only). Use the `format` parameter to get responses compatible with OpenRouter or HuggingFace APIs.","operationId":"list_public_models_endpoint_public_v1_models_get","parameters":[{"name":"format","in":"query","required":false,"schema":{"$ref":"#/components/schemas/ModelFormat","description":"Output format: 'default' (Cerebras schema), 'openrouter', or 'huggingface'","default":"default"},"description":"Output format: 'default' (Cerebras schema), 'openrouter', or 'huggingface'"},{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"anyOf":[{"$ref":"#/components/schemas/PublicModelsListResponse"},{"$ref":"#/components/schemas/OpenRouterModelsResponse"},{"$ref":"#/components/schemas/HuggingFaceModelsResponse"}],"title":"Response List Public Models Endpoint Public V1 Models Get"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}},"/public/v1/models/{model_id}":{"get":{"tags":["Public Models"],"summary":"Retrieve a specific model","description":"Retrieve a specific publicly available model by ID (modelVisibility='PUBLIC' only). Use the `format` parameter to get responses compatible with OpenRouter or HuggingFace APIs.","operationId":"get_public_model_public_v1_models__model_id__get","parameters":[{"name":"model_id","in":"path","required":true,"schema":{"type":"string","title":"Model Id"}},{"name":"format","in":"query","required":false,"schema":{"$ref":"#/components/schemas/ModelFormat","description":"Output format: 'default' (Cerebras schema), 'openrouter', or 'huggingface'","default":"default"},"description":"Output format: 'default' (Cerebras schema), 'openrouter', or 'huggingface'"},{"name":"X-Amz-Cf-Id","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"X-Amz-Cf-Id"}},{"name":"CF-RAY","in":"header","required":false,"schema":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Cf-Ray"}}],"responses":{"200":{"description":"Successful Response","content":{"application/json":{"schema":{"anyOf":[{"$ref":"#/components/schemas/PublicModel"},{"$ref":"#/components/schemas/OpenRouterModel"},{"$ref":"#/components/schemas/HuggingFaceModel"}],"title":"Response Get Public Model Public V1 Models  Model Id  Get"}}}},"422":{"description":"Validation Error","content":{"application/json":{"schema":{"$ref":"#/components/schemas/HTTPValidationError"}}}}}}}},"components":{"schemas":{"AssistantToolCall":{"properties":{"id":{"type":"string","title":"Id"},"type":{"type":"string","const":"function","title":"Type"},"function":{"$ref":"#/components/schemas/AssistantToolCallFunction"}},"additionalProperties":true,"type":"object","required":["id","type","function"],"title":"AssistantToolCall","description":"A tool call for an assistant."},"AssistantToolCallFunction":{"properties":{"name":{"type":"string","title":"Name"},"arguments":{"type":"string","title":"Arguments"}},"additionalProperties":true,"type":"object","required":["name","arguments"],"title":"AssistantToolCallFunction","description":"A function call for an assistant tool."},"ChatChunkChoice":{"properties":{"delta":{"anyOf":[{"$ref":"#/components/schemas/ChunkResponseMessage"},{"type":"null"}]},"finish_reason":{"anyOf":[{"type":"string","enum":["stop","length","content_filter","tool_calls"]},{"type":"null"}],"title":"Finish Reason"},"index":{"type":"integer","title":"Index"},"logprobs":{"anyOf":[{"$ref":"#/components/schemas/ChatCompletionLogProbs"},{"type":"null"}]},"reasoning_logprobs":{"anyOf":[{"$ref":"#/components/schemas/ChatCompletionLogProbs"},{"type":"null"}]},"tokens":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Tokens"},"text":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Text"}},"additionalProperties":true,"type":"object","required":["index"],"title":"ChatChunkChoice"},"ChatChunkResponse":{"properties":{"id":{"type":"string","title":"Id"},"choices":{"anyOf":[{"items":{"$ref":"#/components/schemas/ChatChunkChoice"},"type":"array"},{"type":"null"}],"title":"Choices"},"created":{"type":"integer","title":"Created"},"model":{"type":"string","title":"Model"},"service_tier":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Service Tier"},"system_fingerprint":{"type":"string","title":"System Fingerprint"},"object":{"type":"string","enum":["chat.completion.chunk","text_completion"],"title":"Object"},"usage":{"anyOf":[{"$ref":"#/components/schemas/Usage"},{"type":"null"}]},"time_info":{"anyOf":[{"$ref":"#/components/schemas/TimeInfo"},{"type":"null"}]}},"additionalProperties":true,"type":"object","required":["id","created","model","system_fingerprint","object"],"title":"ChatChunkResponse","examples":[{"choices":[{"delta":{"role":"assistant"},"index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719"},{"choices":[{"delta":{"content":"Generative "},"index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719"},{"choices":[{"delta":{},"finish_reason":"stop","index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719","time_info":{"completion_time":0.44,"prompt_time":0.02,"queue_time":0.0,"total_time":0.46},"usage":{"completion_tokens":1020,"prompt_tokens":40,"prompt_tokens_details":{"cached_tokens":1020},"total_tokens":1060}}]},"ChatCompletionChoice":{"properties":{"finish_reason":{"type":"string","enum":["stop","length","content_filter","tool_calls"],"title":"Finish Reason"},"index":{"type":"integer","title":"Index"},"message":{"$ref":"#/components/schemas/ChatCompletionResponseMessage"},"logprobs":{"anyOf":[{"$ref":"#/components/schemas/ChatCompletionLogProbs"},{"type":"null"}]},"reasoning_logprobs":{"anyOf":[{"$ref":"#/components/schemas/ChatCompletionLogProbs"},{"type":"null"}]}},"additionalProperties":true,"type":"object","required":["finish_reason","index","message"],"title":"ChatCompletionChoice"},"ChatCompletionLogProbs":{"properties":{"content":{"anyOf":[{"items":{"$ref":"#/components/schemas/LogProbsContent"},"type":"array"},{"type":"null"}],"title":"Content"},"refusal":{"anyOf":[{"items":{"$ref":"#/components/schemas/LogProbsContent"},"type":"array"},{"type":"null"}],"title":"Refusal"}},"additionalProperties":true,"type":"object","title":"ChatCompletionLogProbs"},"ChatCompletionResponse":{"properties":{"id":{"type":"string","title":"Id"},"choices":{"items":{"$ref":"#/components/schemas/ChatCompletionChoice"},"type":"array","minItems":1,"title":"Choices"},"created":{"type":"integer","title":"Created"},"model":{"type":"string","title":"Model"},"service_tier":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Service Tier"},"system_fingerprint":{"type":"string","title":"System Fingerprint"},"object":{"type":"string","const":"chat.completion","title":"Object"},"usage":{"$ref":"#/components/schemas/Usage"},"time_info":{"$ref":"#/components/schemas/TimeInfo"}},"additionalProperties":true,"type":"object","required":["id","choices","created","model","system_fingerprint","object","usage","time_info"],"title":"ChatCompletionResponse","examples":[{"choices":[{"finish_reason":"stop","index":0,"message":{"content":"Generative AI is a subfield of artificial intelligence that focuses on generating new, original content, such as images, music, text, or videos. These models are trained on large datasets and learn to recognize patterns, relationships, and structures within the data, allowing them to generate new content that is similar in style, tone, or characteristics to the training data. \n \n Generative AI models can be categorized into two main types: Generative Adversarial Networks (GANs) and Variational Autoencoders (VAEs). GANs consist of two neural networks: a generator and a discriminator. The generator creates new content, while the discriminator evaluates the generated content and tells the generator whether it's realistic or not. VAEs are neural networks that learn to compress and reconstruct data. \n \n Generative AI has numerous applications across various industries, including art and design, content generation, data augmentation, and recommendation systems. Some examples of Generative AI in action include Deep Dream Generator, Amper Music, and DALL-E. \n \n In summary, Generative AI is a powerful technology that enables the creation of new, original content using machine learning models. It has the potential to revolutionize various industries and create new opportunities for artists, designers, and content creators.","role":"assistant"}}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion","system_fingerprint":"88719","time_info":{"completion_time":0.44,"prompt_time":0.02,"queue_time":0.0,"total_time":0.46},"usage":{"completion_tokens":1020,"prompt_tokens":40,"prompt_tokens_details":{"cached_tokens":1020},"total_tokens":1060}}]},"ChatCompletionResponseMessage":{"properties":{"content":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Content"},"reasoning":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Reasoning"},"tool_calls":{"anyOf":[{"items":{"$ref":"#/components/schemas/AssistantToolCall"},"type":"array"},{"type":"null"}],"title":"Tool Calls"},"role":{"type":"string","enum":["assistant","user","system","tool"],"title":"Role"}},"additionalProperties":true,"type":"object","required":["role"],"title":"ChatCompletionResponseMessage"},"ChunkAssistantToolCall":{"properties":{"function":{"$ref":"#/components/schemas/ChunkAssistantToolCallFunction"},"type":{"type":"string","const":"function","title":"Type"},"id":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Id"},"index":{"anyOf":[{"type":"integer"},{"type":"null"}],"title":"Index"}},"additionalProperties":true,"type":"object","required":["function","type"],"title":"ChunkAssistantToolCall","description":"Streaming only. Represents a function call in an assistant tool call."},"ChunkAssistantToolCallFunction":{"properties":{"name":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Name"},"arguments":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Arguments"}},"additionalProperties":true,"type":"object","title":"ChunkAssistantToolCallFunction","description":"Streaming only. Represents a function in an assistant tool call."},"ChunkResponseMessage":{"properties":{"content":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Content"},"reasoning":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Reasoning"},"tool_calls":{"anyOf":[{"items":{"$ref":"#/components/schemas/ChunkAssistantToolCall"},"type":"array"},{"type":"null"}],"title":"Tool Calls"},"role":{"anyOf":[{"type":"string","enum":["assistant","user","system","tool"]},{"type":"null"}],"title":"Role"},"tokens":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Tokens"}},"additionalProperties":true,"type":"object","title":"ChunkResponseMessage"},"CompletionChoice":{"properties":{"finish_reason":{"anyOf":[{"type":"string","enum":["stop","length","content_filter"]},{"type":"null"}],"title":"Finish Reason"},"index":{"type":"integer","title":"Index"},"text":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Text"},"tokens":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Tokens"},"logprobs":{"anyOf":[{"$ref":"#/components/schemas/CompletionLogProbs"},{"type":"null"}]}},"additionalProperties":true,"type":"object","required":["index"],"title":"CompletionChoice"},"CompletionChunkChoice":{"properties":{"delta":{"anyOf":[{"$ref":"#/components/schemas/ChunkResponseMessage"},{"type":"null"}]},"finish_reason":{"anyOf":[{"type":"string","enum":["stop","length","content_filter","tool_calls"]},{"type":"null"}],"title":"Finish Reason"},"index":{"type":"integer","title":"Index"},"logprobs":{"anyOf":[{"$ref":"#/components/schemas/CompletionLogProbs"},{"type":"null"}]},"tokens":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Tokens"},"text":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Text"}},"additionalProperties":true,"type":"object","required":["index"],"title":"CompletionChunkChoice"},"CompletionChunkResponse":{"properties":{"id":{"type":"string","title":"Id"},"choices":{"anyOf":[{"items":{"$ref":"#/components/schemas/CompletionChunkChoice"},"type":"array"},{"type":"null"}],"title":"Choices"},"created":{"type":"integer","title":"Created"},"model":{"type":"string","title":"Model"},"service_tier":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Service Tier"},"system_fingerprint":{"type":"string","title":"System Fingerprint"},"object":{"type":"string","enum":["chat.completion.chunk","text_completion"],"title":"Object"},"usage":{"anyOf":[{"$ref":"#/components/schemas/Usage"},{"type":"null"}]},"time_info":{"anyOf":[{"$ref":"#/components/schemas/TimeInfo"},{"type":"null"}]}},"additionalProperties":true,"type":"object","required":["id","created","model","system_fingerprint","object"],"title":"CompletionChunkResponse","examples":[{"choices":[{"delta":{"role":"assistant"},"index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719"},{"choices":[{"delta":{"content":"Generative "},"index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719"},{"choices":[{"delta":{},"finish_reason":"stop","index":0}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"chat.completion.chunk","system_fingerprint":"88719","time_info":{"completion_time":0.44,"prompt_time":0.02,"queue_time":0.0,"total_time":0.46},"usage":{"completion_tokens":1020,"prompt_tokens":40,"prompt_tokens_details":{"cached_tokens":1020},"total_tokens":1060}}]},"CompletionLogProbs":{"properties":{"text_offset":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Text Offset"},"token_logprobs":{"anyOf":[{"items":{"type":"number"},"type":"array"},{"type":"null"}],"title":"Token Logprobs"},"tokens":{"anyOf":[{"items":{"type":"string"},"type":"array"},{"type":"null"}],"title":"Tokens"},"top_logprobs":{"anyOf":[{"items":{"additionalProperties":{"type":"number"},"type":"object"},"type":"array"},{"type":"null"}],"title":"Top Logprobs"}},"additionalProperties":true,"type":"object","title":"CompletionLogProbs"},"CompletionResponse":{"properties":{"id":{"type":"string","title":"Id"},"choices":{"items":{"$ref":"#/components/schemas/CompletionChoice"},"type":"array","minItems":1,"title":"Choices"},"created":{"type":"integer","title":"Created"},"model":{"type":"string","title":"Model"},"system_fingerprint":{"type":"string","title":"System Fingerprint"},"usage":{"anyOf":[{"$ref":"#/components/schemas/Usage"},{"type":"null"}]},"time_info":{"anyOf":[{"$ref":"#/components/schemas/TimeInfo"},{"type":"null"}]},"object":{"type":"string","const":"text_completion","title":"Object"}},"additionalProperties":true,"type":"object","required":["id","choices","created","model","system_fingerprint","object"],"title":"CompletionResponse","examples":[{"choices":[{"finish_reason":"stop","index":0,"text":"Generative AI is a subfield of artificial intelligence that focuses on generating new, original content, such as images, music, text, or videos. These models are trained on large datasets and learn to recognize patterns, relationships, and structures within the data, allowing them to generate new content that is similar in style, tone, or characteristics to the training data. \n \n Generative AI models can be categorized into two main types: Generative Adversarial Networks (GANs) and Variational Autoencoders (VAEs). GANs consist of two neural networks: a generator and a discriminator. The generator creates new content, while the discriminator evaluates the generated content and tells the generator whether it's realistic or not. VAEs are neural networks that learn to compress and reconstruct data. \n \n Generative AI has numerous applications across various industries, including art and design, content generation, data augmentation, and recommendation systems. Some examples of Generative AI in action include Deep Dream Generator, Amper Music, and DALL-E. \n \n In summary, Generative AI is a powerful technology that enables the creation of new, original content using machine learning models. It has the potential to revolutionize various industries and create new opportunities for artists, designers, and content creators."}],"created":1721088719,"id":"response_1721","model":"llama3.1-8b","object":"text_completion","system_fingerprint":"88719","time_info":{"completion_time":0.44,"prompt_time":0.02,"queue_time":0.0,"total_time":0.46},"usage":{"completion_tokens":1020,"prompt_tokens":40,"total_tokens":1060}}]},"CreateChatCompletionResponse":{"anyOf":[{"$ref":"#/components/schemas/ChatCompletionResponse"},{"$ref":"#/components/schemas/ChatChunkResponse"},{"$ref":"#/components/schemas/ErrorChunkResponse"}],"title":"CreateChatCompletionResponse"},"CreateCompletionResponse":{"anyOf":[{"$ref":"#/components/schemas/CompletionResponse"},{"$ref":"#/components/schemas/CompletionChunkResponse"},{"$ref":"#/components/schemas/ErrorChunkResponse"}],"title":"CreateCompletionResponse"},"DatacenterLocation":{"properties":{"country_code":{"type":"string","title":"Country Code","description":"ISO 3166 Alpha-2 country code"}},"type":"object","required":["country_code"],"title":"DatacenterLocation","description":"Datacenter location information."},"ErrorChunkContent":{"properties":{"message":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Message","default":""},"type":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Type","default":""},"param":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Param","default":""},"code":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Code","default":""},"id":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Id","default":""}},"additionalProperties":true,"type":"object","title":"ErrorChunkContent"},"ErrorChunkResponse":{"properties":{"status_code":{"type":"integer","title":"Status Code"},"error":{"$ref":"#/components/schemas/ErrorChunkContent"}},"additionalProperties":true,"type":"object","required":["status_code","error"],"title":"ErrorChunkResponse"},"HTTPValidationError":{"properties":{"detail":{"items":{"$ref":"#/components/schemas/ValidationError"},"type":"array","title":"Detail"}},"type":"object","title":"HTTPValidationError"},"HuggingFaceCapabilities":{"properties":{"streaming":{"type":"boolean","title":"Streaming","default":true},"function_calling":{"type":"boolean","title":"Function Calling","default":false},"structured_outputs":{"type":"boolean","title":"Structured Outputs","default":false},"vision":{"type":"boolean","title":"Vision","default":false}},"type":"object","title":"HuggingFaceCapabilities","description":"HuggingFace capabilities format."},"HuggingFaceModel":{"properties":{"id":{"type":"string","title":"Id"},"hugging_face_id":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Hugging Face Id","description":"The corresponding HuggingFace Hub model ID"},"object":{"type":"string","const":"model","title":"Object","default":"model"},"created":{"type":"integer","title":"Created"},"owned_by":{"type":"string","title":"Owned By"},"context_length":{"type":"integer","title":"Context Length","description":"Supported context length in tokens"},"pricing":{"$ref":"#/components/schemas/HuggingFacePricing"},"capabilities":{"$ref":"#/components/schemas/HuggingFaceCapabilities"}},"type":"object","required":["id","created","owned_by","context_length","pricing"],"title":"HuggingFaceModel","description":"Model in HuggingFace-compatible format for inference providers.\n\nThis format is used by HuggingFace to power their provider comparison table\nand provider selection features."},"HuggingFaceModelsResponse":{"properties":{"object":{"type":"string","const":"list","title":"Object","default":"list"},"data":{"items":{"$ref":"#/components/schemas/HuggingFaceModel"},"type":"array","title":"Data"}},"type":"object","required":["data"],"title":"HuggingFaceModelsResponse","description":"HuggingFace-compatible list of models."},"HuggingFacePricing":{"properties":{"input":{"type":"number","title":"Input","description":"Price in USD per million input tokens"},"output":{"type":"number","title":"Output","description":"Price in USD per million output tokens"}},"type":"object","required":["input","output"],"title":"HuggingFacePricing","description":"HuggingFace pricing format - price in USD per million tokens."},"LogProbsContent":{"properties":{"token":{"type":"string","title":"Token"},"logprob":{"type":"number","title":"Logprob"},"bytes":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Bytes"},"top_logprobs":{"items":{"$ref":"#/components/schemas/TopLogProbs"},"type":"array","title":"Top Logprobs"}},"additionalProperties":true,"type":"object","required":["token","logprob","top_logprobs"],"title":"LogProbsContent"},"ModelArchitecture":{"properties":{"modality":{"type":"string","enum":["text","text+vision","multimodal"],"title":"Modality","description":"The modality of the model (e.g., 'text', 'text+vision', 'multimodal')."},"tokenizer":{"type":"string","title":"Tokenizer","description":"The tokenizer used by the model (e.g., 'Llama3', 'GPT4')."},"instruct_type":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Instruct Type","description":"The instruction format type used for fine-tuning (e.g., 'llama3', 'chatml')."}},"type":"object","required":["modality","tokenizer"],"title":"ModelArchitecture","description":"Architecture details of the model."},"ModelCapabilities":{"properties":{"streaming":{"type":"boolean","title":"Streaming","description":"Indicates if the model supports streaming responses via Server-Sent Events (SSE).","default":true},"function_calling":{"type":"boolean","title":"Function Calling","description":"Indicates if the model supports function calling (tool use).","default":false},"structured_outputs":{"type":"boolean","title":"Structured Outputs","description":"Indicates if the model supports structured outputs (e.g. JSON schema enforcement).","default":false},"vision":{"type":"boolean","title":"Vision","description":"Indicates if the model accepts image inputs (vision capabilities).","default":false},"json_mode":{"type":"boolean","title":"Json Mode","description":"Indicates if the model supports JSON mode (guaranteed JSON output).","default":false},"tools":{"type":"boolean","title":"Tools","description":"Indicates if the model supports the tools parameter.","default":false},"tool_choice":{"type":"boolean","title":"Tool Choice","description":"Indicates if the model supports the tool_choice parameter.","default":false},"parallel_tool_calls":{"type":"boolean","title":"Parallel Tool Calls","description":"Indicates if the model supports parallel tool calls.","default":false},"response_format":{"type":"boolean","title":"Response Format","description":"Indicates if the model supports the response_format parameter.","default":false},"reasoning":{"type":"boolean","title":"Reasoning","description":"Indicates if the model supports reasoning/chain-of-thought outputs.","default":false}},"type":"object","title":"ModelCapabilities","description":"Capabilities and features supported by the model."},"ModelFormat":{"type":"string","enum":["default","openrouter","huggingface"],"title":"ModelFormat","description":"Output format for public models endpoint."},"ModelLimits":{"properties":{"max_context_length":{"type":"integer","exclusiveMinimum":0.0,"title":"Max Context Length","description":"The maximum context window size in tokens."},"max_completion_tokens":{"type":"integer","exclusiveMinimum":0.0,"title":"Max Completion Tokens","description":"The maximum number of tokens that can be generated in a single completion."},"requests_per_minute":{"anyOf":[{"type":"integer","minimum":0.0},{"type":"null"}],"title":"Requests Per Minute","description":"The default rate limit for requests per minute (RPM)."},"tokens_per_minute":{"anyOf":[{"type":"integer","minimum":0.0},{"type":"null"}],"title":"Tokens Per Minute","description":"The default rate limit for tokens per minute (TPM)."}},"type":"object","required":["max_context_length","max_completion_tokens"],"title":"ModelLimits","description":"Rate limits and constraints for the model."},"ModelMetadata":{"properties":{"id":{"type":"string","title":"Id"},"object":{"type":"string","const":"model","title":"Object","default":"model"},"created":{"type":"integer","title":"Created","default":0},"owned_by":{"type":"string","title":"Owned By","default":""}},"additionalProperties":true,"type":"object","required":["id"],"title":"ModelMetadata"},"ModelMetadataList":{"properties":{"object":{"type":"string","const":"list","title":"Object","default":"list"},"data":{"items":{"$ref":"#/components/schemas/ModelMetadata"},"type":"array","title":"Data"}},"additionalProperties":true,"type":"object","required":["data"],"title":"ModelMetadataList"},"ModelPricing":{"properties":{"prompt":{"type":"string","pattern":"^(?!^[-+.]*$)[+-]?0*\\d*\\.?\\d*$","title":"Prompt","description":"Cost per token for prompt (input) tokens in USD."},"completion":{"type":"string","pattern":"^(?!^[-+.]*$)[+-]?0*\\d*\\.?\\d*$","title":"Completion","description":"Cost per token for completion (output) tokens in USD."}},"type":"object","required":["prompt","completion"],"title":"ModelPricing","description":"Pricing information for a model.","example":{"completion":"0.0000001","prompt":"0.0000001"}},"OpenRouterInfo":{"properties":{"slug":{"type":"string","title":"Slug","description":"OpenRouter slug for the model"}},"type":"object","required":["slug"],"title":"OpenRouterInfo","description":"OpenRouter metadata."},"OpenRouterModel":{"properties":{"id":{"type":"string","title":"Id","description":"Model ID with provider prefix, e.g., 'cerebras/llama3.1-8b'"},"hugging_face_id":{"type":"string","title":"Hugging Face Id","description":"The corresponding HuggingFace Hub model ID, if available","default":""},"name":{"type":"string","title":"Name"},"created":{"type":"integer","title":"Created","description":"Unix timestamp when model was created"},"input_modalities":{"items":{"type":"string"},"type":"array","title":"Input Modalities","description":"Supported input modalities (text, image, file)"},"output_modalities":{"items":{"type":"string"},"type":"array","title":"Output Modalities","description":"Supported output modalities (text, image, file)"},"quantization":{"type":"string","title":"Quantization","description":"Model quantization (fp16 only for Cerebras)","default":"fp16"},"context_length":{"type":"integer","title":"Context Length"},"max_output_length":{"type":"integer","title":"Max Output Length","description":"Maximum number of output tokens"},"pricing":{"$ref":"#/components/schemas/OpenRouterPricing"},"supported_sampling_parameters":{"items":{"type":"string"},"type":"array","title":"Supported Sampling Parameters","description":"List of supported sampling parameters"},"supported_features":{"items":{"type":"string"},"type":"array","title":"Supported Features","description":"List of supported features"},"description":{"type":"string","title":"Description","description":"Model description","default":""},"openrouter":{"anyOf":[{"$ref":"#/components/schemas/OpenRouterInfo"},{"type":"null"}],"description":"OpenRouter metadata"},"datacenters":{"items":{"$ref":"#/components/schemas/DatacenterLocation"},"type":"array","title":"Datacenters","description":"Datacenter locations"}},"type":"object","required":["id","name","created","context_length","max_output_length","pricing"],"title":"OpenRouterModel","description":"Model in OpenRouter-compatible format."},"OpenRouterModelsResponse":{"properties":{"data":{"items":{"$ref":"#/components/schemas/OpenRouterModel"},"type":"array","title":"Data"}},"type":"object","required":["data"],"title":"OpenRouterModelsResponse","description":"OpenRouter-compatible list of models."},"OpenRouterPricing":{"properties":{"prompt":{"type":"string","title":"Prompt","description":"Cost per input token as string"},"completion":{"type":"string","title":"Completion","description":"Cost per output token as string"},"request":{"type":"string","title":"Request","description":"Cost per request as string","default":"0"},"image":{"type":"string","title":"Image","description":"Cost per image as string","default":"0"},"input_cache_read":{"type":"string","title":"Input Cache Read","description":"Cost per cached input token read as string","default":"0"},"input_cache_write":{"type":"string","title":"Input Cache Write","description":"Cost per cached input token write as string","default":"0"}},"type":"object","required":["prompt","completion"],"title":"OpenRouterPricing","description":"OpenRouter pricing format."},"PublicModel":{"properties":{"id":{"type":"string","maxLength":200,"minLength":1,"title":"Id","description":"The unique identifier for the model (e.g., 'llama3.1-8b')."},"object":{"type":"string","const":"model","title":"Object","description":"The object type, which is always 'model'.","default":"model"},"created":{"type":"integer","minimum":0.0,"title":"Created","description":"The Unix timestamp (in seconds) when the model was created."},"owned_by":{"type":"string","minLength":1,"title":"Owned By","description":"The organization that owns or created the model."},"name":{"type":"string","minLength":1,"title":"Name","description":"The human-readable name of the model."},"description":{"type":"string","maxLength":1000,"minLength":1,"title":"Description","description":"A brief description of the model."},"hugging_face_id":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Hugging Face Id","description":"The corresponding HuggingFace Hub model ID, if available (e.g., 'meta-llama/Llama-3.1-8B-Instruct')."},"pricing":{"$ref":"#/components/schemas/ModelPricing","description":"Pricing details for the model."},"capabilities":{"$ref":"#/components/schemas/ModelCapabilities","description":"The capabilities supported by the model."},"supported_parameters":{"$ref":"#/components/schemas/SupportedParameters"},"architecture":{"$ref":"#/components/schemas/ModelArchitecture","description":"Technical architecture details of the model."},"limits":{"$ref":"#/components/schemas/ModelLimits","description":"Usage limits and constraints for the model."},"datacenter_locations":{"items":{"type":"string"},"type":"array","title":"Datacenter Locations","description":"List of datacenter locations where this model is deployed (e.g., ['us-east-1', 'eu-west-1'])."},"deprecated":{"type":"boolean","title":"Deprecated","description":"Indicates if the model is deprecated and should not be used for new applications.","default":false},"preview":{"type":"boolean","title":"Preview","description":"Indicates if the model is in preview or beta status.","default":false},"quantization":{"anyOf":[{"type":"string"},{"type":"null"}],"title":"Quantization","description":"Quantization precision (e.g., 'FP16', 'FP16/FP8 (weights only)')."}},"type":"object","required":["id","created","owned_by","name","description","pricing","capabilities","supported_parameters","architecture","limits"],"title":"PublicModel","description":"Complete model specification following OpenAI-compatible schema\nwith extensions for OpenRouter/HuggingFace compatibility."},"PublicModelsListResponse":{"properties":{"object":{"type":"string","const":"list","title":"Object","description":"Object type (always 'list')","default":"list"},"data":{"items":{"$ref":"#/components/schemas/PublicModel"},"type":"array","title":"Data","description":"Array of model objects"}},"type":"object","required":["data"],"title":"PublicModelsListResponse","description":"OpenAI-compatible list of models."},"SupportedParameters":{"properties":{"temperature":{"type":"boolean","title":"Temperature","description":"Supports temperature sampling parameter.","default":true},"top_p":{"type":"boolean","title":"Top P","description":"Supports top_p (nucleus) sampling parameter.","default":true},"seed":{"type":"boolean","title":"Seed","description":"Supports seed for reproducible outputs.","default":true},"stop":{"type":"boolean","title":"Stop","description":"Supports stop sequences parameter.","default":true},"max_completion_tokens":{"type":"boolean","title":"Max Completion Tokens","description":"Supports max_completion_tokens parameter.","default":true},"logprobs":{"type":"boolean","title":"Logprobs","description":"Supports logprobs output.","default":false},"top_logprobs":{"type":"boolean","title":"Top Logprobs","description":"Supports top_logprobs parameter.","default":false},"frequency_penalty":{"type":"boolean","title":"Frequency Penalty","description":"Supports frequency_penalty parameter.","default":false},"presence_penalty":{"type":"boolean","title":"Presence Penalty","description":"Supports presence_penalty parameter.","default":false},"logit_bias":{"type":"boolean","title":"Logit Bias","description":"Supports logit_bias parameter.","default":false},"repetition_penalty":{"type":"boolean","title":"Repetition Penalty","description":"Supports repetition_penalty parameter.","default":false}},"type":"object","title":"SupportedParameters","description":"Sampling parameters supported by the model."},"TimeInfo":{"properties":{"queue_time":{"anyOf":[{"type":"number","minimum":0.0},{"type":"null"}],"title":"Queue Time"},"prompt_time":{"anyOf":[{"type":"number","minimum":0.0},{"type":"null"}],"title":"Prompt Time"},"completion_time":{"anyOf":[{"type":"number","minimum":0.0},{"type":"null"}],"title":"Completion Time"},"total_time":{"anyOf":[{"type":"number","minimum":0.0},{"type":"null"}],"title":"Total Time"}},"additionalProperties":true,"type":"object","title":"TimeInfo","description":"Time information for different phases of request processing.\n\nAll times are measured in seconds.","examples":[{"completion_time":0.44,"prompt_time":0.02,"queue_time":0.0,"total_time":0.46}]},"TopLogProbs":{"properties":{"token":{"type":"string","title":"Token"},"logprob":{"type":"number","title":"Logprob"},"bytes":{"anyOf":[{"items":{"type":"integer"},"type":"array"},{"type":"null"}],"title":"Bytes"}},"additionalProperties":true,"type":"object","required":["token","logprob"],"title":"TopLogProbs"},"Usage":{"additionalProperties":true,"type":"object"},"ValidationError":{"properties":{"loc":{"items":{"anyOf":[{"type":"string"},{"type":"integer"}]},"type":"array","title":"Location"},"msg":{"type":"string","title":"Message"},"type":{"type":"string","title":"Error Type"}},"type":"object","required":["loc","msg","type"],"title":"ValidationError"}},"securitySchemes":{"HTTPBearer":{"type":"http","scheme":"bearer"}}}}