models.json

{
    "GPT": 
    {
        "gpt-4o-mini":
        {
            "label": "Our affordable and intelligent small model for fast, lightweight tasks. GPT-4o mini is cheaper and more capable than GPT-3.5 Turbo. Currently points to gpt-4o-mini-2024-07-18.",
            "max_token": 16384,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4o-mini-2024-07-18":
        {
            "label": "Our affordable and intelligent small model for fast, lightweight tasks. GPT-4o mini is cheaper and more capable than GPT-3.5 Turbo.",
            "max_token": 16384,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4o":
        {
            "label": "Our high-intelligence flagship model for complex, multi-step tasks. GPT-4o is cheaper and faster than GPT-4 Turbo. Currently points to gpt-4o-2024-08-06.",
            "max_token": 16384,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240806)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4o-2024-08-06":
        {
            "label": "Latest snapshot that supports Structured Outputs. gpt-4o currently points to this version.",
            "max_token": 16384,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240806)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4o-2024-05-13":
        {
            "label": "Original gpt-4o snapshot from May 13, 2024.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "o1-preview":
        {
            "label": "o1 series of large language models are trained with reinforcement learning to perform complex reasoning. o1 models think before they answer, producing a long internal chain of thought before responding to the user. o1-preview: reasoning model designed to solve hard problems across domains. Points to the most recent snapshot of the o1 model: o1-preview-2024-09-12",
            "max_token": 32768,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240912)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "o1-mini":
        {
            "label": "o1 series of large language models are trained with reinforcement learning to perform complex reasoning. o1 models think before they answer, producing a long internal chain of thought before responding to the user. o1-mini: faster and cheaper reasoning model particularly good at coding, math, and science. Points to the most recent o1-mini snapshot: o1-mini-2024-09-12",
            "max_token": 65536,
            "context_token": 128000,
            "data": "Up to Oct 2023 (as of 20240912)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4-turbo":
        {
            "label": "The latest GPT-4 Turbo model with vision capabilities. Currently points to gpt-4-turbo-2024-04-09.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Dec 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4-turbo-2024-04-09":
        {
            "label": "GPT-4 Turbo with Vision model. gpt-4-turbo currently points to this version.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Dec 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": "vision"
        },
        "gpt-4-turbo-preview":
        {
            "label": "Currently points to gpt-4-0125-preview: The latest GPT-4 model intended to reduce cases of laziness where the model doesn’t complete a task. Returns a maximum of 4,096 output tokens.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Dec 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-4-0125-preview":
        {
            "label": "GPT-4 Turbo preview model intended to reduce cases of laziness where the model doesn’t complete a task. Returns a maximum of 4,096 output tokens.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Dec 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-4-1106-preview":
        {
            "label": "GPT-4 Turbo model featuring improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more. Returns a maximum of 4,096 output tokens. This is a preview model.",
            "max_token": 4096,
            "context_token": 128000,
            "data": "Up to Apr 2023 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-4":
        {
            "label": "Currently points to gpt-4-0613: Snapshot of gpt-4 from June 13th 2023 with improved function calling support.",
            "max_token": 4096,
            "context_token": 8192,
            "data": "Up to Sep 2021 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-4-0613":
        {
            "label": "Snapshot of gpt-4 from June 13th 2023 with improved function calling support.",
            "max_token": 4096,
            "context_token": 8192,
            "data": "Up to Sep 2021 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-4-32k":
        {
            "label": "Currently points to gpt-4-32k-0613: Snapshot of gpt-4-32k from June 13th 2023 with improved function calling support. This model was never rolled out widely in favor of GPT-4 Turbo.",
            "max_token": 4096,
            "context_token": 32768,
            "data": "Up to Sep 2021 (as of 20240606)",
            "status": "deprecated",
            "status_details": "",
            "capability": ""
        },
        "gpt-4-32k-0613":
        {
            "label": "Snapshot of gpt-4-32k from June 13th 2023 with improved function calling support. This model was never rolled out widely in favor of GPT-4 Turbo.",
            "max_token": 4096,
            "context_token": 32768,
            "data": "Up to Sep 2021 (as of 20240606)",
            "status": "deprecated",
            "status_details": "",
            "capability": ""
        },
        "gpt-3.5-turbo-0125":
        {
            "label": "The latest GPT-3.5 Turbo model with higher accuracy at responding in requested formats and a fix for a bug which caused a text encoding issue for non-English language function calls. Returns a maximum of 4,096 output tokens.",
            "max_token": 4096,
            "context_token": 16385,
            "data": "Up to Sep 2021 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-3.5-turbo":
        {
            "label": "Currently points to gpt-3.5-turbo-0125: The latest GPT-3.5 Turbo model with higher accuracy at responding in requested formats and a fix for a bug which caused a text encoding issue for non-English language function calls. Returns a maximum of 4,096 output tokens.",
            "max_token": 4096,
            "context_token": 16385,
            "data": "Up to Sep 2021 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-3.5-turbo-1106":
        {
            "label": "GPT-3.5 Turbo model with improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more. Returns a maximum of 4,096 output tokens.",
            "max_token": 4096,
            "context_token": 16385,
            "data": "Up to Sep 2021 (as of 20240718)",
            "status": "active",
            "status_details": "",
            "capability": ""
        },
        "gpt-3.5-turbo-16k":
        {
            "label": "Currently points to gpt-3.5-turbo-16k-0613: Snapshot of gpt-3.5-turbo from June 13th 2023. Will be deprecated on June 13, 2024.",
            "max_token": 4096,
            "context_token": 16385,
            "data": "Up to Sep 2021 (as of 20240513)",
            "status": "deprecated",
            "status_details": "Will be deprecated on June 13, 2024.",
            "capability": ""
        },
        "gpt-3.5-turbo-0613":
        {
            "label": "Snapshot of gpt-3.5-turbo from June 13th 2023. Will be deprecated on June 13, 2024.",
            "max_token": 4096,
            "context_token": 4096,
            "data": "Up to Sep 2021 (as of 20240513)",
            "status": "deprecated",
            "status_details": "Will be deprecated on June 13, 2024.",
            "capability": ""
        },
        "gpt-3.5-turbo-16k-0613":
        {
            "label": "Snapshot of gpt-3.5-16k-turbo from June 13th 2023. Will be deprecated on June 13, 2024.",
            "max_token": 4096,
            "context_token": 16385,
            "data": "Up to Sep 2021 (as of 20240513)",
            "status": "deprecated",
            "status_details": "Will be deprecated on June 13, 2024.",
            "capability": ""
        }
    },
    "DallE":
    {
        "dall-e-3":
        {
            "label": "The latest DALL·E model released in Nov 2023. The maximum prompt length is 4000 characters.",
            "image_size": ["1024x1024", "1024x1792", "1792x1024"],
            "max_prompt_length": 4000,
            "status": "active",
            "status_details": ""
        },
        "dall-e-2":
        {
            "label": "The previous DALL·E model released in Nov 2022. The maximum prompt length is 1000 characters.",
            "image_size": ["256x256", "512x512", "1024x1024"],
            "max_prompt_length": 1000,
            "status": "active",
            "status_details": ""
        }
    }
}