Model/OpenAI/models.json

{
    "chat": {
        "gpt-3.5-turbo": {
            "description": "GPT-3.5 Turbo is a variant of GPT-3.5 that is optimized for speed and can generate responses in a fraction of the time.",
            "inputTokens": 16385,
            "inputTokenPrice": 1.5,
            "outputTokens": 4096,
            "outputTokenPrice": 2
        },
        "gpt-4": {
            "description": "GPT-4 is the latest version of OpenAI's Generative Pre-trained Transformer (GPT) language model. It is capable of generating human-like text and can be used for a wide range of natural language processing tasks.",
            "inputTokens": 8192,
            "inputTokenPrice": 30,
            "outputTokens": 4096,
            "outputTokenPrice": 60
        },
        "gpt-4-turbo": {
            "description": "GPT-4 Turbo is a variant of GPT-4 that is optimized for speed and can generate responses in a fraction of the time.",
            "inputTokens": 128000,
            "inputTokenPrice": 10,
            "outputTokens": 4096,
            "outputTokenPrice": 30
        },
        "gpt-4o": {
            "description": "GPT-4o has the same high intelligence as GPT-4 Turbo but is much more efficient",
            "inputTokens": 128000,
            "inputTokenPrice": 2.5,
            "outputTokens": 16384,
            "outputTokenPrice": 10
        },
        "gpt-4o-mini": {
            "description": "",
            "inputTokens": 128000,
            "inputTokenPrice": 0.15,
            "outputTokens": 16384,
            "outputTokenPrice": 0.6
        },
        "gpt-4-32k": {
            "description": "",
            "inputTokens": 32768,
            "inputTokenPrice": 60,
            "outputTokens": 4096,
            "outputTokenPrice": 120
        },
        "gpt-3.5-turbo-16k": {
            "description": "",
            "inputTokens": 16385,
            "inputTokenPrice": 3,
            "outputTokens": 4096,
            "outputTokenPrice": 4
        },
        "o1-mini": {
            "description": "",
            "inputTokens": 128000,
            "inputTokenPrice": 1.1,
            "outputTokens": 65536,
            "outputTokenPrice": 4.4
        },
        "chatgpt-4o-latest": {
            "description": "",
            "inputTokens": 128000,
            "inputTokenPrice": 5,
            "outputTokens": 4096,
            "outputTokenPrice": 15
        },
        "o1": {
            "description": "",
            "inputTokens": 200000,
            "inputTokenPrice": 15,
            "outputTokens": 100000,
            "outputTokenPrice": 60
        },
        "o3-mini": {
            "description": "",
            "inputTokens": 200000,
            "inputTokenPrice": 1.1,
            "outputTokens": 100000,
            "outputTokenPrice": 4.4
        }
    },
    "embedding": {
        "text-embedding-ada-002": {
            "description": "Most capable 2nd generation embedding model",
            "inputTokens": 8191,
            "inputTokenPrice": 0.1,
            "dimensions": 1536
        },
        "text-embedding-3-small": {
            "description": "Increased performance over 2nd generation ada embedding model",
            "inputTokens": 8191,
            "inputTokenPrice": 0.02,
            "dimensions": 1536
        },
        "text-embedding-3-large": {
            "description": "Most capable embedding model for both english and non-english tasks",
            "inputTokens": 8191,
            "inputTokenPrice": 0.13,
            "dimensions": 3072
        },
        "text-embedding-ada-002-v2": {
            "description": "",
            "inputTokens": 8191,
            "inputTokenPrice": 0.1,
            "dimensions": 1536
        }
    }
}