xref: /plugin/aichat/Model/OpenAI/models.json (revision 10789c175b44bee75b54261fbdf3bb1e6d176759)
1{
2    "chat": {
3        "gpt-3.5-turbo": {
4            "description": "GPT-3.5 Turbo is a variant of GPT-3.5 that is optimized for speed and can generate responses in a fraction of the time.",
5            "inputTokens": 16385,
6            "inputTokenPrice": 1.5,
7            "outputTokens": 4096,
8            "outputTokenPrice": 2
9        },
10        "gpt-4": {
11            "description": "GPT-4 is a version of OpenAI's Generative Pre-trained Transformer (GPT) language model. It is capable of generating human-like text and can be used for a wide range of natural language processing tasks.",
12            "inputTokens": 8192,
13            "inputTokenPrice": 30,
14            "outputTokens": 4096,
15            "outputTokenPrice": 60
16        },
17        "gpt-4-turbo": {
18            "description": "GPT-4 Turbo is a variant of GPT-4 that is optimized for speed and can generate responses in a fraction of the time.",
19            "inputTokens": 128000,
20            "inputTokenPrice": 10,
21            "outputTokens": 4096,
22            "outputTokenPrice": 30
23        },
24        "gpt-4o": {
25            "description": "GPT-4o has the same high intelligence as GPT-4 Turbo but is much more efficient.",
26            "inputTokens": 128000,
27            "inputTokenPrice": 2.5,
28            "outputTokens": 16384,
29            "outputTokenPrice": 10
30        },
31        "gpt-4o-mini": {
32            "description": "",
33            "inputTokens": 128000,
34            "inputTokenPrice": 0.15,
35            "outputTokens": 16384,
36            "outputTokenPrice": 0.6
37        },
38        "gpt-4-32k": {
39            "description": "",
40            "inputTokens": 32768,
41            "inputTokenPrice": 60,
42            "outputTokens": 4096,
43            "outputTokenPrice": 120
44        },
45        "gpt-3.5-turbo-16k": {
46            "description": "",
47            "inputTokens": 16385,
48            "inputTokenPrice": 3,
49            "outputTokens": 4096,
50            "outputTokenPrice": 4
51        },
52        "o1-mini": {
53            "description": "",
54            "inputTokens": 128000,
55            "inputTokenPrice": 3,
56            "outputTokens": 65536,
57            "outputTokenPrice": 12
58        },
59        "chatgpt-4o-latest": {
60            "description": "",
61            "inputTokens": 128000,
62            "inputTokenPrice": 5,
63            "outputTokens": 4096,
64            "outputTokenPrice": 15
65        }
66    },
67    "embedding": {
68        "text-embedding-ada-002": {
69            "description": "Most capable 2nd generation embedding model",
70            "inputTokens": 8191,
71            "inputTokenPrice": 0.1,
72            "dimensions": 1536
73        },
74        "text-embedding-3-small": {
75            "description": "Increased performance over 2nd generation ada embedding model",
76            "inputTokens": 8191,
77            "inputTokenPrice": 0.02,
78            "dimensions": 1536
79        },
80        "text-embedding-3-large": {
81            "description": "Most capable embedding model for both English and non-English tasks",
82            "inputTokens": 8191,
83            "inputTokenPrice": 0.13,
84            "dimensions": 3072
85        },
86        "text-embedding-ada-002-v2": {
87            "description": "",
88            "inputTokens": 8191,
89            "inputTokenPrice": 0.1,
90            "dimensions": 1536
91        }
92    }
93}