|
51 | 51 | "gemini-1.5-pro-latest": 128000,
|
52 | 52 | "models/embedding-001": 2048
|
53 | 53 | },
|
54 |
| - "ollama": { "command-r": 12800, |
55 |
| - "codellama": 16000, |
56 |
| - "dbrx": 32768, |
57 |
| - "deepseek-coder:33b": 16000, |
58 |
| - "falcon": 2048, |
59 |
| - "llama2": 4096, |
60 |
| - "llama3": 8192, |
61 |
| - "llama3:70b": 8192, |
62 |
| - "llama3.1":128000, |
63 |
| - "llama3.1:8b": 128000, |
64 |
| - "llama3.1:70b": 128000, |
65 |
| - "lama3.1:405b": 128000, |
66 |
| - "scrapegraph": 8192, |
67 |
| - "llava": 4096, |
68 |
| - "mixtral:8x22b-instruct": 65536, |
69 |
| - "mistral-openorca": 32000, |
70 |
| - "nomic-embed-text": 8192, |
71 |
| - "nous-hermes2:34b": 4096, |
72 |
| - "orca-mini": 2048, |
73 |
| - "phi3:3.8b": 12800, |
74 |
| - "qwen:0.5b": 32000, |
75 |
| - "qwen:1.8b": 32000, |
76 |
| - "qwen:4b": 32000, |
77 |
| - "qwen:14b": 32000, |
78 |
| - "qwen:32b": 32000, |
79 |
| - "qwen:72b": 32000, |
80 |
| - "qwen:110b": 32000, |
81 |
| - "stablelm-zephyr": 8192, |
82 |
| - "wizardlm2:8x22b": 65536, |
83 |
| - # embedding models |
84 |
| - "shaw/dmeta-embedding-zh-small-q4": 8192, |
85 |
| - "shaw/dmeta-embedding-zh-q4": 8192, |
86 |
| - "chevalblanc/acge_text_embedding": 8192, |
87 |
| - "martcreation/dmeta-embedding-zh": 8192, |
88 |
| - "snowflake-arctic-embed": 8192, |
89 |
| - "mxbai-embed-large": 512 |
| 54 | + "ollama": { |
| 55 | + "command-r": 12800, |
| 56 | + "codellama": 16000, |
| 57 | + "dbrx": 32768, |
| 58 | + "deepseek-coder:33b": 16000, |
| 59 | + "falcon": 2048, |
| 60 | + "llama2": 4096, |
| 61 | + "llama3": 8192, |
| 62 | + "llama3:70b": 8192, |
| 63 | + "llama3.1":128000, |
| 64 | + "llama3.1:8b": 128000, |
| 65 | + "llama3.1:70b": 128000, |
| 66 | + "llama3.1:405b": 128000, |
| 67 | + "scrapegraph": 8192, |
| 68 | + "llava": 4096, |
| 69 | + "mixtral:8x22b-instruct": 65536, |
| 70 | + "mistral-openorca": 32000, |
| 71 | + "nomic-embed-text": 8192, |
| 72 | + "nous-hermes2:34b": 4096, |
| 73 | + "orca-mini": 2048, |
| 74 | + "phi3:3.8b": 12800, |
| 75 | + "qwen:0.5b": 32000, |
| 76 | + "qwen:1.8b": 32000, |
| 77 | + "qwen:4b": 32000, |
| 78 | + "qwen:14b": 32000, |
| 79 | + "qwen:32b": 32000, |
| 80 | + "qwen:72b": 32000, |
| 81 | + "qwen:110b": 32000, |
| 82 | + "stablelm-zephyr": 8192, |
| 83 | + "wizardlm2:8x22b": 65536, |
| 84 | + # embedding models |
| 85 | + "shaw/dmeta-embedding-zh-small-q4": 8192, |
| 86 | + "shaw/dmeta-embedding-zh-q4": 8192, |
| 87 | + "chevalblanc/acge_text_embedding": 8192, |
| 88 | + "martcreation/dmeta-embedding-zh": 8192, |
| 89 | + "snowflake-arctic-embed": 8192, |
| 90 | + "mxbai-embed-large": 512, |
90 | 91 | },
|
91 | 92 | "oneapi": {
|
92 |
| - "qwen-turbo": 6000 |
| 93 | + "qwen-turbo": 6000, |
93 | 94 | },
|
94 |
| - "nvidia": { |
| 95 | + "nvidia": {
95 | 96 | "meta/llama3-70b-instruct": 419,
|
96 | 97 | "meta/llama3-8b-instruct": 419,
|
97 | 98 | "nemotron-4-340b-instruct": 1024,
|
98 |
| - "databricks/dbrx-instruct": 4096, |
99 |
| - "google/codegemma-7b": 8192, |
100 |
| - "google/gemma-2b": 2048, |
101 |
| - "google/gemma-7b": 8192, |
102 |
| - "google/recurrentgemma-2b": 2048, |
103 |
| - "meta/codellama-70b": 16384, |
104 |
| - "meta/llama2-70b": 4096, |
105 |
| - "microsoft/phi-3-mini-128k-instruct": 122880, |
106 |
| - "mistralai/mistral-7b-instruct-v0.2": 4096, |
107 |
| - "mistralai/mistral-large": 8192, |
108 |
| - "mistralai/mixtral-8x22b-instruct-v0.1": 32768, |
109 |
| - "mistralai/mixtral-8x7b-instruct-v0.1": 8192, |
110 |
| - "snowflake/arctic": 16384, |
| 99 | + "databricks/dbrx-instruct": 4096, |
| 100 | + "google/codegemma-7b": 8192, |
| 101 | + "google/gemma-2b": 2048, |
| 102 | + "google/gemma-7b": 8192, |
| 103 | + "google/recurrentgemma-2b": 2048, |
| 104 | + "meta/codellama-70b": 16384, |
| 105 | + "meta/llama2-70b": 4096, |
| 106 | + "microsoft/phi-3-mini-128k-instruct": 122880, |
| 107 | + "mistralai/mistral-7b-instruct-v0.2": 4096, |
| 108 | + "mistralai/mistral-large": 8192, |
| 109 | + "mistralai/mixtral-8x22b-instruct-v0.1": 32768, |
| 110 | + "mistralai/mixtral-8x7b-instruct-v0.1": 8192, |
| 111 | + "snowflake/arctic": 16384, |
111 | 112 | },
|
112 | 113 | "groq": {
|
113 | 114 | "llama3-8b-8192": 8192,
|
114 | 115 | "llama3-70b-8192": 8192,
|
115 | 116 | "mixtral-8x7b-32768": 32768,
|
116 | 117 | "gemma-7b-it": 8192,
|
117 |
| - "claude-3-haiku-20240307'": 8192 |
| 118 | + "claude-3-haiku-20240307": 8192, |
118 | 119 | },
|
119 | 120 | "claude": {
|
120 | 121 | "claude_instant": 100000,
|
|
125 | 126 | "claude-3-opus-20240229": 200000,
|
126 | 127 | "claude-3-sonnet-20240229": 200000,
|
127 | 128 | "claude-3-haiku-20240307": 200000,
|
128 |
| - "claude-3-5-sonnet-20240620": 200000 |
| 129 | + "claude-3-5-sonnet-20240620": 200000, |
129 | 130 | },
|
130 | 131 | "google_vertexai": {
|
131 | 132 | "gemini-1.5-flash": 128000,
|
132 | 133 | "gemini-1.5-pro": 128000,
|
133 |
| - "gemini-1.0-pro": 128000 |
| 134 | + "gemini-1.0-pro": 128000, |
134 | 135 | },
|
135 | 136 | "bedrock": {
|
136 | 137 | "anthropic.claude-3-haiku-20240307-v1:0": 200000,
|
|
149 | 150 | "amazon.titan-embed-text-v1": 8000,
|
150 | 151 | "amazon.titan-embed-text-v2:0": 8000,
|
151 | 152 | "cohere.embed-english-v3": 512,
|
152 |
| - "cohere.embed-multilingual-v3": 512 |
| 153 | + "cohere.embed-multilingual-v3": 512, |
153 | 154 | },
|
154 | 155 | "mistralai": {
|
155 | 156 | "mistral-large-latest": 128000,
|
|
159 | 160 | "open-mistral-7b": 32000,
|
160 | 161 | "open-mixtral-8x7b": 32000,
|
161 | 162 | "open-mixtral-8x22b": 64000,
|
162 |
| - "open-codestral-mamba": 256000 |
| 163 | + "open-codestral-mamba": 256000, |
163 | 164 | },
|
164 | 165 | "hugging_face": {
|
165 | 166 | "xai-org/grok-1": 8192,
|
|
193 | 194 | "TheBloke/dolphin-2.7-mixtral-8x7b-GGUF": 32768,
|
194 | 195 | "deepseek-ai/DeepSeek-V2": 131072,
|
195 | 196 | "deepseek-ai/DeepSeek-V2-Chat": 131072,
|
196 |
| - "claude-3-haiku": 200000 |
| 197 | + "claude-3-haiku": 200000, |
197 | 198 | },
|
198 | 199 | "deepseek": {
|
199 | 200 | "deepseek-chat": 28672,
|
200 |
| - "deepseek-coder": 16384 |
| 201 | + "deepseek-coder": 16384, |
201 | 202 | },
|
202 | 203 | "ernie": {
|
203 | 204 | "ernie-bot-turbo": 4096,
|
|
207 | 208 | "ernie-bot-2-base-zh": 4096,
|
208 | 209 | "ernie-bot-2-base-en": 4096,
|
209 | 210 | "ernie-bot-2-base-en-zh": 4096,
|
210 |
| - "ernie-bot-2-base-zh-en": 4096 |
| 211 | + "ernie-bot-2-base-zh-en": 4096, |
211 | 212 | },
|
212 | 213 | "fireworks": {
|
213 | 214 | "llama-v2-7b": 4096,
|
214 | 215 | "mixtral-8x7b-instruct": 4096,
|
215 |
| - "nomic-ai/nomic-embed-text-v1.5": 8192, |
| 216 | + "nomic-ai/nomic-embed-text-v1.5": 8192, |
216 | 217 | "llama-3.1-405B-instruct": 131072,
|
217 | 218 | "llama-3.1-70B-instruct": 131072,
|
218 | 219 | "llama-3.1-8B-instruct": 131072,
|
219 | 220 | "mixtral-moe-8x22B-instruct": 65536,
|
220 |
| - "mixtral-moe-8x7B-instruct": 65536 |
| 221 | + "mixtral-moe-8x7B-instruct": 65536, |
221 | 222 | },
|
222 | 223 | }
|
0 commit comments