|
33 | 33 | },
|
34 | 34 |
|
35 | 35 | "ollama": {
|
| 36 | + "command-r": 12800, |
| 37 | + "command-r-plus": 12800, |
| 38 | + "codellama": 16000, |
| 39 | + "dbrx": 32768, |
| 40 | + "dbrx:instruct": 32768, |
| 41 | + "deepseek-coder:33b": 16000, |
| 42 | + "dolphin-mixtral": 32000, |
36 | 43 | "llama2": 4096,
|
37 | 44 | "llama3": 8192,
|
| 45 | + "llama3:70b-instruct": 8192, |
38 | 46 | "llava": 4096,
|
| 47 | + "llava:34b": 4096, |
39 | 48 | "llava_next": 4096,
|
40 | 49 | "mistral": 8192,
|
41 |
| - "codellama": 16000, |
42 |
| - "dolphin-mixtral": 32000, |
43 |
| - "mistral-openorca": 32000, |
44 |
| - "stablelm-zephyr": 8192, |
45 |
| - "command-r-plus": 12800, |
46 |
| - "command-r": 12800, |
47 | 50 | "mistral:7b-instruct": 32768,
|
48 |
| - "llama3:70b-instruct": 8192, |
| 51 | + "mistral-openorca": 32000, |
49 | 52 | "mixtral:8x22b-instruct": 65536,
|
50 |
| - "wizardlm2:8x22b": 65536, |
51 |
| - "dbrx": 32768, |
52 |
| - "dbrx:instruct": 32768, |
53 | 53 | "nous-hermes2:34b": 4096,
|
54 | 54 | "orca-mini": 2048,
|
| 55 | + "phi3:3.8b": 12800, |
| 56 | + "phi3:14b": 12800, |
| 57 | + "qwen:0.5b": 32000, |
| 58 | + "qwen:1.8b": 32000, |
| 59 | + "qwen:4b": 32000, |
| 60 | + "qwen:14b": 32000, |
| 61 | + "qwen:32b": 32000, |
| 62 | + "qwen:72b": 32000, |
| 63 | + "qwen:110b": 32000, |
| 64 | + "stablelm-zephyr": 8192, |
| 65 | + "wizardlm2:8x22b": 65536, |
55 | 66 | # embedding models
|
56 | 67 | "nomic-embed-text": 8192,
|
57 | 68 | "snowflake-arctic-embed:335m": 8192,
|
|
0 commit comments