Skip to content

Commit

Permalink
add known context lengths for hosted models (#14436)
Browse files Browse the repository at this point in the history
  • Loading branch information
mattf authored Jun 27, 2024
1 parent 663e170 commit 8d5ea16
Show file tree
Hide file tree
Showing 2 changed files with 28 additions and 10 deletions.
Original file line number Diff line number Diff line change
@@ -1,17 +1,35 @@
from typing import Dict, Optional

# Known context lengths for hosted API-catalog models, keyed by model id.
# Values are presumably maximum context sizes in tokens -- confirm against
# the service's model cards before relying on the unit.
#
# Each model id must appear exactly once: Python silently keeps only the
# last value for a repeated key in a dict literal, so a duplicate entry
# would hide whichever value was listed first. Keys are kept in
# alphabetical order to make accidental duplicates easy to spot.
API_CATALOG_MODELS: Dict[str, int] = {
    "01-ai/yi-large": 16384,
    "aisingapore/sea-lion-7b-instruct": 1024,
    "databricks/dbrx-instruct": 2048,
    "google/codegemma-1.1-7b": 1024,
    "google/codegemma-7b": 4096,
    "google/gemma-2b": 4096,
    "google/gemma-7b": 4096,
    "google/recurrentgemma-2b": 1024,
    "ibm/granite-34b-code-instruct": 2048,
    "ibm/granite-8b-code-instruct": 4096,
    "mediatek/breeze-7b-instruct": 1024,
    "meta/codellama-70b": 1024,
    "meta/llama2-70b": 1024,
    "meta/llama3-70b-instruct": 8192,
    "meta/llama3-8b-instruct": 8192,
    "microsoft/phi-3-medium-4k-instruct": 1024,
    "microsoft/phi-3-mini-128k-instruct": 2048,
    "microsoft/phi-3-mini-4k-instruct": 2048,
    "microsoft/phi-3-small-128k-instruct": 2048,
    "microsoft/phi-3-small-8k-instruct": 2048,
    "mistralai/codestral-22b-instruct-v0.1": 32768,
    "mistralai/mistral-7b-instruct-v0.2": 16384,
    "mistralai/mistral-7b-instruct-v0.3": 32768,
    "mistralai/mistral-large": 16384,
    "mistralai/mixtral-8x22b-instruct-v0.1": 65536,
    "mistralai/mixtral-8x7b-instruct-v0.1": 16384,
    "nvidia/llama3-chatqa-1.5-70b": 1024,
    "nvidia/llama3-chatqa-1.5-8b": 1024,
    "nvidia/nemotron-4-340b-instruct": 2048,
    "seallms/seallm-7b-v2.5": 4096,
    "upstage/solar-10.7b-instruct": 4096,
}


Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ license = "MIT"
name = "llama-index-llms-nvidia"
packages = [{include = "llama_index/"}]
readme = "README.md"
version = "0.1.3"
version = "0.1.4"

[tool.poetry.dependencies]
python = ">=3.8.1,<4.0"
Expand Down

0 comments on commit 8d5ea16

Please sign in to comment.