Nvidia NIM | liteLLM

nvidia/nemotron-4-340b-reward

completion(model="nvidia_nim/nvidia/nemotron-4-340b-reward", messages)

01-ai/yi-large

completion(model="nvidia_nim/01-ai/yi-large", messages)

aisingapore/sea-lion-7b-instruct

completion(model="nvidia_nim/aisingapore/sea-lion-7b-instruct", messages)

databricks/dbrx-instruct

completion(model="nvidia_nim/databricks/dbrx-instruct", messages)

google/gemma-7b

completion(model="nvidia_nim/google/gemma-7b", messages)

google/gemma-2b

completion(model="nvidia_nim/google/gemma-2b", messages)

google/codegemma-1.1-7b

completion(model="nvidia_nim/google/codegemma-1.1-7b", messages)

google/codegemma-7b

completion(model="nvidia_nim/google/codegemma-7b", messages)

google/recurrentgemma-2b

completion(model="nvidia_nim/google/recurrentgemma-2b", messages)

ibm/granite-34b-code-instruct

completion(model="nvidia_nim/ibm/granite-34b-code-instruct", messages)

ibm/granite-8b-code-instruct

completion(model="nvidia_nim/ibm/granite-8b-code-instruct", messages)

mediatek/breeze-7b-instruct

completion(model="nvidia_nim/mediatek/breeze-7b-instruct", messages)

meta/codellama-70b

completion(model="nvidia_nim/meta/codellama-70b", messages)

meta/llama2-70b

completion(model="nvidia_nim/meta/llama2-70b", messages)

meta/llama3-8b

completion(model="nvidia_nim/meta/llama3-8b", messages)

meta/llama3-70b

completion(model="nvidia_nim/meta/llama3-70b", messages)

microsoft/phi-3-medium-4k-instruct

completion(model="nvidia_nim/microsoft/phi-3-medium-4k-instruct", messages)

microsoft/phi-3-mini-128k-instruct

completion(model="nvidia_nim/microsoft/phi-3-mini-128k-instruct", messages)

microsoft/phi-3-mini-4k-instruct

completion(model="nvidia_nim/microsoft/phi-3-mini-4k-instruct", messages)

microsoft/phi-3-small-128k-instruct

completion(model="nvidia_nim/microsoft/phi-3-small-128k-instruct", messages)

microsoft/phi-3-small-8k-instruct

completion(model="nvidia_nim/microsoft/phi-3-small-8k-instruct", messages)

mistralai/codestral-22b-instruct-v0.1

completion(model="nvidia_nim/mistralai/codestral-22b-instruct-v0.1", messages)

mistralai/mistral-7b-instruct

completion(model="nvidia_nim/mistralai/mistral-7b-instruct", messages)

mistralai/mistral-7b-instruct-v0.3

completion(model="nvidia_nim/mistralai/mistral-7b-instruct-v0.3", messages)

mistralai/mixtral-8x7b-instruct

completion(model="nvidia_nim/mistralai/mixtral-8x7b-instruct", messages)

mistralai/mixtral-8x22b-instruct

completion(model="nvidia_nim/mistralai/mixtral-8x22b-instruct", messages)

mistralai/mistral-large

completion(model="nvidia_nim/mistralai/mistral-large", messages)

nvidia/nemotron-4-340b-instruct

completion(model="nvidia_nim/nvidia/nemotron-4-340b-instruct", messages)

seallms/seallm-7b-v2.5

completion(model="nvidia_nim/seallms/seallm-7b-v2.5", messages)

snowflake/arctic

completion(model="nvidia_nim/snowflake/arctic", messages)

upstage/solar-10.7b-instruct

completion(model="nvidia_nim/upstage/solar-10.7b-instruct", messages)