diff --git a/api/core/model_runtime/model_providers/nvidia/llm/_position.yaml b/api/core/model_runtime/model_providers/nvidia/llm/_position.yaml index 0b622b060..fc6986272 100644 --- a/api/core/model_runtime/model_providers/nvidia/llm/_position.yaml +++ b/api/core/model_runtime/model_providers/nvidia/llm/_position.yaml @@ -1,7 +1,7 @@ - google/gemma-7b - google/codegemma-7b - meta/llama2-70b -- meta/llama3-8b -- meta/llama3-70b +- meta/llama3-8b-instruct +- meta/llama3-70b-instruct - mistralai/mixtral-8x7b-instruct-v0.1 - fuyu-8b diff --git a/api/core/model_runtime/model_providers/nvidia/llm/llama3-70b.yaml b/api/core/model_runtime/model_providers/nvidia/llm/llama3-70b.yaml index 9999ef5a8..4d591d422 100644 --- a/api/core/model_runtime/model_providers/nvidia/llm/llama3-70b.yaml +++ b/api/core/model_runtime/model_providers/nvidia/llm/llama3-70b.yaml @@ -1,7 +1,7 @@ -model: meta/llama3-70b +model: meta/llama3-70b-instruct label: - zh_Hans: meta/llama3-70b - en_US: meta/llama3-70b + zh_Hans: meta/llama3-70b-instruct + en_US: meta/llama3-70b-instruct model_type: llm features: - agent-thought diff --git a/api/core/model_runtime/model_providers/nvidia/llm/llama3-8b.yaml b/api/core/model_runtime/model_providers/nvidia/llm/llama3-8b.yaml index 4dd3215d7..013956667 100644 --- a/api/core/model_runtime/model_providers/nvidia/llm/llama3-8b.yaml +++ b/api/core/model_runtime/model_providers/nvidia/llm/llama3-8b.yaml @@ -1,7 +1,7 @@ -model: meta/llama3-8b +model: meta/llama3-8b-instruct label: - zh_Hans: meta/llama3-8b - en_US: meta/llama3-8b + zh_Hans: meta/llama3-8b-instruct + en_US: meta/llama3-8b-instruct model_type: llm features: - agent-thought diff --git a/api/core/model_runtime/model_providers/nvidia/llm/llm.py b/api/core/model_runtime/model_providers/nvidia/llm/llm.py index 84f5fc5e1..402ffb2cf 100644 --- a/api/core/model_runtime/model_providers/nvidia/llm/llm.py +++ b/api/core/model_runtime/model_providers/nvidia/llm/llm.py @@ -26,8 +26,8 @@ class NVIDIALargeLanguageModel(OAIAPICompatLargeLanguageModel): 'google/gemma-7b': '', 'google/codegemma-7b': '', 'meta/llama2-70b': '', - 'meta/llama3-8b': '', - 'meta/llama3-70b': '' + 'meta/llama3-8b-instruct': '', + 'meta/llama3-70b-instruct': '' }