feat: ollama support (#2003)

2024-01-12 12:29:13 +08:00
parent 5e75f7022f
commit cca9edc97a
21 changed files with 1369 additions and 13 deletions
--- a/api/tests/integration_tests/.env.example
+++ b/api/tests/integration_tests/.env.example
@@ -62,5 +62,8 @@ COHERE_API_KEY=
 # Jina Credentials
 JINA_API_KEY=

+# Ollama Credentials
+OLLAMA_BASE_URL=
+
 # Mock Switch
 MOCK_SWITCH=false
--- a/api/tests/integration_tests/model_runtime/ollama/__init__.py
+++ b/api/tests/integration_tests/model_runtime/ollama/__init__.py
--- a/api/tests/integration_tests/model_runtime/ollama/test_llm.py
+++ b/api/tests/integration_tests/model_runtime/ollama/test_llm.py
--- a/api/tests/integration_tests/model_runtime/ollama/test_text_embedding.py
+++ b/api/tests/integration_tests/model_runtime/ollama/test_text_embedding.py
@@ -0,0 +1,71 @@
+import os
+
+import pytest
+
+from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult
+from core.model_runtime.errors.validate import CredentialsValidateFailedError
+from core.model_runtime.model_providers.ollama.text_embedding.text_embedding import OllamaEmbeddingModel
+
+
+def test_validate_credentials():
+    model = OllamaEmbeddingModel()
+
+    with pytest.raises(CredentialsValidateFailedError):
+        model.validate_credentials(
+            model='mistral:text',
+            credentials={
+                'base_url': 'http://localhost:21434',
+                'mode': 'chat',
+                'context_size': 4096,
+            }
+        )
+
+    model.validate_credentials(
+        model='mistral:text',
+        credentials={
+            'base_url': os.environ.get('OLLAMA_BASE_URL'),
+            'mode': 'chat',
+            'context_size': 4096,
+        }
+    )
+
+
+def test_invoke_model():
+    model = OllamaEmbeddingModel()
+
+    result = model.invoke(
+        model='mistral:text',
+        credentials={
+            'base_url': os.environ.get('OLLAMA_BASE_URL'),
+            'mode': 'chat',
+            'context_size': 4096,
+        },
+        texts=[
+            "hello",
+            "world"
+        ],
+        user="abc-123"
+    )
+
+    assert isinstance(result, TextEmbeddingResult)
+    assert len(result.embeddings) == 2
+    assert result.usage.total_tokens == 2
+
+
+def test_get_num_tokens():
+    model = OllamaEmbeddingModel()
+
+    num_tokens = model.get_num_tokens(
+        model='mistral:text',
+        credentials={
+            'base_url': os.environ.get('OLLAMA_BASE_URL'),
+            'mode': 'chat',
+            'context_size': 4096,
+        },
+        texts=[
+            "hello",
+            "world"
+        ]
+    )
+
+    assert num_tokens == 2