From 645bda38e340a17fdc156c43a33a384d905ce603 Mon Sep 17 00:00:00 2001 From: Pavel Zorin Date: Fri, 31 Oct 2025 13:23:49 +0100 Subject: [PATCH 1/3] chore: Fix Ollama test / update Ollama API usage --- .github/workflows/test_ollama.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/test_ollama.yml b/.github/workflows/test_ollama.yml index fbd6873194..61aafb9b78 100644 --- a/.github/workflows/test_ollama.yml +++ b/.github/workflows/test_ollama.yml @@ -48,7 +48,7 @@ jobs: - name: Wait for Ollama to be ready run: | for i in {1..30}; do - if curl -s http://localhost:11434/v1/models > /dev/null; then + if curl -s http://localhost:11434/api/tags > /dev/null; then echo "Ollama is ready" exit 0 fi @@ -75,7 +75,7 @@ jobs: { "role": "user", "content": "Whatever I say, answer with Yes." } ] }' - curl -X POST http://127.0.0.1:11434/v1/embeddings \ + curl -X POST http://127.0.0.1:11434/api/embed \ -H "Content-Type: application/json" \ -d '{ "model": "avr/sfr-embedding-mistral:latest", @@ -98,7 +98,7 @@ jobs: LLM_MODEL: "phi4" EMBEDDING_PROVIDER: "ollama" EMBEDDING_MODEL: "avr/sfr-embedding-mistral:latest" - EMBEDDING_ENDPOINT: "http://localhost:11434/api/embeddings" + EMBEDDING_ENDPOINT: "http://localhost:11434/api/embed" EMBEDDING_DIMENSIONS: "4096" HUGGINGFACE_TOKENIZER: "Salesforce/SFR-Embedding-Mistral" run: uv run python ./examples/python/simple_example.py From 5d2d4e51f110d0832d30e3d72118d7adbcda8376 Mon Sep 17 00:00:00 2001 From: Pavel Zorin Date: Fri, 31 Oct 2025 13:30:26 +0100 Subject: [PATCH 2/3] Ollama: Use OpenAI-compatible embeddings API --- .github/workflows/test_ollama.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/test_ollama.yml b/.github/workflows/test_ollama.yml index 61aafb9b78..edc36e24c7 100644 --- a/.github/workflows/test_ollama.yml +++ b/.github/workflows/test_ollama.yml @@ -48,7 +48,7 @@ jobs: - name: Wait for Ollama to be ready run: | for i in {1..30}; do - if curl
-s http://localhost:11434/api/tags > /dev/null; then + if curl -s http://localhost:11434/v1/models > /dev/null; then echo "Ollama is ready" exit 0 fi @@ -75,7 +75,7 @@ jobs: { "role": "user", "content": "Whatever I say, answer with Yes." } ] }' - curl -X POST http://127.0.0.1:11434/api/embed \ + curl -X POST http://127.0.0.1:11434/v1/embeddings \ -H "Content-Type: application/json" \ -d '{ "model": "avr/sfr-embedding-mistral:latest", @@ -98,7 +98,7 @@ jobs: LLM_MODEL: "phi4" EMBEDDING_PROVIDER: "ollama" EMBEDDING_MODEL: "avr/sfr-embedding-mistral:latest" - EMBEDDING_ENDPOINT: "http://localhost:11434/api/embed" + EMBEDDING_ENDPOINT: "http://localhost:11434/v1/embeddings" EMBEDDING_DIMENSIONS: "4096" HUGGINGFACE_TOKENIZER: "Salesforce/SFR-Embedding-Mistral" run: uv run python ./examples/python/simple_example.py From 737f792ac6fe175930dcea5f5185104f4029c19d Mon Sep 17 00:00:00 2001 From: Pavel Zorin Date: Fri, 31 Oct 2025 13:43:29 +0100 Subject: [PATCH 3/3] use api/embed for ollama api --- .github/workflows/test_ollama.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/test_ollama.yml b/.github/workflows/test_ollama.yml index edc36e24c7..686545c700 100644 --- a/.github/workflows/test_ollama.yml +++ b/.github/workflows/test_ollama.yml @@ -75,7 +75,7 @@ jobs: { "role": "user", "content": "Whatever I say, answer with Yes." } ] }' - curl -X POST http://127.0.0.1:11434/v1/embeddings \ + curl -X POST http://127.0.0.1:11434/api/embed \ -H "Content-Type: application/json" \ -d '{ "model": "avr/sfr-embedding-mistral:latest", @@ -98,7 +98,7 @@ jobs: LLM_MODEL: "phi4" EMBEDDING_PROVIDER: "ollama" EMBEDDING_MODEL: "avr/sfr-embedding-mistral:latest" - EMBEDDING_ENDPOINT: "http://localhost:11434/v1/embeddings" + EMBEDDING_ENDPOINT: "http://localhost:11434/api/embed" EMBEDDING_DIMENSIONS: "4096" HUGGINGFACE_TOKENIZER: "Salesforce/SFR-Embedding-Mistral" run: uv run python ./examples/python/simple_example.py