feat: Draft ollama test #566
Changes from 44 commits
New file, `test | gemini` workflow (`@@ -0,0 +1,33 @@`):

```yaml
name: test | gemini

on:
  workflow_dispatch:
  pull_request:
    types: [labeled, synchronize]

concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}
  cancel-in-progress: true

jobs:
  run_simple_example_test:
    uses: ./.github/workflows/reusable_python_example.yml
    with:
      example-location: ./examples/python/simple_example.py
    secrets:
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
      GRAPHISTRY_USERNAME: ${{ secrets.GRAPHISTRY_USERNAME }}
      GRAPHISTRY_PASSWORD: ${{ secrets.GRAPHISTRY_PASSWORD }}
      EMBEDDING_PROVIDER: "gemini"
      EMBEDDING_API_KEY: ${{ secrets.GEMINI_API_KEY }}
      EMBEDDING_MODEL: "gemini/text-embedding-004"
      EMBEDDING_ENDPOINT: "https://generativelanguage.googleapis.com/v1beta/models/text-embedding-004"
      EMBEDDING_API_VERSION: "v1beta"
      EMBEDDING_DIMENSIONS: 768
      EMBEDDING_MAX_TOKENS: 8076
      LLM_PROVIDER: "gemini"
      LLM_API_KEY: ${{ secrets.GEMINI_API_KEY }}
      LLM_MODEL: "gemini/gemini-1.5-flash"
      LLM_ENDPOINT: "https://generativelanguage.googleapis.com/"
      LLM_API_VERSION: "v1beta"
```
Comment on lines +18 to +33 (Contributor):

Secrets Mismatch with Reusable Workflow
The job passes several secrets that are not defined in the reusable workflow. Please either update the reusable workflow file to accept these additional secrets (if they are necessary for the workflow's operation) or remove them from here to avoid potential configuration issues.

🧰 Tools / 🪛 actionlint (1.7.4), lines 22-33: the secrets `EMBEDDING_PROVIDER`, `EMBEDDING_API_KEY`, `EMBEDDING_MODEL`, `EMBEDDING_ENDPOINT`, `EMBEDDING_API_VERSION`, `EMBEDDING_DIMENSIONS`, `EMBEDDING_MAX_TOKENS`, `LLM_PROVIDER`, `LLM_MODEL`, `LLM_ENDPOINT`, and `LLM_API_VERSION` are not defined in the `./.github/workflows/reusable_python_example.yml` reusable workflow; the defined secrets are `GRAPHISTRY_PASSWORD`, `GRAPHISTRY_USERNAME`, `LLM_API_KEY`, and `OPENAI_API_KEY` (workflow-call).
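The fix the comment asks for would live in the reusable workflow itself. A minimal sketch, assuming these values should indeed be passed through as secrets; the `required` flags are illustrative, not part of this PR:

```yaml
# Hypothetical addition to ./.github/workflows/reusable_python_example.yml
on:
  workflow_call:
    secrets:
      OPENAI_API_KEY:
        required: true
      LLM_API_KEY:
        required: true
      EMBEDDING_PROVIDER:
        required: false
      EMBEDDING_API_KEY:
        required: false
      # ...declare the remaining EMBEDDING_* / LLM_* entries the caller passes
```

Alternatively, non-sensitive values such as `EMBEDDING_PROVIDER` or `LLM_MODEL` could be passed as `with:` inputs rather than secrets.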
New file, `test | ollama` workflow (`@@ -0,0 +1,115 @@`):

```yaml
name: test | ollama

on:
  workflow_dispatch:
  pull_request:
    types: [ labeled, synchronize ]

jobs:
  run_simple_example_test:
    runs-on: ubuntu-latest
    # services:
    #   ollama:
    #     image: ollama/ollama
    #     ports:
    #       - 11434:11434

    steps:
      - name: Checkout repository
        uses: actions/checkout@v4

      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.12.x'

      - name: Install Poetry
        uses: snok/install-poetry@v1.4.1
        with:
          virtualenvs-create: true
          virtualenvs-in-project: true
          installer-parallel: true

      - name: Install dependencies
        run: |
          poetry install --no-interaction --all-extras
          poetry add torch

      # - name: Install ollama
      #   run: curl -fsSL https://ollama.com/install.sh | sh
      # - name: Run ollama
      #   run: |
      #     ollama serve --openai &
      #     ollama pull llama3.2 &
      #     ollama pull avr/sfr-embedding-mistral:latest

      - name: Start Ollama container
        run: |
          docker run -d --name ollama -p 11434:11434 ollama/ollama
          sleep 5
          docker exec -d ollama bash -c "ollama serve --openai"

      - name: Check Ollama logs
        run: docker logs ollama

      - name: Wait for Ollama to be ready
        run: |
          for i in {1..30}; do
            if curl -s http://localhost:11434/v1/models > /dev/null; then
              echo "Ollama is ready"
              exit 0
            fi
            echo "Waiting for Ollama... attempt $i"
            sleep 2
          done
          echo "Ollama failed to start"
          exit 1

      - name: Pull required Ollama models
        run: |
          curl -X POST http://localhost:11434/api/pull -d '{"name": "llama3.2"}'
          curl -X POST http://localhost:11434/api/pull -d '{"name": "avr/sfr-embedding-mistral:latest"}'

      - name: Call ollama API
        run: |
          curl -X POST http://localhost:11434/v1/chat/completions \
            -H "Content-Type: application/json" \
            -d '{
              "model": "llama3.2",
              "stream": false,
              "messages": [
                { "role": "system", "content": "You are a helpful assistant." },
                { "role": "user", "content": "Whatever I say, answer with Yes." }
              ]
            }'
          curl -X POST http://127.0.0.1:11434/v1/embeddings \
            -H "Content-Type: application/json" \
            -d '{
              "model": "avr/sfr-embedding-mistral:latest",
              "input": "This is a test sentence to generate an embedding."
            }'

      - name: Dump Docker logs
        run: |
          docker ps
          docker logs $(docker ps --filter "ancestor=ollama/ollama" --format "{{.ID}}")

      - name: Run example test
        env:
          OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
          GRAPHISTRY_USERNAME: ${{ secrets.GRAPHISTRY_USERNAME }}
          GRAPHISTRY_PASSWORD: ${{ secrets.GRAPHISTRY_PASSWORD }}
          PYTHONFAULTHANDLER: 1
          LLM_PROVIDER: "ollama"
          LLM_API_KEY: "ollama"
          LLM_ENDPOINT: "http://localhost:11434/v1/"
          LLM_MODEL: "llama3.2"
          EMBEDDING_PROVIDER: "ollama"
          EMBEDDING_MODEL: "avr/sfr-embedding-mistral:latest"
          EMBEDDING_ENDPOINT: "http://localhost:11434/v1/"
          EMBEDDING_DIMENSIONS: "4096"
          HUGGINGFACE_TOKENIZER: "Salesforce/SFR-Embedding-Mistral"
        run: poetry run python ./examples/python/simple_example.py
```
Changes to `cognee/infrastructure/llm/ollama/adapter.py` (`@@ -1,44 +1,109 @@`):

```diff
-from typing import Type
+from typing import Type, Optional
 from pydantic import BaseModel
 import instructor
 from cognee.infrastructure.llm.llm_interface import LLMInterface
 from cognee.infrastructure.llm.config import get_llm_config
-from openai import OpenAI
+from openai import AsyncOpenAI  # Use AsyncOpenAI for async compatibility
+import base64
+import os


 class OllamaAPIAdapter(LLMInterface):
-    """Adapter for a Generic API LLM provider using instructor with an OpenAI backend."""
+    """Adapter for an Ollama API LLM provider using instructor with an OpenAI backend."""

+    MAX_RETRIES = 5
+
     def __init__(self, endpoint: str, api_key: str, model: str, name: str, max_tokens: int):
```

Suggested change:

```python
MAX_RETRIES = 5
transcription = self.aclient.audio.transcriptions.create(
    model="whisper-1",  # Ensure the correct model for transcription
    file=audio_file,
    language="en",
    max_retries=self.MAX_RETRIES,
)
```
💡 Verification agent
🧩 Analysis chain
Fix issues in the audio transcription implementation.
This implementation has multiple critical issues:

- It uses `self.aclient` instead of `self.client`
- Based on previous reviews, Ollama may not support OpenAI's audio transcription API
- There's no error handling for the API call
```diff
 def create_transcript(self, input_file: str) -> str:
     """Generate an audio transcript from a user query."""
     if not os.path.isfile(input_file):
         raise FileNotFoundError(f"The file {input_file} does not exist.")
-    with open(input_file, "rb") as audio_file:
-        transcription = self.aclient.audio.transcriptions.create(
-            model="whisper-1",  # Ensure the correct model for transcription
-            file=audio_file,
-            language="en",
-        )
-
-    # Ensure the response contains a valid transcript
-    if not hasattr(transcription, "text"):
-        raise ValueError("Transcription failed. No text returned.")
-
-    return transcription.text
+    try:
+        with open(input_file, "rb") as audio_file:
+            transcription = self.client.audio.transcriptions.create(
+                model="whisper-1",  # Ensure the correct model for transcription
+                file=audio_file,
+                language="en",
+                max_retries=self.MAX_RETRIES,
+            )
+
+        # Ensure the response contains a valid transcript
+        if not hasattr(transcription, "text"):
+            raise ValueError("Transcription failed. No text returned.")
+
+        return transcription.text
+    except Exception as e:
+        raise Exception(f"Error transcribing audio: {str(e)}")
```

🌐 Web query:
Does Ollama support OpenAI-compatible audio transcription API?
💡 Result:
Ollama does not natively support OpenAI-compatible audio transcription APIs like Whisper. However, developers can combine Ollama with OpenAI's Whisper API or third-party tools to achieve this functionality[1][3][7]. Here's how it works:
- Audio Processing Workflow: typical implementations use OpenAI's Whisper for speech-to-text:

  ```js
  // Transcribe audio using OpenAI's API
  const transcription = await openai.audio.transcriptions.create({
    model: 'whisper-1',
    file: audioFile,
  });
  ```

  Then pass the text to Ollama for LLM processing[1][4].

- Ollama's OpenAI Compatibility: while Ollama supports the OpenAI-style chat completions API for text generation[2][5][8]:

  ```js
  // Using Ollama with OpenAI-compatible chat API
  const response = await generateText({
    model: ollama('llama3.1'),
    prompt: transcribedText,
  });
  ```

  This compatibility doesn't extend to audio endpoints[2][5].

- Alternative Implementations: some projects combine offline tools with Ollama:
  - WhisperLive for real-time transcription[7]
  - Ollama-Voice stack (Whisper + Ollama + pyttsx3)[10]
  - Custom integrations using Nvidia GPUs[3]
For direct audio API support, developers currently need to use OpenAI's services or third-party solutions alongside Ollama's text capabilities[1][3][7]. The native Ollama API focuses on text generation through its OpenAI-compatible chat endpoints[2][5][8].
Citations:
- 1: https://www.thisdot.co/blog/how-to-build-an-ai-assistant-with-openai-vercel-ai-sdk-and-ollama-with-next
- 2: https://ollama.com/blog/openai-compatibility
- 3: https://www.restack.io/p/ollama-whisperx-answer-cat-ai
- 4: https://dev.to/josmel/automating-it-interviews-with-ollama-and-audio-capabilities-in-python-545o
- 5: https://bestofai.com/article/openai-compatibility-ollama-blog
- 6: Realtime API like OpenAI (full fledged voice to voice integrations) ollama/ollama#7514
- 7: https://www.singleapi.net/2024/09/23/offline-whisper-audio-transcription-and-ollama-voice-assistant/
- 8: https://docs.spring.io/spring-ai/reference/api/chat/ollama-chat.html
- 9: https://docs.openwebui.com/features/
- 10: https://github.com/maudoin/ollama-voice
Critical: Audio Transcription Implementation Requires Revision
The recent changes correctly update the client reference (from `self.aclient` to `self.client`) and add error handling with a retry mechanism. However, the core issue remains: Ollama does not natively support OpenAI's audio transcription API (e.g., the Whisper endpoint). To ensure reliable functionality, please consider one of the following improvements:
- Integrate a Supported Transcription Service: If audio transcription is required, use a dedicated service (such as OpenAI’s Whisper API or another third-party solution) rather than relying on Ollama’s endpoints.
- Refactor the Workflow: Separate the transcription step from the LLM workflow. This will help avoid confusion and prevent the use of unsupported API calls in the Ollama adapter.
Affected Code Location: `cognee/infrastructure/llm/ollama/adapter.py` (lines 52-69)
📝 Committable suggestion
‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.
Before:

```python
def create_transcript(self, input_file: str) -> str:
    """Generate an audio transcript from a user query."""
    if not os.path.isfile(input_file):
        raise FileNotFoundError(f"The file {input_file} does not exist.")
    with open(input_file, "rb") as audio_file:
        transcription = self.aclient.audio.transcriptions.create(
            model="whisper-1",  # Ensure the correct model for transcription
            file=audio_file,
            language="en",
        )
    # Ensure the response contains a valid transcript
    if not hasattr(transcription, "text"):
        raise ValueError("Transcription failed. No text returned.")
    return transcription.text
```

After:

```python
def create_transcript(self, input_file: str) -> str:
    """Generate an audio transcript from a user query."""
    if not os.path.isfile(input_file):
        raise FileNotFoundError(f"The file {input_file} does not exist.")
    try:
        with open(input_file, "rb") as audio_file:
            transcription = self.client.audio.transcriptions.create(
                model="whisper-1",  # Ensure the correct model for transcription
                file=audio_file,
                language="en",
                max_retries=self.MAX_RETRIES,
            )
        # Ensure the response contains a valid transcript
        if not hasattr(transcription, "text"):
            raise ValueError("Transcription failed. No text returned.")
        return transcription.text
    except Exception as e:
        raise Exception(f"Error transcribing audio: {str(e)}")
```
Fix client reference and add error handling in transcribe_image.
The `transcribe_image` method uses the base64 encoding correctly, but it should use `self.client` instead of `self.aclient` and include error handling.

```diff
 def transcribe_image(self, input_file: str) -> str:
     """Transcribe content from an image using base64 encoding."""
     if not os.path.isfile(input_file):
         raise FileNotFoundError(f"The file {input_file} does not exist.")
-    with open(input_file, "rb") as image_file:
-        encoded_image = base64.b64encode(image_file.read()).decode("utf-8")
+    try:
+        with open(input_file, "rb") as image_file:
+            encoded_image = base64.b64encode(image_file.read()).decode("utf-8")
```

Committable suggestion skipped: line range outside the PR's diff.
Fix undefined client reference.
The code uses `self.aclient`, but only `self.client` is defined in the constructor. This will cause a runtime error.

```diff
-response = self.aclient.chat.completions.create(
+response = self.client.chat.completions.create(
```
💡 Verification agent
🧩 Analysis chain
Verify Ollama supports multimodal content in this format.
The implementation assumes Ollama supports OpenAI's multimodal message format. Verify that Ollama's API accepts this structure for image analysis.
🌐 Web query:
Does Ollama support OpenAI-compatible image analysis with base64 encoded images?
💡 Result:
Ollama supports image analysis using base64-encoded images through its vision models like LLaVA and Llama 3.2 Vision, though implementation details differ slightly from OpenAI's approach. Here's how it works:
Base64 Image Handling
- Encoding requirement: Images must be converted to base64 strings without the `data:image/...;base64,` prefix[6][8]. For example:

  ```python
  def encode_image_to_base64(image_path):
      with Image.open(image_path) as img:
          buffered = io.BytesIO()
          img.save(buffered, format="PNG")
          return base64.b64encode(buffered.getvalue()).decode('utf-8')
  ```

  This matches OpenAI's requirement for raw base64 data[6][8].

- API integration: Base64 strings are passed via the `images` parameter in chat requests:

  ```python
  response = ollama.chat(
      model="llava:13b",
      messages=[{
          "role": "user",
          "content": "Describe this image:",
          "images": [base64_image_string]
      }]
  )
  ```
This structure mirrors OpenAI's vision API format[7][9].
Key Differences from OpenAI
| Feature | Ollama | OpenAI |
|---|---|---|
| Model options | LLaVA, Llama 3.2 Vision | GPT-4 Vision |
| Local execution | ✅ Runs entirely offline | ❌ Cloud-only |
| Base64 prefix handling | Requires raw string | Requires prefix stripping |
| Model licensing | Apache 2.0/LLaMA license | Proprietary |
Supported Use Cases
- Document analysis: Receipts, charts, and diagrams[3][7]
- Object detection: Local security camera integration[5]
- OCR: Book cover text extraction[2]
- Multimodal RAG systems: Combined text/image retrieval[3]
To implement this with Llama 3.2 Vision:
```shell
ollama run llama3.2-vision
```

Then use either file paths or base64 strings in your API calls[9][10]. The system supports both CLI and programmatic access through Python/JavaScript libraries[7][9].
Citations:
- 1: https://github.com/codearrangertoo/ollama-vision
- 2: https://www.datadrifters.com/blog/llama-32vision-for-high-precision-ocr-with-ollama
- 3: https://ai.plainenglish.io/ollamas-new-vision-model-support-a-comprehensive-guide-ba1da6c4f45b
- 4: https://python.langchain.com/v0.1/docs/integrations/llms/ollama/
- 5: https://github.com/the-smart-home-maker/hass_ollama_image_analysis
- 6: API Llava Image Path ollama/ollama#1547
- 7: https://ollama.com/blog/vision-models
- 8: Ollama / Llava should be able to take in Base64 format w/ prefix when prompting with image ollama/ollama-js#68
- 9: https://www.youtube.com/watch?v=UjiUwNTErRE
- 10: https://ollama.com/blog/llama3.2-vision
Action: Update Image Handling to Meet Ollama API Requirements
We've confirmed that while Ollama does support image analysis with base64-encoded images, it requires some important adjustments compared to OpenAI’s multimodal message format:
- Strip the Prefix: Ollama expects a raw base64 string without the `data:image/jpeg;base64,` prefix.
- Parameter Structure: Instead of using the `image_url` field, the API typically accepts images via an `images` parameter in the chat message.

Please update the code in `cognee/infrastructure/llm/ollama/adapter.py` (lines 82-89) accordingly to comply with these requirements.
💡 Verification agent
🧩 Analysis chain
Update image handling to meet Ollama API requirements.
The current implementation assumes Ollama supports OpenAI's multimodal message format, but according to previous verification, Ollama requires different formatting for image processing.
```diff
-response = self.client.chat.completions.create(
+response = self.client.chat.completions.create(
     model=self.model,
     messages=[
         {
             "role": "user",
-            "content": [
-                {"type": "text", "text": "What's in this image?"},
-                {
-                    "type": "image_url",
-                    "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"},
-                },
-            ],
+            "content": "What's in this image?",
+            "images": [encoded_image],  # Ollama expects raw base64 strings without prefix
         }
     ],
```

🌐 Web query:
Does Ollama API support image analysis with content structure like OpenAI or does it require different format?
💡 Result:
Ollama's API supports image analysis with structured content output capabilities similar to OpenAI, though implementation details differ. Here's a technical breakdown:
Image Analysis Capabilities
Ollama supports vision models like LLaVA (v1.6) that enable:
- Object detection
- Text recognition in images
- Detailed scene description
- Chart/diagram interpretation [9]
The API accepts images through:
- File paths in CLI (`./image.jpg`)
- Base64-encoded data in programmatic calls
- Direct image URLs [9]
```python
# Python example using Ollama's vision API
import ollama

response = ollama.chat(
    model='llava:13b',
    messages=[{
        'role': 'user',
        'content': 'Analyze this security footage:',
        'images': ['/path/to/image.jpg']
    }]
)
print(response['message']['content'])
```

Structured Output Formatting
Ollama introduced JSON schema constraints in December 2024:
```python
# Structured output example with image analysis
response = ollama.generate(
    model='llava:34b',
    prompt="Extract vehicle details from traffic cam image",
    format={
        "type": "object",
        "properties": {
            "make": {"type": "string"},
            "color": {"type": "string"},
            "license_plate": {"type": "string"}
        }
    }
)
```

Key differences from OpenAI:
- Requires explicit JSON schema definition
- Uses the native `format` parameter instead of a separate JSON mode flag
- Supports vision models through multimodal LLMs [3][7]
Implementation Considerations

1. Model Requirements: must use vision-capable models like `llava:7b`, `llava:13b`, `llava:34b`, `bakllava`, `moondream` [9]
2. Resolution Handling:
   - Supports up to 4MP images (4x previous versions)
   - Automatic downsampling for large images [9]
3. API Compatibility:

```python
# OpenAI-style implementation with Ollama
from openai import OpenAI

client = OpenAI(
    base_url='http://localhost:11434/v1',
    api_key='ollama'
)
response = client.chat.completions.create(
    model="llava:13b",
    messages=[{
        "role": "user",
        "content": [
            {"type": "text", "text": "Describe this medical scan"},
            {"type": "image_url", "image_url": {"url": "base64_encoded_image"}}
        ]
    }]
)
```

This compatibility layer allows direct porting of OpenAI-based implementations [2][8].
For production systems, Ollama recommends combining vision models with structured output constraints to ensure reliable parsing of image analysis results [4][7].
Citations:
- 1: https://www.restack.io/p/ollama-answer-image-recognition-cat-ai
- 2: https://ollama.com/blog/openai-compatibility
- 3: https://ollama.com/blog/structured-outputs
- 4: https://python.useinstructor.com/examples/ollama/
- 5: https://github.com/the-smart-home-maker/hass_ollama_image_analysis
- 6: https://community.home-assistant.io/t/llm-vision-let-home-assistant-see/729241
- 7: https://github.com/ollama/ollama/blob/main/docs/api.md?plain=1
- 8: https://www.cohorte.co/blog/a-comprehensive-guide-to-ollama
- 9: https://ollama.com/blog/vision-models
- 10: https://www.restack.io/p/ollama-answer-comparison-cat-ai
Action Required: Update Image Payload Format for Ollama API Compatibility
The current implementation uses OpenAI’s multimodal message format. Based on updated Ollama API guidelines, you should remove the nested content structure and instead provide the query as a plain text string along with an “images” field containing the raw base64-encoded string (without the MIME data prefix). This will ensure proper image processing with Ollama’s vision models.
- In file `cognee/infrastructure/llm/ollama/adapter.py` (lines 64-76), update the message payload as shown below.
- Remove the image encapsulation within the "content" array.
- Supply the encoded image directly in the `images` list without the `"data:image/jpeg;base64,"` prefix.
```diff
-response = self.client.chat.completions.create(
-    model=self.model,
-    messages=[
-        {
-            "role": "user",
-            "content": [
-                {"type": "text", "text": "What's in this image?"},
-                {
-                    "type": "image_url",
-                    "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"},
-                },
-            ],
-        }
-    ],
+response = self.client.chat.completions.create(
+    model=self.model,
+    messages=[
+        {
+            "role": "user",
+            "content": "What's in this image?",
+            "images": [encoded_image],  # Ollama expects raw base64 strings without the MIME prefix
+        }
+    ],
```

Committable suggestion skipped: line range outside the PR's diff.
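To make the payload shape the review describes concrete, here is a minimal sketch of building it, assuming a raw-base64 `images` field as discussed above; the helper name `build_ollama_image_payload` and the default model are illustrative, not part of this PR:

```python
import base64


def build_ollama_image_payload(image_bytes: bytes, prompt: str, model: str = "llava:13b") -> dict:
    """Build a chat payload in the shape Ollama's API expects:
    plain-text content plus an `images` array of raw base64 strings
    (no `data:image/...;base64,` prefix)."""
    encoded_image = base64.b64encode(image_bytes).decode("utf-8")
    return {
        "model": model,
        "messages": [
            {
                "role": "user",
                "content": prompt,          # plain text, not a nested content array
                "images": [encoded_image],  # raw base64 string, no MIME prefix
            }
        ],
    }
```

The resulting dict can then be POSTed to the local endpoint (e.g. `http://localhost:11434/api/chat`) with any HTTP client.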
🛠️ Refactor suggestion
Use instance variable for max_tokens.
Replace the hardcoded `max_tokens` value with the instance variable for consistency.

```diff
-    max_tokens=300,
+    max_tokens=self.max_tokens,
```
💡 Verification agent
🧩 Analysis chain
Fix client reference and update image payload format for Ollama compatibility.
This implementation has several issues:

- It uses `self.aclient` instead of `self.client`
- The format for image processing is incompatible with Ollama's API
- It uses a hardcoded `max_tokens` value instead of the class variable
- There's no error handling for the API call
```diff
-response = self.aclient.chat.completions.create(
-    model=self.model,
-    messages=[
-        {
-            "role": "user",
-            "content": [
-                {"type": "text", "text": "What's in this image?"},
-                {
-                    "type": "image_url",
-                    "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"},
-                },
-            ],
-        }
-    ],
-    max_tokens=300,
-);
+response = self.client.chat.completions.create(
+    model=self.model,
+    messages=[
+        {
+            "role": "user",
+            "content": "What's in this image?",
+            "images": [encoded_image],  # Ollama expects raw base64 strings
+        }
+    ],
+    max_tokens=self.max_tokens,
+    max_retries=self.MAX_RETRIES,
+)
```

🌐 Web query:
What is the correct format for sending base64 encoded images to Ollama API?
💡 Result:
To send base64-encoded images to Ollama API, include them as an array under the images parameter in your request body. Here's how to format it correctly:
Image Formatting Requirements
- Base64 encoding: Images must be converted to base64 strings without additional metadata prefixes (e.g., remove "data:image/png;base64,")
- Array structure: Wrap images in an array even for single-image requests
- Multimodal models: Use supported models like LLaVA or Llama 3.2 Vision
Example Request Structure

```json
{
  "model": "llava:13b",
  "prompt": "Describe this image",
  "stream": false,
  "images": ["iVBORw0KGgoAAAANSUhEUgAAAG0AAABmCAY..."]
}
```

Key parameters:
- `model`: Must support multimodal processing
- `prompt`: Your text query/instruction
- `images`: Array of base64-encoded image strings[1][3][4]

Implementation Examples

Python:

```python
import base64
import ollama

with open("image.jpg", "rb") as f:
    b64_image = base64.b64encode(f.read()).decode("utf-8")

response = ollama.chat(
    model="llava:13b",
    messages=[{
        "role": "user",
        "content": "What's in this image?",
        "images": [b64_image]
    }]
)
```

cURL:

```shell
curl http://localhost:11434/api/generate -d '{
  "model": "llama3.2-vision",
  "prompt": "Explain this diagram",
  "images": ["/9j/4AAQSkZJRgABAQAAAQABAAD/2wBDAAYEBQY..."]
}'
```
| Model | VRAM Requirement | Base64 Handling |
|---|---|---|
| LLaVA 13B | ≥8GB | Direct string array |
| Llama3.2-Vision | 11B:8GB, 90B:64GB | File path conversion required |
For optimal results:
- Use Ollama v0.4+ for vision models[8]
- Remove metadata prefixes from base64 strings[9]
- Combine images with text prompts for contextual analysis[2][6]
This format works across all Ollama endpoints supporting multimodal input, including /api/generate and /api/chat[1][8].
Citations:
- 1: https://hexdocs.pm/ollama/0.3.0/Ollama.API.html
- 2: https://docs.spring.io/spring-ai/reference/api/chat/ollama-chat.html
- 3: https://github.com/ollama/ollama/blob/main/docs/api.md?plain=1
- 4: https://benyoung.blog/blog/your-private-ai-can-have-eyes-ollama-with-the-llava-model/
- 5: https://geshan.com.np/blog/2025/02/ollama-api/
- 6: https://www.runcomfy.com/comfyui-nodes/ComfyUI-OllamaGemini/ollama-api
- 7: https://www.postman.com/postman-student-programs/ollama-api/documentation/suc47x8/ollama-rest-api
- 8: https://ollama.com/blog/llama3.2-vision
- 9: API Llava Image Path ollama/ollama#1547
- 10: https://pipedream.com/apps/hyperise/integrations/ollama/generate-chat-completion-with-ollama-api-on-new-image-impression-from-hyperise-api-int_z3sVGLQG
Action Required: Update Image Handling & Add Error Handling
The updated code correctly fixes the client reference, updates the image payload format (using the images array with a raw base64 string), and replaces the hardcoded max_tokens with the class variable while also adding max_retries. However, the API call still lacks error handling. Please ensure that:
- Encoded Image: The `encoded_image` variable contains a raw base64 string (i.e. any `"data:image/jpeg;base64,"` prefix is removed) as required by Ollama's API.
- Error Handling: Wrap the API call in an error-handling block (e.g., try/except) to manage potential API failures gracefully.
- Consistency: Verify that all usages of the client and token/retry values across the codebase adhere to these updated patterns.
Committable suggestion skipped: line range outside the PR's diff.
🛠️ Refactor suggestion
Add proper error handling for the entire API call.
While you've added validation for the response, you should wrap the entire API call in a try-except block to handle API exceptions properly.
```diff
+    except Exception as e:
+        raise Exception(f"Error transcribing image: {str(e)}")
+
     return response.choices[0].message.content
```

Committable suggestion skipped: line range outside the PR's diff.
Indentation is not consistent.