| 1 | +import os |
| 2 | +import logging |
| 3 | +from ollama import Client |
| 4 | +from typing import Any, Optional |
| 5 | +from litellm import completion, validate_environment, utils as litellm_utils |
| 6 | +from .model import ( |
| 7 | + OutputMethod, |
| 8 | + GenerativeModel, |
| 9 | + GenerativeModelConfig, |
| 10 | + GenerationResponse, |
| 11 | + FinishReason, |
| 12 | + GenerativeModelChatSession, |
| 13 | +) |
| 14 | + |
| 15 | +logger = logging.getLogger(__name__) |
| 16 | +logger.setLevel(logging.INFO) |
| 17 | + |
| 18 | +class LiteModel(GenerativeModel): |
| 19 | + """ |
| 20 | +    A generative model that interfaces with LiteLLM for chat completions. |
| 21 | + """ |
| 22 | + |
| 23 | + def __init__( |
| 24 | + self, |
| 25 | + model_name: str, |
| 26 | + generation_config: Optional[GenerativeModelConfig] = None, |
| 27 | + system_instruction: Optional[str] = None, |
| 28 | + ): |
| 29 | + """ |
| 30 | + Initialize the LiteModel with the required parameters. |
| 31 | + |
| 32 | + LiteLLM model_name format: <provider>/<model_name> |
| 33 | + Examples: |
| 34 | + - openai/gpt-4o |
| 35 | + - azure/gpt-4o |
| 36 | + - gemini/gemini-1.5-pro |
| 37 | + - ollama/llama3:8b |
| 38 | + |
| 39 | + Args: |
| 40 | +            model_name (str): The provider-prefixed model name for the LiteLLM client. |
| 41 | + generation_config (Optional[GenerativeModelConfig]): Configuration settings for generation. |
| 42 | + system_instruction (Optional[str]): Instruction to guide the model. |
| 43 | + """ |
| 44 | + |
| 45 | + |
| 46 | + env_val = validate_environment(model_name) |
| 47 | + if not env_val['keys_in_environment']: |
| 48 | + raise ValueError(f"Missing {env_val['missing_keys']} in the environment.") |
| 49 | + self.model_name, provider, _, _ = litellm_utils.get_llm_provider(model_name) |
| 50 | + self.model = model_name |
| 51 | + |
| 52 | + if provider == "ollama": |
| 53 | + self.ollama_client = Client() |
| 54 | + self.check_and_pull_model() |
| 55 | + if not self.check_valid_key(model_name): |
| 56 | + raise ValueError(f"Invalid keys for model {model_name}.") |
| 57 | + |
| 58 | + |
| 59 | + self.generation_config = generation_config or GenerativeModelConfig() |
| 60 | + self.system_instruction = system_instruction |
| 61 | + |
| 62 | +    def check_valid_key(self, model: str) -> bool: |
| 63 | + """ |
| 64 | +        Checks if the key configured in the environment is valid for the given model by making a litellm.completion call with max_tokens=10. |
| 65 | + |
| 66 | + Args: |
| 67 | + model (str): The name of the model to check the key against. |
| 68 | + |
| 69 | + Returns: |
| 70 | + bool: True if the key is valid for the model, False otherwise. |
| 71 | + """ |
| 72 | + messages = [{"role": "user", "content": "Hey, how's it going?"}] |
| 73 | + try: |
| 74 | + completion( |
| 75 | + model=model, messages=messages, max_tokens=10 |
| 76 | + ) |
| 77 | + return True |
| 78 | +        except Exception: |
| 79 | + return False |
| 80 | + |
| 81 | + def check_and_pull_model(self) -> None: |
| 82 | + """ |
| 83 | + Checks if the specified model is available locally, and pulls it if not. |
| 84 | + |
| 85 | + Logs: |
| 86 | + - Info: If the model is already available or after successfully pulling the model. |
| 87 | + - Error: If there is a failure in pulling the model. |
| 88 | + |
| 89 | + Raises: |
| 90 | +            ValueError: If there is an error during the model pull process. |
| 91 | + """ |
| 92 | + # Get the list of available models |
| 93 | + response = self.ollama_client.list() # This returns a dictionary |
| 94 | + available_models = [model['name'] for model in response['models']] # Extract model names |
| 95 | + |
| 96 | + # Check if the model is already pulled |
| 97 | + if self.model_name in available_models: |
| 98 | + logger.info(f"The model '{self.model_name}' is already available.") |
| 99 | + else: |
| 100 | + logger.info(f"Pulling the model '{self.model_name}'...") |
| 101 | + try: |
| 102 | + self.ollama_client.pull(self.model_name) # Pull the model |
| 103 | + logger.info(f"Model '{self.model_name}' pulled successfully.") |
| 104 | + except Exception as e: |
| 105 | + logger.error(f"Failed to pull the model '{self.model_name}': {e}") |
| 106 | + raise ValueError(f"Failed to pull the model '{self.model_name}': {e}") |
| 107 | + |
| 108 | + def with_system_instruction(self, system_instruction: str) -> "GenerativeModel": |
| 109 | + """ |
| 110 | +        Set or update the system instruction on this model instance. |
| 111 | + |
| 112 | + Args: |
| 113 | + system_instruction (str): Instruction for guiding the model's behavior. |
| 114 | + |
| 115 | + Returns: |
| 116 | + GenerativeModel: The updated model instance. |
| 117 | + """ |
| 118 | + self.system_instruction = system_instruction |
| 119 | + return self |
| 120 | + |
| 121 | + def start_chat(self, args: Optional[dict] = None) -> GenerativeModelChatSession: |
| 122 | + """ |
| 123 | + Start a new chat session. |
| 124 | + |
| 125 | + Args: |
| 126 | + args (Optional[dict]): Additional arguments for the chat session. |
| 127 | + |
| 128 | + Returns: |
| 129 | + GenerativeModelChatSession: A new instance of the chat session. |
| 130 | + """ |
| 131 | + return LiteModelChatSession(self, args) |
| 132 | + |
| 133 | +    def parse_generate_content_response(self, response: Any) -> GenerationResponse: |
| 134 | + """ |
| 135 | + Parse the model's response and extract content for the user. |
| 136 | + |
| 137 | + Args: |
| 138 | + response (any): The raw response from the model. |
| 139 | + |
| 140 | + Returns: |
| 141 | + GenerationResponse: Parsed response containing the generated text. |
| 142 | + """ |
| 143 | + return GenerationResponse( |
| 144 | + text=response.choices[0].message.content, |
| 145 | + finish_reason=( |
| 146 | + FinishReason.STOP |
| 147 | + if response.choices[0].finish_reason == "stop" |
| 148 | + else ( |
| 149 | + FinishReason.MAX_TOKENS |
| 150 | + if response.choices[0].finish_reason == "length" |
| 151 | + else FinishReason.OTHER |
| 152 | + ) |
| 153 | + ), |
| 154 | + ) |
| 155 | + |
| 156 | + def to_json(self) -> dict: |
| 157 | + """ |
| 158 | + Serialize the model's configuration and state to JSON format. |
| 159 | + |
| 160 | + Returns: |
| 161 | + dict: The serialized JSON data. |
| 162 | + """ |
| 163 | + return { |
| 164 | + "model_name": self.model_name, |
| 165 | + "generation_config": self.generation_config.to_json(), |
| 166 | + "system_instruction": self.system_instruction, |
| 167 | + } |
| 168 | + |
| 169 | + @staticmethod |
| 170 | + def from_json(json: dict) -> "GenerativeModel": |
| 171 | + """ |
| 172 | +        Deserialize a JSON object to create an instance of LiteModel. |
| 173 | + |
| 174 | + Args: |
| 175 | + json (dict): The serialized JSON data. |
| 176 | + |
| 177 | + Returns: |
| 178 | + GenerativeModel: A new instance of the model. |
| 179 | + """ |
| 180 | + return LiteModel( |
| 181 | + json["model_name"], |
| 182 | + generation_config=GenerativeModelConfig.from_json( |
| 183 | + json["generation_config"] |
| 184 | + ), |
| 185 | + system_instruction=json["system_instruction"], |
| 186 | + ) |
| 187 | + |
| 188 | + |
| 189 | +class LiteModelChatSession(GenerativeModelChatSession): |
| 190 | + """ |
| 191 | + A chat session for interacting with the LiteLLM model, maintaining conversation history. |
| 192 | + """ |
| 193 | + |
| 194 | + def __init__(self, model: LiteModel, args: Optional[dict] = None): |
| 195 | + """ |
| 196 | + Initialize the chat session and set up the conversation history. |
| 197 | + |
| 198 | + Args: |
| 199 | +            model (LiteModel): The model instance for the session. |
| 200 | + args (Optional[dict]): Additional arguments for customization. |
| 201 | + """ |
| 202 | + self._model = model |
| 203 | + self._args = args |
| 204 | + self._chat_history = ( |
| 205 | + [{"role": "system", "content": self._model.system_instruction}] |
| 206 | + if self._model.system_instruction is not None |
| 207 | + else [] |
| 208 | + ) |
| 209 | + |
| 210 | + def get_chat_history(self) -> list[dict]: |
| 211 | + """ |
| 212 | + Retrieve the conversation history for the current chat session. |
| 213 | + |
| 214 | + Returns: |
| 215 | + list[dict]: The chat session's conversation history. |
| 216 | + """ |
| 217 | + return self._chat_history.copy() |
| 218 | + |
| 219 | + def send_message(self, message: str, output_method: OutputMethod = OutputMethod.DEFAULT) -> GenerationResponse: |
| 220 | + """ |
| 221 | + Send a message in the chat session and receive the model's response. |
| 222 | + |
| 223 | + Args: |
| 224 | + message (str): The message to send. |
| 225 | + output_method (OutputMethod): Format for the model's output. |
| 226 | + |
| 227 | + Returns: |
| 228 | + GenerationResponse: The generated response. |
| 229 | + """ |
| 230 | + generation_config = self._adjust_generation_config(output_method) |
| 231 | + self._chat_history.append({"role": "user", "content": message}) |
| 232 | + try: |
| 233 | + response = completion( |
| 234 | + model=self._model.model, |
| 235 | + messages=self._chat_history, |
| 236 | + **generation_config |
| 237 | + ) |
| 238 | + except Exception as e: |
| 239 | +            raise ValueError(f"Error during completion request; please check the credentials: {e}") from e |
| 240 | + content = self._model.parse_generate_content_response(response) |
| 241 | + self._chat_history.append({"role": "assistant", "content": content.text}) |
| 242 | + return content |
| 243 | + |
| 244 | +    def _adjust_generation_config(self, output_method: OutputMethod) -> dict: |
| 245 | + """ |
| 246 | + Adjust the generation configuration based on the specified output method. |
| 247 | + |
| 248 | + Args: |
| 249 | + output_method (OutputMethod): The desired output method (e.g., default or JSON). |
| 250 | + |
| 251 | + Returns: |
| 252 | + dict: The adjusted configuration settings for generation. |
| 253 | + """ |
| 254 | + config = self._model.generation_config.to_json() |
| 255 | + if output_method == OutputMethod.JSON: |
| 256 | + config['temperature'] = 0 |
| 257 | + config['response_format'] = { "type": "json_object" } |
| 258 | + |
| 259 | + return config |
| 260 | + |
| 261 | + def delete_last_message(self): |
| 262 | + """ |
| 263 | + Deletes the last message exchange (user message and assistant response) from the chat history. |
| 264 | + Preserves the system message if present. |
| 265 | + |
| 266 | + Example: |
| 267 | + Before: |
| 268 | + [ |
| 269 | + {"role": "system", "content": "System message"}, |
| 270 | + {"role": "user", "content": "User message"}, |
| 271 | + {"role": "assistant", "content": "Assistant response"}, |
| 272 | + ] |
| 273 | + After: |
| 274 | + [ |
| 275 | + {"role": "system", "content": "System message"}, |
| 276 | + ] |
| 277 | + |
| 278 | + Note: Does nothing if the chat history is empty or contains only a system message. |
| 279 | + """ |
| 280 | + # Keep at least the system message if present |
| 281 | + min_length = 1 if self._model.system_instruction else 0 |
| 282 | + if len(self._chat_history) - 2 >= min_length: |
| 283 | + self._chat_history.pop() |
| 284 | + self._chat_history.pop() |
| 285 | + else: |
| 286 | + # Reset to initial state with just system message if present |
| 287 | + self._chat_history = ( |
| 288 | + [{"role": "system", "content": self._model.system_instruction}] |
| 289 | + if self._model.system_instruction is not None |
| 290 | + else [] |
| 291 | + ) |
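For context, here is a minimal usage sketch of the class this diff adds. The import path is not visible in the diff, so the classes are assumed to be importable from this package; the model name and the `OPENAI_API_KEY` requirement are likewise illustrative, not something the diff pins down.

```python
# Hypothetical usage sketch, assuming LiteModel, GenerativeModelConfig and
# OutputMethod are importable from this package and that OPENAI_API_KEY is
# set in the environment for the openai/ provider used here.

model = LiteModel(
    model_name="openai/gpt-4o",                        # <provider>/<model_name>
    generation_config=GenerativeModelConfig(),         # default generation settings
    system_instruction="Answer in a single sentence.",
)

chat = model.start_chat()
response = chat.send_message("What is a knowledge graph?")
print(response.text)                                   # GenerationResponse.text

# JSON output: _adjust_generation_config sets temperature=0 and
# response_format={"type": "json_object"} for OutputMethod.JSON.
json_response = chat.send_message(
    'Reply as JSON with a single "answer" key.',
    output_method=OutputMethod.JSON,
)
print(json_response.text)
```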