Tutorial-Codebase-Knowledge/utils/call_llm.py at main · itzlambda/Tutorial-Codebase-Knowledge

History

87 lines (72 loc) · 2.49 KB

Raw

import litellm

import os

import logging

import json

from datetime import datetime

import dotenv

# Load variables from a .env file into the environment before the
# os.getenv() lookups below.
dotenv.load_dotenv()

# Configure logging: log files live under LOG_DIR (default "logs"), and the
# file name carries the date on which this module was imported.
log_directory = os.getenv("LOG_DIR", "logs")
os.makedirs(log_directory, exist_ok=True)
log_file = os.path.join(log_directory, f"llm_calls_{datetime.now().strftime('%Y%m%d')}.log")

# Set up a dedicated logger for LLM traffic.
logger = logging.getLogger("llm_logger")
logger.setLevel(logging.INFO)
# Do not forward records to ancestor loggers; they go to the file handler only.
logger.propagate = False

# Prompts and responses are arbitrary text, so write the log as UTF-8 rather
# than relying on the platform's default encoding.
file_handler = logging.FileHandler(log_file, encoding="utf-8")
file_handler.setFormatter(logging.Formatter('%(asctime)s - %(levelname)s - %(message)s'))
logger.addHandler(file_handler)

# Simple cache configuration: path of the JSON file mapping prompt -> response.
cache_file = "llm_cache.json"

# By default, we use Google Gemini 2.5 Pro, as it shows great performance for code understanding

def _load_cache() -> dict:
    """Return the prompt cache stored in ``cache_file``, or ``{}`` if unusable.

    A missing file is the normal first-run case and yields an empty cache
    silently. An unreadable file, invalid JSON, or JSON whose top level is
    not an object is logged as a warning and also yields an empty cache.
    """
    try:
        with open(cache_file, "r", encoding="utf-8") as f:
            cache = json.load(f)
    except FileNotFoundError:
        return {}
    except (OSError, ValueError):
        # ValueError covers json.JSONDecodeError and UnicodeDecodeError.
        cache = None

    if not isinstance(cache, dict):
        logger.warning("Failed to load cache, starting with empty cache")
        return {}
    return cache


def call_llm(prompt: str, use_cache: bool = True) -> str:
    """Send ``prompt`` to the configured model and return the reply text.

    The model name and API key are read from the ``AI_MODEL`` and
    ``AI_API_KEY`` environment variables on every call. Prompt and response
    are written to the module logger.

    Args:
        prompt: Text sent as a single user message.
        use_cache: When true, return a previously stored response for an
            identical prompt if one exists in ``cache_file``, and store the
            new response there after a successful call.

    Returns:
        The content of the first choice's message (or the cached value).

    Raises:
        Exception: Any error raised by the LiteLLM call (or while reading
            its response) is logged and re-raised unchanged.
    """
    # Log the prompt
    logger.info(f"PROMPT: {prompt}")

    # Serve from the on-disk cache when possible
    if use_cache:
        cache = _load_cache()
        if prompt in cache:
            logger.info(f"RESPONSE: {cache[prompt]}")
            return cache[prompt]

    model = os.getenv("AI_MODEL")
    api_key = os.getenv("AI_API_KEY")

    try:
        response = litellm.completion(
            api_key=api_key,
            model=model,
            messages=[{"role": "user", "content": prompt}],
        )
        response_text = response.choices[0].message.content
    except Exception as e:
        logger.error(f"LiteLLM call failed: {e}")
        # Bare raise re-raises the active exception unchanged.
        raise

    logger.info(f"RESPONSE: {response_text}")

    if use_cache:
        # Re-read the file rather than reusing the earlier snapshot so that
        # entries written to it while the request was in flight are kept.
        cache = _load_cache()
        cache[prompt] = response_text
        try:
            with open(cache_file, "w", encoding="utf-8") as f:
                json.dump(cache, f)
        except Exception as e:
            # Caching is best-effort: a failed save must not lose the response.
            logger.error(f"Failed to save cache: {e}")

    return response_text

if __name__ == "__main__":
    # Manual smoke test: the cache is bypassed, so this call goes to the API.
    greeting = "Hello, how are you?"
    print("Making call...")
    reply = call_llm(greeting, use_cache=False)
    print(f"Response: {reply}")

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

call_llm.py

Latest commit

History

call_llm.py

File metadata and controls