tomhartke
diff --git a/.env.example
Lines changed: 8 additions & 0 deletions b/.env.example
Lines changed: 8 additions & 0 deletions
diff --git a/.github/workflows/ci.yml
Lines changed: 60 additions & 0 deletions b/.github/workflows/ci.yml
Lines changed: 60 additions & 0 deletions
diff --git a/.gitignore
Lines changed: 70 additions & 3 deletions b/.gitignore
Lines changed: 70 additions & 3 deletions
diff --git a/README.md
Lines changed: 83 additions & 1 deletion b/README.md
Lines changed: 83 additions & 1 deletion
diff --git a/basic_user_interface.py
Lines changed: 47 additions & 9 deletions b/basic_user_interface.py
Lines changed: 47 additions & 9 deletions
@@ -0,0 +1,8 @@
+# OpenAI Configuration
+OPENAI_API_KEY=your-api-key-here
+OPENAI_MODEL=gpt-3.5-turbo
+OPENAI_MAX_TOKENS=1000
+OPENAI_TEMPERATURE=0.0
+
+# Copy this file to .env and fill in your actual API key
+# Never commit .env to version control!
@@ -0,0 +1,60 @@
+name: CI
+
+on:
+  push:
+    branches: [ main, master, claude/* ]
+  pull_request:
+    branches: [ main, master ]
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ["3.9", "3.10", "3.11"]
+
+    steps:
+    - uses: actions/checkout@v3
+
+    - name: Set up Python ${{ matrix.python-version }}
+      uses: actions/setup-python@v4
+      with:
+        python-version: ${{ matrix.python-version }}
+
+    - name: Cache pip packages
+      uses: actions/cache@v3
+      with:
+        path: ~/.cache/pip
+        key: ${{ runner.os }}-pip-${{ hashFiles('**/requirements*.txt') }}
+        restore-keys: |
+          ${{ runner.os }}-pip-
+
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install -r requirements.txt
+        pip install -r requirements-dev.txt
+
+    - name: Lint with ruff
+      run: |
+        ruff check . --exit-zero
+
+    - name: Check formatting with black
+      run: |
+        black --check . --diff || true
+
+    - name: Type check with mypy
+      run: |
+        mypy . --ignore-missing-imports --check-untyped-defs || true
+
+    - name: Run tests with pytest
+      env:
+        OPENAI_API_KEY: test-key-for-ci
+      run: |
+        pytest tests/ -v --cov=. --cov-report=xml --cov-report=term
+
+    - name: Upload coverage to Codecov
+      uses: codecov/codecov-action@v3
+      with:
+        file: ./coverage.xml
+        fail_ci_if_error: false
@@ -1,4 +1,71 @@
-KnowledgeGraphFigures.key
-__pycache__/*
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+pip-wheel-metadata/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# Virtual environments
+venv/
+ENV/
+env/
+.venv
+
+# IDEs
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
 .DS_Store
-.ipynb_checkpoints/*
+
+# Environment variables
+.env
+.env.local
+.env.*.local
+
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+coverage.xml
+*.cover
+.hypothesis/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+*.ipynb_checkpoints/
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Ruff
+.ruff_cache/
+
+# Data files (uncomment if you don't want to track data)
+# *.csv
+# *.json
+
+# Model outputs
+outputs/
+logs/
@@ -1,5 +1,87 @@
 # A knowledge graph from GPT
- 
+
+[![Python 3.9+](https://img.shields.io/badge/python-3.9+-blue.svg)](https://www.python.org/downloads/)
+[![License](https://img.shields.io/badge/license-MIT-green.svg)](LICENSE)
+
+## Quick Start
+
+### Installation
+
+1. **Clone the repository**
+```bash
+git clone https://github.com/tomhartke/knowledge-graph-from-GPT.git
+cd knowledge-graph-from-GPT
+```
+
+2. **Create a virtual environment**
+```bash
+python -m venv venv
+source venv/bin/activate  # On Windows: venv\Scripts\activate
+```
+
+3. **Install dependencies**
+```bash
+pip install -r requirements.txt
+```
+
+4. **Set up your OpenAI API key**
+```bash
+# Option 1: Export as environment variable
+export OPENAI_API_KEY='your-api-key-here'
+
+# Option 2: Create a .env file
+cp .env.example .env
+# Then edit .env and add your API key
+```
+
+### Basic Usage
+
+```python
+from knowledge_graph import KnowledgeGraph, Card
+from initial_card_processing import get_cards_df_abstraction_groups_from_front_and_back_csv
+from knowledge_graph_querying import query_knowledge_graph
+
+# Load flashcards from CSV
+cards_df = get_cards_df_abstraction_groups_from_front_and_back_csv('my_flash_cards_general')
+
+# Build knowledge graph
+kg = KnowledgeGraph()
+kg.add_card_deck(cards_df)
+kg.update_all_embeddings()
+
+# Query the graph
+answer = query_knowledge_graph(
+    question="What is a PixelVAE?",
+    knowledge_graph=kg,
+    top_k=5
+)
+print(answer)
+```
+
+### Running Tests
+
+```bash
+# Install development dependencies
+pip install -r requirements-dev.txt
+
+# Run tests
+pytest tests/ -v
+
+# Run with coverage
+pytest tests/ --cov=. --cov-report=html
+```
+
+## Recent Updates
+
+- **Fixed critical bugs**: Corrected exception handling and variable assignments
+- **Modernized OpenAI API usage**: Migrated from the deprecated `text-davinci-003` completion model to the `gpt-3.5-turbo` ChatCompletion API
+- **Centralized configuration**: New `config.py` module for managing all settings
+- **Improved error handling**: Replaced bare `except` clauses with specific exception types
+- **Added type hints**: Comprehensive type annotations for better IDE support and code clarity
+- **Dependency management**: Added `requirements.txt`, `pyproject.toml`, and `.env` support
+- **Test suite**: Initial test coverage for configuration and utilities
+- **Continuous integration**: GitHub Actions workflow that runs linting, type checks, and the test suite on pushes and pull requests
+
 ## High-level description
 This program is meant to create an external memory module for a language model, and ultimately provide 
 agent-like capabilities to a language model (long-term goal).
 
@@ -18,15 +18,36 @@
 from knowledge_graph_querying import *
 from initial_card_processing import *
 
-# Load your API key from an environment variable or secret management service
-openai.api_key = os.getenv("OPENAI_API_KEY")
+try:
+    from config import config
+except ImportError:
+    config = None
 
-model_chat_engine = "gpt-3.5-turbo" 
+# Load the API key and model name from config.py when it is importable; otherwise fall back to environment variables
+if config:
+    openai.api_key = config.openai.api_key
+    model_chat_engine = config.openai.model
+else:
+    openai.api_key = os.getenv("OPENAI_API_KEY")
+    if not openai.api_key:
+        raise ValueError(
+            "OPENAI_API_KEY environment variable is not set.\n"
+            "Please set it: export OPENAI_API_KEY='your-key-here'"
+        )
+    model_chat_engine = os.getenv("OPENAI_MODEL", "gpt-3.5-turbo") 
 
 SYSTEM_MESSAGE = ("You are a helpful professor and polymath scientist. You want to help a fellow researcher learn more about the world. "
                   + "You are clear, concise, and precise in your answers, and you follow instructions carefully.")
 
-def _gen_chat_response(prompt='hi'):
+def _gen_chat_response(prompt: str = 'hi') -> str:
+    """Generate chat response using OpenAI API.
+
+    Args:
+        prompt: The user's prompt
+
+    Returns:
+        The assistant's response text
+    """
     response = openai.ChatCompletion.create(
         model=model_chat_engine,
         messages=[
@@ -37,17 +58,34 @@ def _gen_chat_response(prompt='hi'):
 
     return message['content']
 
-def gen_chat_response(prompt='hi'):
+def gen_chat_response(prompt: str = 'hi', max_retries: int = 10) -> str:
+    """Generate chat response with retry logic.
+
+    Args:
+        prompt: The user's prompt
+        max_retries: Maximum number of retry attempts
+
+    Returns:
+        The assistant's response text
+
+    Raises:
+        Exception: If all retries fail
+    """
     prompt_succeeded = False
     wait_time = 0.1
-    while not prompt_succeeded:
+    retry_count = 0
+
+    while not prompt_succeeded and retry_count < max_retries:
         try:
             response = _gen_chat_response(prompt)
             prompt_succeeded = True
-        except:
-            print('  LM response failed. Server probably overloaded. Retrying after ', wait_time, ' seconds...')
+        except (openai.error.APIError, openai.error.RateLimitError, openai.error.Timeout, openai.error.ServiceUnavailableError) as e:
+            retry_count += 1
+            print(f'  LM response failed: {e}. Retry {retry_count}/{max_retries}. Retrying after {wait_time} seconds...')
+            if retry_count >= max_retries:
+                raise Exception(f"Failed after {max_retries} retries: {e}")
             time.sleep(wait_time)
-            wait_time += wait_time*2  # exponential backoff 
+            wait_time += wait_time * 2  # exponential backoff
     return response
 
 def convert_abstraction_group_to_concept_list(abs_grp):