Spaces:

willwade
/

AACKGDemo

Sleeping

App Files Files Community

willwade committed on May 15

Commit

6d19e58

1 Parent(s): 36fcf07

try and switch to llm library

Browse files

Files changed (5) hide show

.huggingface-space +9 -0
app.py +100 -30
llm_interface.py +1 -1
requirements.txt +4 -0
setup.sh +39 -0

.huggingface-space ADDED Viewed

	@@ -0,0 +1,9 @@

+title: AAC Knowledge Graph Demo
+emoji: 💬
+colorFrom: blue
+colorTo: green
+sdk: gradio
+sdk_version: 4.19.2
+app_file: app.py
+pinned: false
+license: mit

app.py CHANGED Viewed

@@ -2,28 +2,72 @@ import gradio as gr
 import whisper
 import random
 import time
 from utils import SocialGraphManager
 from llm_interface import LLMInterface
-# Define available models
 AVAILABLE_MODELS = {
     # Gemini models (online API)
-    "gemini-1.5-flash-latest": "🌐 Gemini 1.5 Flash (Online API - Fast, Recommended)",
-    "gemini-1.5-pro-latest": "🌐 Gemini 1.5 Pro (Online API - High quality)",
-    # OpenAI models (if API key is set)
-    "gpt-3.5-turbo": "🌐 ChatGPT 3.5 (Online API)",
-    "gpt-4o-mini": "🌐 GPT-4o Mini (Online API - Fast)",
-    # Ollama models (if installed locally)
-    "ollama/gemma:7b": "💻 Gemma 7B (Offline - requires Ollama)",
-    "ollama/llama3:8b": "💻 Llama 3 8B (Offline - requires Ollama)",
 }
 # Initialize the social graph manager
 social_graph = SocialGraphManager("social_graph.json")
-# Initialize the suggestion generator with a fast online model by default
-print("Initializing with Gemini 1.5 Flash (online model)")
-suggestion_generator = LLMInterface("gemini-1.5-flash-latest")
 # Test the model to make sure it's working
 print("Testing model connection...")
@@ -145,7 +189,7 @@ def change_model(model_name, progress=gr.Progress()):
     Returns:
         A status message about the model change
     """
-    global suggestion_generator
     print(f"Changing model to: {model_name}")
@@ -156,24 +200,50 @@ def change_model(model_name, progress=gr.Progress()):
     # Show progress indicator
     progress(0, desc=f"Loading model: {model_name}")
-    # Create a new LLMInterface with the selected model
     try:
         progress(0.3, desc=f"Initializing {model_name}...")
-        new_generator = LLMInterface(model_name)
-        # Test if the model works
-        progress(0.6, desc="Testing model connection...")
-        test_result = new_generator.test_model()
-        print(f"Model test result: {test_result}")
-        if new_generator.model_loaded:
-            # Replace the current generator with the new one
-            suggestion_generator = new_generator
-            progress(1.0, desc=f"Model loaded: {model_name}")
-            return f"Successfully switched to model: {model_name}"
         else:
-            progress(1.0, desc="Model loading failed")
-            return f"Failed to load model: {model_name}. Using previous model instead."
     except Exception as e:
         print(f"Error changing model: {e}")
         progress(1.0, desc="Error loading model")
@@ -576,9 +646,9 @@ with gr.Blocks(title="Will's AAC Communication Aid", css="custom.css") as demo:
             with gr.Row():
                 model_dropdown = gr.Dropdown(
                     choices=list(AVAILABLE_MODELS.keys()),
-                    value="gemini-1.5-flash-latest",
                     label="Language Model",
-                    info="Select which AI model to use (🌐 = online API, 💻 = offline model)",
                 )
                 temperature_slider = gr.Slider(

 import whisper
 import random
 import time
+import os
+import subprocess
+import warnings
+# Set environment variable to avoid tokenizer warnings
+os.environ["TOKENIZERS_PARALLELISM"] = "false"
 from utils import SocialGraphManager
 from llm_interface import LLMInterface
+# Define available models - using only the ones specified by the user
 AVAILABLE_MODELS = {
     # Gemini models (online API)
+    "gemini-1.5-flash-8b-latest": "🌐 Gemini 1.5 Flash 8B (Online API - Fast, Cheapest)",
+    "gemini-2.0-flash": "🌐 Gemini 2.0 Flash (Online API - Better quality)",
+    "gemma-3-27b-it": "🌐 Gemma 3 27B-IT (Online API - High quality)",
 }
 # Initialize the social graph manager
 social_graph = SocialGraphManager("social_graph.json")
+# Check if we're running on Hugging Face Spaces
+is_huggingface_spaces = "SPACE_ID" in os.environ
+# Print environment info for debugging
+print(f"Running on Hugging Face Spaces: {is_huggingface_spaces}")
+print(f"GEMINI_API_KEY set: {'Yes' if os.environ.get('GEMINI_API_KEY') else 'No'}")
+print(f"HF_TOKEN set: {'Yes' if os.environ.get('HF_TOKEN') else 'No'}")
+# Try to run the setup script if we're on Hugging Face Spaces
+if is_huggingface_spaces:
+    try:
+        print("Running setup script...")
+        subprocess.run(["bash", "setup.sh"], check=True)
+        print("Setup script completed successfully")
+    except Exception as e:
+        print(f"Error running setup script: {e}")
+# Check if LLM tool is installed
+llm_installed = False
+try:
+    result = subprocess.run(
+        ["llm", "--version"],
+        capture_output=True,
+        text=True,
+        timeout=5,
+    )
+    if result.returncode == 0:
+        print(f"LLM tool is installed: {result.stdout.strip()}")
+        llm_installed = True
+    else:
+        print("LLM tool returned an error.")
+except Exception as e:
+    print(f"LLM tool not available: {e}")
+# Initialize the suggestion generator
+if llm_installed:
+    print("Initializing with Gemini 1.5 Flash 8B (online model via LLM tool)")
+    suggestion_generator = LLMInterface("gemini-1.5-flash-8b-latest")
+    use_llm_interface = True
+else:
+    print("LLM tool not available, falling back to direct Hugging Face implementation")
+    from utils import SuggestionGenerator
+    suggestion_generator = SuggestionGenerator("google/gemma-3-1b-it")
+    use_llm_interface = False
 # Test the model to make sure it's working
 print("Testing model connection...")
     Returns:
         A status message about the model change
     """
+    global suggestion_generator, use_llm_interface
     print(f"Changing model to: {model_name}")
     # Show progress indicator
     progress(0, desc=f"Loading model: {model_name}")
     try:
         progress(0.3, desc=f"Initializing {model_name}...")
+        # Use the appropriate interface based on what's available
+        if use_llm_interface:
+            # Create a new LLMInterface with the selected model
+            new_generator = LLMInterface(model_name)
+            # Test if the model works
+            progress(0.6, desc="Testing model connection...")
+            test_result = new_generator.test_model()
+            print(f"Model test result: {test_result}")
+            if new_generator.model_loaded:
+                # Replace the current generator with the new one
+                suggestion_generator = new_generator
+                progress(1.0, desc=f"Model loaded: {model_name}")
+                return f"Successfully switched to model: {model_name}"
+            else:
+                progress(1.0, desc="Model loading failed")
+                return (
+                    f"Failed to load model: {model_name}. Using previous model instead."
+                )
         else:
+            # Using direct Hugging Face implementation
+            from utils import SuggestionGenerator
+            # Create a new SuggestionGenerator with the selected model
+            new_generator = SuggestionGenerator(model_name)
+            # Test if the model works
+            progress(0.6, desc="Testing model connection...")
+            success = new_generator.load_model(model_name)
+            if success:
+                # Replace the current generator with the new one
+                suggestion_generator = new_generator
+                progress(1.0, desc=f"Model loaded: {model_name}")
+                return f"Successfully switched to model: {model_name}"
+            else:
+                progress(1.0, desc="Model loading failed")
+                return (
+                    f"Failed to load model: {model_name}. Using previous model instead."
+                )
     except Exception as e:
         print(f"Error changing model: {e}")
         progress(1.0, desc="Error loading model")
             with gr.Row():
                 model_dropdown = gr.Dropdown(
                     choices=list(AVAILABLE_MODELS.keys()),
+                    value="gemini-1.5-flash-8b-latest",
                     label="Language Model",
+                    info="Select which AI model to use (all are online API models)",
                 )
                 temperature_slider = gr.Slider(

llm_interface.py CHANGED Viewed

@@ -225,7 +225,7 @@ My conversation starter to {name}:"""
                 ],
                 capture_output=True,
                 text=True,
-                timeout=15,  # Add timeout to prevent hanging
             )
             if progress_callback:

                 ],
                 capture_output=True,
                 text=True,
+                timeout=30,  # Increase timeout for Gemini API calls
             )
             if progress_callback:

requirements.txt CHANGED Viewed

@@ -7,3 +7,7 @@ openai-whisper>=20231117
 bitsandbytes>=0.41.0
 accelerate>=0.21.0
 google-generativeai>=0.3.0

 bitsandbytes>=0.41.0
 accelerate>=0.21.0
 google-generativeai>=0.3.0
+llm>=0.25.0
+llm-gemini>=0.1.0
+llm-openai>=0.1.0
+llm-ollama>=0.1.0

setup.sh ADDED Viewed

	@@ -0,0 +1,39 @@

+#!/bin/bash
+# Install Simon Willison's LLM library and plugins
+pip install llm
+pip install llm-gemini
+pip install llm-openai
+pip install llm-ollama
+# Set up environment variables
+echo "Setting up environment variables..."
+if [ -n "$GEMINI_API_KEY" ]; then
+    echo "GEMINI_API_KEY is set"
+    # Configure LLM to use Gemini
+    llm keys set gemini "$GEMINI_API_KEY"
+else
+    echo "GEMINI_API_KEY is not set"
+fi
+if [ -n "$OPENAI_API_KEY" ]; then
+    echo "OPENAI_API_KEY is set"
+    # Configure LLM to use OpenAI
+    llm keys set openai "$OPENAI_API_KEY"
+else
+    echo "OPENAI_API_KEY is not set"
+fi
+if [ -n "$HF_TOKEN" ]; then
+    echo "HF_TOKEN is set"
+    # Configure Hugging Face token
+    huggingface-cli login --token "$HF_TOKEN"
+else
+    echo "HF_TOKEN is not set"
+fi
+# List available models
+echo "Available LLM models:"
+llm models
+echo "Setup complete!"