willwade committed on
Commit c8d94c7 · 1 Parent(s): d8b372b

adding better style changes and tone

Files changed (3):
  1. app.py +82 -31
  2. custom.css +137 -0
  3. utils.py +23 -0
app.py CHANGED
@@ -6,21 +6,23 @@ from utils import SocialGraphManager, SuggestionGenerator
 
 # Define available models
 AVAILABLE_MODELS = {
-    "distilgpt2": "DistilGPT2 (Fast, smaller model)",
-    "gpt2": "GPT-2 (Medium size, better quality)",
     "google/gemma-3-1b-it": "Gemma 3 1B-IT (Small, instruction-tuned)",
+    "google/gemma-3-2b-it": "Gemma 3 2B-IT (Default, instruction-tuned)",
+    "google/gemma-3-4b-it": "Gemma 3 4B-IT (Better quality, instruction-tuned)",
     "Qwen/Qwen1.5-0.5B": "Qwen 1.5 0.5B (Very small, efficient)",
     "Qwen/Qwen1.5-1.8B": "Qwen 1.5 1.8B (Small, good quality)",
     "TinyLlama/TinyLlama-1.1B-Chat-v1.0": "TinyLlama 1.1B (Small, chat-tuned)",
     "microsoft/phi-3-mini-4k-instruct": "Phi-3 Mini (Small, instruction-tuned)",
     "microsoft/phi-2": "Phi-2 (Small, high quality for size)",
+    "distilgpt2": "DistilGPT2 (Fast, smaller model)",
+    "gpt2": "GPT-2 (Medium size, better quality)",
 }
 
 # Initialize the social graph manager
 social_graph = SocialGraphManager("social_graph.json")
 
-# Initialize the suggestion generator with Gemma 3B (default)
-suggestion_generator = SuggestionGenerator("google/gemma-3-1b-it")
+# Initialize the suggestion generator with Gemma 3 2B (default)
+suggestion_generator = SuggestionGenerator("google/gemma-3-2b-it")
 
 # Test the model to make sure it's working
 test_result = suggestion_generator.test_model()
@@ -67,9 +69,19 @@ def get_topics_for_person(person_id):
 
 
 def get_suggestion_categories():
-    """Get suggestion categories from the social graph."""
+    """Get suggestion categories from the social graph with emoji prefixes."""
     if "common_utterances" in social_graph.graph:
-        return list(social_graph.graph["common_utterances"].keys())
+        categories = list(social_graph.graph["common_utterances"].keys())
+        emoji_map = {
+            "greetings": "👋 greetings",
+            "needs": "🆘 needs",
+            "emotions": "😊 emotions",
+            "questions": "❓ questions",
+            "tech_talk": "💻 tech_talk",
+            "reminiscing": "🔙 reminiscing",
+            "organization": "📅 organization",
+        }
+        return [emoji_map.get(cat, cat) for cat in categories]
     return []
 
 
@@ -140,15 +152,16 @@ def generate_suggestions(
     user_input,
     suggestion_type,
    selected_topic=None,
-    model_name="google/gemma-3-1b-it",
+    model_name="google/gemma-3-2b-it",
    temperature=0.7,
+    mood=3,
    progress=gr.Progress(),
 ):
     """Generate suggestions based on the selected person and user input."""
     print(
         f"Generating suggestions with: person_id={person_id}, user_input={user_input}, "
         f"suggestion_type={suggestion_type}, selected_topic={selected_topic}, "
-        f"model={model_name}, temperature={temperature}"
+        f"model={model_name}, temperature={temperature}, mood={mood}"
     )
 
     # Initialize progress
@@ -166,9 +179,16 @@ def generate_suggestions(
     person_context = social_graph.get_person_context(person_id)
     print(f"Person context: {person_context}")
 
+    # Remove emoji prefix from suggestion_type if present
+    clean_suggestion_type = suggestion_type
+    if suggestion_type.startswith(
+        ("🤖", "🔍", "💬", "👋", "🆘", "😊", "❓", "💻", "🔙", "📅")
+    ):
+        clean_suggestion_type = suggestion_type[2:].strip()  # Remove emoji and space
+
     # Try to infer conversation type if user input is provided
     inferred_category = None
-    if user_input and suggestion_type == "auto_detect":
+    if user_input and clean_suggestion_type == "auto_detect":
         # Simple keyword matching for now - could be enhanced with ML
         user_input_lower = user_input.lower()
         if any(
@@ -215,7 +235,7 @@
     result = ""
 
     # If suggestion type is "model", use the language model for multiple suggestions
-    if suggestion_type == "model":
+    if clean_suggestion_type == "model":
         print("Using model for suggestions")
         progress(0.2, desc="Preparing to generate suggestions...")
 
@@ -226,6 +246,8 @@
             progress(progress_value, desc=f"Generating suggestion {i+1}/3")
             print(f"Generating suggestion {i+1}/3")
             try:
+                # Add mood to person context
+                person_context["mood"] = mood
                 suggestion = suggestion_generator.generate_suggestion(
                     person_context, user_input, temperature=temperature
                 )
@@ -244,14 +266,14 @@
     print(f"Final result: {result[:100]}...")
 
     # If suggestion type is "common_phrases", use the person's common phrases
-    elif suggestion_type == "common_phrases":
+    elif clean_suggestion_type == "common_phrases":
         phrases = social_graph.get_relevant_phrases(person_id, user_input)
         result = "### My Common Phrases with this Person:\n\n"
         for i, phrase in enumerate(phrases, 1):
             result += f"{i}. {phrase}\n\n"
 
     # If suggestion type is "auto_detect", use the inferred category or default to model
-    elif suggestion_type == "auto_detect":
+    elif clean_suggestion_type == "auto_detect":
         print(f"Auto-detect mode, inferred category: {inferred_category}")
         if inferred_category:
             utterances = social_graph.get_common_utterances(inferred_category)
@@ -270,6 +292,8 @@
                 progress(
                     progress_value, desc=f"Generating fallback suggestion {i+1}/3"
                 )
+                # Add mood to person context
+                person_context["mood"] = mood
                 suggestion = suggestion_generator.generate_suggestion(
                     person_context, user_input, temperature=temperature
                 )
@@ -284,17 +308,25 @@
                 result += "1. Sorry, I couldn't generate a suggestion at this time.\n\n"
 
     # If suggestion type is a category from common_utterances
-    elif suggestion_type in get_suggestion_categories():
-        print(f"Using category: {suggestion_type}")
-        utterances = social_graph.get_common_utterances(suggestion_type)
+    elif clean_suggestion_type in [
+        "greetings",
+        "needs",
+        "emotions",
+        "questions",
+        "tech_talk",
+        "reminiscing",
+        "organization",
+    ]:
+        print(f"Using category: {clean_suggestion_type}")
+        utterances = social_graph.get_common_utterances(clean_suggestion_type)
         print(f"Got utterances: {utterances}")
-        result = f"### {suggestion_type.replace('_', ' ').title()} Phrases:\n\n"
+        result = f"### {clean_suggestion_type.replace('_', ' ').title()} Phrases:\n\n"
         for i, utterance in enumerate(utterances, 1):
             result += f"{i}. {utterance}\n\n"
 
     # Default fallback
     else:
-        print(f"No handler for suggestion type: {suggestion_type}")
+        print(f"No handler for suggestion type: {clean_suggestion_type}")
         result = "No suggestions available. Please try a different option."
 
     print(f"Returning result: {result[:100]}...")
@@ -325,7 +357,7 @@ def transcribe_audio(audio_path):
 
 
 # Create the Gradio interface
-with gr.Blocks(title="Will's AAC Communication Aid") as demo:
+with gr.Blocks(title="Will's AAC Communication Aid", css="custom.css") as demo:
     gr.Markdown("# Will's AAC Communication Aid")
     gr.Markdown(
         """
@@ -385,33 +417,51 @@ with gr.Blocks(title="Will's AAC Communication Aid") as demo:
                 lines=3,
            )
 
-            # Audio input
-            with gr.Row():
+            # Audio input with auto-transcription
+            with gr.Column(elem_classes="audio-recorder-container"):
+                gr.Markdown("### 🎤 Or record what they said")
                audio_input = gr.Audio(
-                    label="Or record what they said:",
+                    label="",
                    type="filepath",
                    sources=["microphone"],
+                    elem_classes="audio-recorder",
+                )
+                gr.Markdown(
+                    "*Recording will auto-transcribe when stopped*",
+                    elem_classes="auto-transcribe-hint",
                )
-                transcribe_btn = gr.Button("Transcribe", variant="secondary")
 
-            # Suggestion type selection
+            # Suggestion type selection with emojis
            suggestion_type = gr.Radio(
                choices=[
-                    "model",
-                    "auto_detect",
-                    "common_phrases",
+                    "🤖 model",
+                    "🔍 auto_detect",
+                    "💬 common_phrases",
                ]
                + get_suggestion_categories(),
-                value="model",  # Default to model for better results
+                value="🤖 model",  # Default to model for better results
                label="How should I respond?",
-                info="Choose response type (model = AI-generated, auto_detect = automatic category detection)",
+                info="Choose response type",
+                elem_classes="emoji-response-options",
            )
 
+            # Add a mood slider with emoji indicators at the ends
+            with gr.Column(elem_classes="mood-slider-container"):
+                mood_slider = gr.Slider(
+                    minimum=1,
+                    maximum=5,
+                    value=3,
+                    step=1,
+                    label="How am I feeling today?",
+                    info="This will influence the tone of your responses (😢 Sad → Happy 😄)",
+                    elem_classes="mood-slider",
+                )
+
            # Model selection
            with gr.Row():
                model_dropdown = gr.Dropdown(
                    choices=list(AVAILABLE_MODELS.keys()),
-                    value="google/gemma-3-1b-it",
+                    value="google/gemma-3-2b-it",
                    label="Language Model",
                    info="Select which AI model to use for generating responses",
                )
@@ -491,12 +541,13 @@ with gr.Blocks(title="Will's AAC Communication Aid") as demo:
            topic_dropdown,
            model_dropdown,
            temperature_slider,
+            mood_slider,
        ],
        outputs=[suggestions_output],
    )
 
-    # Transcribe audio to text
-    transcribe_btn.click(
+    # Auto-transcribe audio to text when recording stops
+    audio_input.stop_recording(
        transcribe_audio,
        inputs=[audio_input],
        outputs=[user_input],

custom.css ADDED
@@ -0,0 +1,137 @@
+/* Custom CSS for Will's AAC Communication Aid */
+
+/* Main container styling */
+.gradio-container {
+    font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
+}
+
+/* Emoji response options */
+.emoji-response-options .gr-form {
+    margin-top: 10px;
+}
+
+/* Direct emoji labels for radio buttons */
+.emoji-response-options label[for$="model"] span:first-child::before {
+    content: "🤖 ";
+}
+
+.emoji-response-options label[for$="auto_detect"] span:first-child::before {
+    content: "🔍 ";
+}
+
+.emoji-response-options label[for$="common_phrases"] span:first-child::before {
+    content: "💬 ";
+}
+
+.emoji-response-options label[for$="greetings"] span:first-child::before {
+    content: "👋 ";
+}
+
+.emoji-response-options label[for$="needs"] span:first-child::before {
+    content: "🆘 ";
+}
+
+.emoji-response-options label[for$="emotions"] span:first-child::before {
+    content: "😊 ";
+}
+
+.emoji-response-options label[for$="questions"] span:first-child::before {
+    content: "❓ ";
+}
+
+.emoji-response-options label[for$="tech_talk"] span:first-child::before {
+    content: "💻 ";
+}
+
+.emoji-response-options label[for$="reminiscing"] span:first-child::before {
+    content: "🔙 ";
+}
+
+.emoji-response-options label[for$="organization"] span:first-child::before {
+    content: "📅 ";
+}
+
+/* Mood slider styling */
+.mood-slider-container {
+    margin-bottom: 20px;
+    position: relative;
+}
+
+.mood-slider .gr-slider {
+    height: 20px;
+    border-radius: 10px;
+}
+
+.mood-slider .gr-slider-value {
+    font-weight: bold;
+}
+
+/* Add emoji indicators to the ends of the slider */
+.mood-slider::before {
+    content: "😢";
+    position: absolute;
+    left: 0;
+    bottom: 5px;
+    font-size: 24px;
+}
+
+.mood-slider::after {
+    content: "😄";
+    position: absolute;
+    right: 0;
+    bottom: 5px;
+    font-size: 24px;
+}
+
+/* Style for audio recorder */
+.audio-recorder-container {
+    margin-top: 15px;
+    margin-bottom: 15px;
+    border: 2px solid #2563eb;
+    border-radius: 8px;
+    padding: 10px;
+    background-color: rgba(37, 99, 235, 0.05);
+}
+
+.audio-recorder-container h3 {
+    margin-top: 0;
+    color: #2563eb;
+}
+
+.audio-recorder {
+    margin: 10px 0;
+}
+
+.audio-recorder .mic-icon {
+    color: #2563eb;
+    font-size: 24px;
+}
+
+.auto-transcribe-hint {
+    font-size: 12px;
+    color: #666;
+    margin-top: 0;
+    text-align: center;
+}
+
+/* Improve button styling */
+.gr-button-primary {
+    background-color: #2563eb;
+    border-radius: 8px;
+    font-weight: 600;
+    transition: all 0.3s ease;
+}
+
+.gr-button-primary:hover {
+    background-color: #1d4ed8;
+    transform: translateY(-2px);
+    box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
+}
+
+/* Improve markdown output */
+#suggestions_output {
+    border-radius: 8px;
+    padding: 15px;
+    background-color: #f8fafc;
+    border-left: 4px solid #2563eb;
+}

utils.py CHANGED
@@ -277,6 +277,26 @@ class SuggestionGenerator:
             self.model_loaded = False
             return False
 
+    def _get_mood_description(self, mood_value: int) -> str:
+        """Convert mood value (1-5) to a descriptive string.
+
+        Args:
+            mood_value: Integer from 1-5 representing mood (1=sad, 5=happy)
+
+        Returns:
+            String description of the mood
+        """
+        mood_descriptions = {
+            1: "I'm feeling quite down and sad today. My responses might be more subdued.",
+            2: "I'm feeling a bit low today. I might be less enthusiastic than usual.",
+            3: "I'm feeling okay today - neither particularly happy nor sad.",
+            4: "I'm feeling pretty good today. I'm in a positive mood.",
+            5: "I'm feeling really happy and upbeat today! I'm in a great mood.",
+        }
+
+        # Default to neutral if value is out of range
+        return mood_descriptions.get(mood_value, mood_descriptions[3])
+
     def test_model(self) -> str:
         """Test if the model is working correctly."""
         if not self.model_loaded:
@@ -330,6 +350,7 @@ class SuggestionGenerator:
         selected_topic = person_context.get("selected_topic", "")
         common_phrases = person_context.get("common_phrases", [])
         frequency = person_context.get("frequency", "")
+        mood = person_context.get("mood", 3)  # Default to neutral mood (3)
 
         # Get AAC user information
         aac_user = self.aac_user_info
@@ -344,6 +365,8 @@ I am talking to {name}, who is my {role}.
 About {name}: {context}
 We typically talk about: {', '.join(topics)}
 We communicate {frequency}.
+
+My current mood: {self._get_mood_description(mood)}
 """
 
         # Add communication style based on relationship