Skip to content

Commit c34c57d

Browse files
Authored and committed by Benjamin Feuer: "patch chat behavior"
1 parent 7035f3f commit c34c57d

File tree

4 files changed

+262
-470
lines changed

4 files changed

+262
-470
lines changed

marvis/models/marvis_tsne.py

Lines changed: 25 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -2029,7 +2029,13 @@ def chat(self, user_input: str, max_history: int = 10) -> str:
20292029
- Completion Rate: {prediction_context.get('completion_rate', 'N/A')}
20302030
""")
20312031

2032-
# Add visualization context if available
2032+
# Add visualization context
2033+
has_viz_image = hasattr(self, '_last_viz_image') and self._last_viz_image is not None
2034+
if has_viz_image:
2035+
context_parts.append("""
2036+
**Visualization:** The most recent t-SNE visualization from the prediction session is attached to this message. You can see the exact spatial layout of training points, test points, and the query point that was classified. Reference specific visual details (cluster positions, neighbor distributions, color patterns) in your response.
2037+
""")
2038+
20332039
if prediction_context.get('visualization_context'):
20342040
viz_context = prediction_context['visualization_context']
20352041
context_parts.append(f"""
@@ -2078,41 +2084,45 @@ def chat(self, user_input: str, max_history: int = 10) -> str:
20782084
# Generate response using the VLM
20792085
self.logger.info("Generating chat response...")
20802086

2087+
# Get the stored visualization image from the last prediction (if any)
2088+
chat_image = getattr(self, '_last_viz_image', None)
2089+
20812090
# Use the VLM wrapper interface for chat
20822091
if hasattr(self.vlm_wrapper, 'generate_response'):
20832092
# Use the standard generate_response interface
20842093
response = self.vlm_wrapper.generate_response(
20852094
text_input=chat_prompt,
2086-
image_input=None, # Text-only conversation
2095+
image_input=chat_image, # Pass last visualization if available
20872096
max_tokens=1000,
20882097
temperature=0.7 # Slightly higher temperature for conversational responses
20892098
)
2090-
elif hasattr(self.vlm_wrapper, 'generate'):
2091-
# Use the direct generate interface with proper parameters
2099+
elif hasattr(self.vlm_wrapper, 'generate_from_conversation'):
2100+
# Use conversation interface if available
20922101
from marvis.utils.model_loader import GenerationConfig
2102+
from marvis.utils.vlm_prompting import create_vlm_conversation
2103+
conversation = create_vlm_conversation(chat_image, chat_prompt) if chat_image else [{"role": "user", "content": chat_prompt}]
20932104
config = GenerationConfig(
2094-
max_new_tokens=512,
2105+
max_new_tokens=1000,
20952106
temperature=0.7,
20962107
do_sample=True,
20972108
top_p=0.9
20982109
)
2099-
response = self.vlm_wrapper.generate(
2100-
inputs=chat_prompt,
2101-
config=config
2110+
response = self.vlm_wrapper.generate_from_conversation(
2111+
conversation,
2112+
config
21022113
)
2103-
elif hasattr(self.vlm_wrapper, 'generate_from_conversation'):
2104-
# Use conversation interface if available
2114+
elif hasattr(self.vlm_wrapper, 'generate'):
2115+
# Use the direct generate interface with proper parameters
21052116
from marvis.utils.model_loader import GenerationConfig
2106-
conversation = [{"role": "user", "content": chat_prompt}]
21072117
config = GenerationConfig(
2108-
max_new_tokens=512,
2118+
max_new_tokens=1000,
21092119
temperature=0.7,
21102120
do_sample=True,
21112121
top_p=0.9
21122122
)
2113-
response = self.vlm_wrapper.generate_from_conversation(
2114-
conversation,
2115-
config
2123+
response = self.vlm_wrapper.generate(
2124+
inputs=chat_prompt,
2125+
config=config
21162126
)
21172127
else:
21182128
# Final fallback - raise informative error

marvis/models/process_one_sample.py

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -566,6 +566,11 @@ def process_one_sample(
566566

567567
# Process image and generate VLM response
568568
image = _process_image(classifier_instance, image)
569+
570+
# Store the last visualization image and prompt on the classifier for chat access
571+
classifier_instance._last_viz_image = image.copy()
572+
classifier_instance._last_viz_prompt = prompt
573+
569574
response = _generate_vlm_response(classifier_instance, image, prompt)
570575
prediction = _parse_prediction(response, classifier_instance, all_classes)
571576

marvis/utils/class_name_utils.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -603,7 +603,7 @@ def normalize_predictions_to_target(
603603
Returns:
604604
List of predictions converted to the same type space as y_reference.
605605
"""
606-
if not y_reference:
606+
if y_reference is None or len(y_reference) == 0:
607607
return predictions
608608

609609
tgt_example = y_reference[0]

0 commit comments

Comments (0)