fix: add defensive field width limits and improve explain_action docstrings

sshekhar563 · sshekhar563 · commit 763493ed6c93 · 2025-12-22T16:18:12.000+05:30
diff --git a/nexum_ai/optimizer.py b/nexum_ai/optimizer.py
@@ -361,8 +361,24 @@ def feed_metrics(self, query: str, latency_ms: float) -> None:
     
     def explain_action(self, query: str, available_actions: List[str]) -> Dict[str, Any]:
         """
-        Explain what action would be taken without executing
-        Returns Q-values and predicted action for EXPLAIN command
+        Explain what action would be taken without executing.
+        
+        Returns Q-values and predicted action for EXPLAIN command.
+        This method provides a read-only analysis of the optimizer's decision-making
+        process without actually executing any action or updating the Q-table.
+        
+        Args:
+            query: SQL query string
+            available_actions: List of possible actions
+        
+        Returns:
+            Dict containing:
+                - state: state key string
+                - q_values: Q-values for all actions
+                - best_action: action with highest Q-value (truncated to 20 chars for display)
+                - epsilon: current exploration rate
+                - would_explore: True when epsilon > 0, i.e. a random action is possible
+                - explanation: human-readable explanation of optimizer behavior
         """
         state = f"query_type_{len(query) // 10}"
         
@@ -374,13 +390,16 @@ def explain_action(self, query: str, available_actions: List[str]) -> Dict[str,
         
         best_action = max(available_actions, key=lambda a: q_values.get(a, 0.0))
         
+        # Defensive truncation for display (limit to 20 chars)
+        best_action_display = best_action[:20] if len(best_action) > 20 else best_action
+        
         return {
             'state': state,
             'q_values': q_values,
-            'best_action': best_action,
+            'best_action': best_action_display,
             'epsilon': self.epsilon,
             'would_explore': self.epsilon > 0,
-            'exploration_note': f'Random action possible (ε={self.epsilon})' if self.epsilon > 0 else 'Would use best action'
+            'explanation': f'With ε={self.epsilon:.4f}, agent would explore {self.epsilon*100:.1f}% of the time'
         }
 
 
@@ -477,65 +496,79 @@ def explain_query_plan(query: str, cache: Optional[SemanticCache] = None,
 
 
 def format_explain_output(explain_result: Dict[str, Any]) -> str:
-    """Format EXPLAIN result as a readable table"""
+    """Format EXPLAIN result as a readable table with defensive field width limits"""
+    
+    def truncate(value: Any, max_len: int) -> str:
+        """Truncate value to max length for box alignment"""
+        s = str(value)
+        if len(s) > max_len:
+            return s[:max_len - 3] + "..."
+        return s
+    
     lines = []
     lines.append("=" * 70)
     lines.append("QUERY EXECUTION PLAN")
     lines.append("=" * 70)
     
     # Smart query truncation
     query = explain_result['query']
-    if len(query) > 60:
-        display_query = query[:60] + "..."
-    else:
-        display_query = query
+    display_query = truncate(query, 60)
     
     lines.append(f"Query: {display_query}")
     lines.append("")
     
     # Parsing section
     lines.append("┌─ PARSING ─────────────────────────────────────────────────────────┐")
     p = explain_result['parsing']
-    lines.append(f"│ Type: {p['query_type']:<15} Complexity: {p['complexity_estimate']}/10              │")
+    query_type = truncate(p['query_type'], 15)
+    lines.append(f"│ Type: {query_type:<15} Complexity: {p['complexity_estimate']}/10              │")
     lines.append(f"│ WHERE: {str(p['has_where_clause']):<8} JOIN: {str(p['has_join']):<8} AGG: {str(p['has_aggregation']):<8}     │")
     lines.append("└───────────────────────────────────────────────────────────────────┘")
     lines.append("")
     
     # Cache section
     lines.append("┌─ CACHE LOOKUP ────────────────────────────────────────────────────┐")
     c = explain_result['cache_analysis']
-    lines.append(f"│ Entries checked: {c['cache_entries_checked']:<5} Threshold: {c['similarity_threshold']:<6}            │")
+    # Defensive limits: cache_entries_checked capped at 99999 for display
+    entries_checked = min(c['cache_entries_checked'], 99999)
+    lines.append(f"│ Entries checked: {entries_checked:<5} Threshold: {c['similarity_threshold']:<6}            │")
     lines.append(f"│ Best similarity: {c['best_similarity']:<6} Would hit: {str(c['would_hit_cache']):<6}              │")
     if c['top_matches']:
         lines.append("│ Top matches:                                                      │")
         for match in c['top_matches'][:3]:
             sim = match['similarity']
             hit = "✓" if match['would_hit'] else "✗"
-            # Smart truncation for cached queries
-            cached_query = match['cached_query']
-            if not cached_query.endswith('...') and len(cached_query) > 45:
-                cached_query = cached_query[:42] + "..."
+            # Smart truncation for cached queries (limit to 45 chars)
+            cached_query = truncate(match['cached_query'], 45)
             lines.append(f"│   {hit} {sim:.4f} - {cached_query:<45} │")
     lines.append("└───────────────────────────────────────────────────────────────────┘")
     lines.append("")
     
     # RL Agent section
     lines.append("┌─ RL AGENT ────────────────────────────────────────────────────────┐")
     r = explain_result['rl_agent']
-    lines.append(f"│ State: {r['state']:<30} Epsilon: {r.get('epsilon', r.get('exploration_probability', 0)):<6}        │")
-    lines.append(f"│ Best action: {r['best_action']:<20}                          │")
+    # Defensive truncation for state (30 chars) and best_action (20 chars)
+    state_display = truncate(r['state'], 30)
+    best_action_display = truncate(r['best_action'], 20)
+    lines.append(f"│ State: {state_display:<30} Epsilon: {r.get('epsilon', 0):<6}        │")
+    lines.append(f"│ Best action: {best_action_display:<20}                          │")
     lines.append("│ Q-values:                                                         │")
     for action, qval in r['q_values'].items():
-        lines.append(f"│   {action:<15}: {qval:>8.4f}                                    │")
+        # Truncate action names to 15 chars for alignment
+        action_display = truncate(action, 15)
+        lines.append(f"│   {action_display:<15}: {qval:>8.4f}                                    │")
     lines.append("└───────────────────────────────────────────────────────────────────┘")
     lines.append("")
     
     # Execution strategy
     lines.append("┌─ EXECUTION STRATEGY ──────────────────────────────────────────────┐")
     e = explain_result['execution_strategy']
-    lines.append(f"│ Strategy: {e['strategy']:<20} Est. latency: {e['estimated_latency']:<10}   │")
+    # Defensive truncation for strategy (20 chars) and recommendation (40 chars)
+    strategy_display = truncate(e['strategy'], 20)
+    recommendation_display = truncate(e['recommendation'], 40)
+    lines.append(f"│ Strategy: {strategy_display:<20} Est. latency: {e['estimated_latency']:<10}   │")
     lines.append(f"│ Will cache: {str(e['will_cache_result']):<8}                                          │")
-    lines.append(f"│ Recommendation: {e['recommendation']:<40}       │")
+    lines.append(f"│ Recommendation: {recommendation_display:<40}       │")
     lines.append("└───────────────────────────────────────────────────────────────────┘")
     
     return "\n".join(lines)
diff --git a/nexum_ai/rl_agent.py b/nexum_ai/rl_agent.py
@@ -175,8 +175,28 @@ def get_stats(self) -> Dict[str, float]:
     
     def explain_action(self, query_length: int, cache_hit: bool, complexity: int) -> Dict[str, Any]:
         """
-        Explain what action would be taken without executing
-        Returns Q-values, state analysis, and predicted action for EXPLAIN command
+        Explain what action would be taken without executing.
+        
+        Returns Q-values, state analysis, and predicted action for EXPLAIN command.
+        This method provides a read-only analysis of the RL agent's decision-making
+        process without actually executing any action or updating the Q-table.
+        
+        Args:
+            query_length: Length of SQL query
+            cache_hit: Whether query hit cache
+            complexity: Complexity score (0-10)
+        
+        Returns:
+            Dict containing:
+                - state: state key string
+                - state_breakdown: dict with query_length_bucket, cache_hit, complexity
+                - q_values: Q-values for all actions
+                - best_action: action with highest Q-value (truncated to 20 chars for display)
+                - epsilon: current exploration rate
+                - would_explore: True when epsilon > 0, i.e. a random action is possible
+                - predicted_action: same (truncated) value as best_action; deterministic, ignores epsilon-greedy
+                - explanation: human-readable explanation of agent behavior
+                - agent_stats: total_states_learned, total_updates, episodes
         """
         state = self._get_state_key(query_length, cache_hit, complexity)
         
@@ -189,6 +209,9 @@ def explain_action(self, query_length: int, cache_hit: bool, complexity: int) ->
         # Determine best action
         best_action = max(self.actions, key=lambda a: q_values.get(a, 0.0))
         
+        # Truncate best_action for display if needed (defensive limit)
+        best_action_display = best_action[:20] if len(best_action) > 20 else best_action
+        
         return {
             'state': state,
             'state_breakdown': {
@@ -197,11 +220,11 @@ def explain_action(self, query_length: int, cache_hit: bool, complexity: int) ->
                 'complexity': complexity
             },
             'q_values': q_values,
-            'best_action': best_action,
+            'best_action': best_action_display,
             'epsilon': round(self.epsilon, 4),
             'would_explore': self.epsilon > 0,
-            'predicted_action': best_action,  # Deterministic for explain
-            'exploration_probability': round(self.epsilon, 4),
+            'predicted_action': best_action_display,  # Deterministic for explain
+            'explanation': f'With ε={self.epsilon:.4f}, agent would explore {self.epsilon*100:.1f}% of the time',
             'agent_stats': {
                 'total_states_learned': len(self.q_table),
                 'total_updates': len(self.training_history),