NexumDB/nexum_ai/optimizer.py at eef50dc0b061e889e15c28f0f9e38fb9e6f9d25b · aviralgarg05/NexumDB · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
"""
Semantic cache and query optimizer using local embedding models
"""

import numpy as np
from typing import Optional, List, Dict, Any
import json
import os
from pathlib import Path

class SemanticCache:
    """
    Caches query results using semantic similarity
    Uses local embedding models only
    Supports persistence to disk via JSON; legacy pickle files are read
    once and converted to JSON

    Every cache entry is a dict with the keys 'query', 'vector' and 'result'.
    A lookup embeds the incoming query and compares it against each stored
    vector with cosine similarity.
    """

    # Keys an entry must carry to be usable by get() and explain_query()
    _ENTRY_KEYS = ('query', 'vector', 'result')

    def __init__(self, similarity_threshold: float = 0.95, cache_file: str = "semantic_cache.pkl") -> None:
        """
        Create the cache and load any previously persisted entries.

        Args:
            similarity_threshold: minimum cosine similarity for a cache hit.
                A persisted cache file that stores its own threshold
                replaces this value during load_cache().
            cache_file: file name inside the local "cache" directory. The
                NEXUMDB_CACHE_FILE environment variable, when set, takes
                precedence over this argument.
        """
        self.cache: List[Dict] = []
        self.similarity_threshold = similarity_threshold
        self.model = None
        self.hf_model = None
        self.hf_tokenizer = None
        # Remembers that model loading was already tried, so a missing
        # backend is not re-imported (and re-reported) on every vectorize()
        self._model_init_attempted = False

        # Support environment variable for cache file path
        cache_file_env = os.environ.get('NEXUMDB_CACHE_FILE', cache_file)
        self.cache_file = cache_file_env

        self.cache_dir = Path("cache")
        self.cache_dir.mkdir(exist_ok=True)
        self.cache_path = self.cache_dir / self.cache_file

        # Load existing cache on initialization
        self.load_cache()

    def initialize_model(self) -> None:
        """
        Initialize local embedding model - deferred to avoid import errors

        Tries SentenceTransformer first, then plain HuggingFace transformers.
        When neither can be loaded all model attributes stay None and
        vectorize() uses the character-code fallback. The model name comes
        from the NEXUM_EMBEDDING_MODEL environment variable.
        """
        self._model_init_attempted = True
        model_name = os.environ.get('NEXUM_EMBEDDING_MODEL', 'all-MiniLM-L6-v2')

        # Try SentenceTransformer first (preferred for embedding models)
        try:
            from sentence_transformers import SentenceTransformer
            self.model = SentenceTransformer(model_name)
            print(f"Semantic cache initialized with SentenceTransformer: {model_name}")
            self.hf_model = None
            self.hf_tokenizer = None
            return
        except ImportError:
            print("Warning: sentence-transformers not installed, trying transformers fallback")
        except Exception as e:
            print(f"Warning: Failed to load with SentenceTransformer ({e}), trying transformers fallback")

        # Fallback to generic HuggingFace transformers
        try:
            from transformers import AutoTokenizer, AutoModel
            # Imported only to fail early (ImportError) when torch is missing;
            # vectorize() needs it for the HF code path
            import torch  # noqa: F401

            # 'all-MiniLM-L6-v2' is a sentence-transformers alias; on the HF Hub
            # the same model lives under the 'sentence-transformers/' namespace.
            if model_name == 'all-MiniLM-L6-v2':
                model_name = 'sentence-transformers/all-MiniLM-L6-v2'

            self.hf_tokenizer = AutoTokenizer.from_pretrained(model_name)
            self.hf_model = AutoModel.from_pretrained(model_name)
            self.model = None
            print(f"Semantic cache initialized with HuggingFace transformers: {model_name}")
        except ImportError:
            print("Warning: transformers not installed, using simple fallback")
            self.model = None
            self.hf_model = None
            self.hf_tokenizer = None
        except Exception as e:
            print(f"Warning: Failed to load with transformers ({e}), using simple fallback")
            self.model = None
            self.hf_model = None
            self.hf_tokenizer = None

    def vectorize(self, text: str) -> List[float]:
        """
        Convert text to embedding vector

        Loads the embedding model on first use. If loading already failed
        once it is not retried here; call initialize_model() explicitly to
        try again.
        """
        no_model = self.model is None and self.hf_model is None
        if no_model and not getattr(self, '_model_init_attempted', False):
            self.initialize_model()

        if self.model is not None:
            embedding = self.model.encode(text)
            return embedding.tolist()
        elif self.hf_model is not None and self.hf_tokenizer is not None:
            try:
                import torch
                # Tokenize and compute embedding
                inputs = self.hf_tokenizer(text, return_tensors="pt", padding=True, truncation=True, max_length=512)
                with torch.no_grad():
                    outputs = self.hf_model(**inputs)

                # Mean pooling over tokens, weighted by the attention mask
                attention_mask = inputs['attention_mask']
                token_embeddings = outputs.last_hidden_state

                input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
                sum_embeddings = torch.sum(token_embeddings * input_mask_expanded, 1)
                # clamp avoids a division by zero for an all-zero mask
                sum_mask = torch.clamp(input_mask_expanded.sum(1), min=1e-9)

                embedding = sum_embeddings / sum_mask
                return embedding[0].tolist()
            except Exception as e:
                print(f"Error during HF vectorization: {e}, using fallback")
                return self._fallback_vectorize(text)
        else:
            return self._fallback_vectorize(text)

    def _fallback_vectorize(self, text: str) -> List[float]:
        """
        Simple fallback vectorization from character codes

        Returns a 384-element vector whose i-th component is
        ord(text[i]) / 128 for the first 384 characters and 0.0 afterwards.
        """
        vec = [0.0] * 384
        for i, char in enumerate(text[:384]):
            vec[i] = float(ord(char)) / 128.0
        return vec

    def cosine_similarity(self, vec1: List[float], vec2: List[float]) -> float:
        """
        Calculate cosine similarity between two vectors

        Returns 0.0 when either vector has zero length or when the two
        vectors have different shapes (for example a persisted entry that
        was embedded with a different model), instead of raising.
        """
        vec1_arr = np.asarray(vec1, dtype=float)
        vec2_arr = np.asarray(vec2, dtype=float)

        # Vectors from different embedding backends cannot be compared
        if vec1_arr.shape != vec2_arr.shape:
            return 0.0

        norm1 = np.linalg.norm(vec1_arr)
        norm2 = np.linalg.norm(vec2_arr)
        if norm1 == 0 or norm2 == 0:
            return 0.0

        return float(np.dot(vec1_arr, vec2_arr) / (norm1 * norm2))

    def get(self, query: str) -> Optional[str]:
        """
        Retrieve cached result if similar query exists

        Returns the result of the most similar entry whose similarity
        reaches the threshold (the earliest entry wins a tie), or None when
        no entry qualifies.
        """
        query_vec = self.vectorize(query)

        best_entry = None
        best_similarity = 0.0
        for entry in self.cache:
            similarity = self.cosine_similarity(query_vec, entry['vector'])
            if similarity < self.similarity_threshold:
                continue
            if best_entry is None or similarity > best_similarity:
                best_entry = entry
                best_similarity = similarity

        if best_entry is None:
            return None

        print(f"Cache hit! Similarity: {best_similarity:.4f}")
        return best_entry['result']

    def put(self, query: str, result: str) -> None:
        """Store query and result in cache (in memory only; see save_cache)"""
        query_vec = self.vectorize(query)
        self.cache.append({
            'query': query,
            'vector': query_vec,
            'result': result
        })
        print(f"Cached query: {query[:50]}...")

    def clear(self) -> None:
        """Clear the cache and delete its files (JSON and legacy pickle)"""
        self.cache.clear()

        # save_cache() writes to the JSON sibling of cache_path, so both
        # locations have to be removed or the entries come back on reload
        primary = str(self.cache_path)
        removed = False
        for path in dict.fromkeys((primary, self._json_path(primary))):
            try:
                os.remove(path)
                removed = True
            except FileNotFoundError:
                pass
        if removed:
            print("Cache file deleted")

    @staticmethod
    def _json_path(filepath: str) -> str:
        """Return the JSON file used for filepath: a '.pkl' suffix becomes '.json'"""
        if filepath.endswith('.pkl'):
            return filepath[:-len('.pkl')] + '.json'
        return filepath

    @classmethod
    def _filter_valid_entries(cls, entries: Any) -> List[Dict]:
        """Keep only dict entries that carry every key in _ENTRY_KEYS"""
        if not isinstance(entries, list):
            return []
        valid_entries = []
        for entry in entries:
            if isinstance(entry, dict) and all(key in entry for key in cls._ENTRY_KEYS):
                valid_entries.append(entry)
            else:
                print("Warning: Invalid cache entry found and removed")
        return valid_entries

    def save_cache(self, filepath: Optional[str] = None) -> None:
        """
        Save cache to disk using JSON format (secure default)

        Args:
            filepath: target file; defaults to cache_path. A '.pkl' suffix
                is replaced by '.json', any other name is used unchanged.
        """
        if filepath is None:
            filepath = str(self.cache_path)

        # Use JSON format by default for security
        self.save_cache_json(self._json_path(filepath))

    def load_cache(self, filepath: Optional[str] = None) -> None:
        """
        Load cache from disk using JSON (safe) or pickle (legacy)

        Looks for the JSON file that save_cache() would write for filepath,
        then for '<filepath>.json' (older lookup location), and finally for
        a legacy '.pkl' file, which is converted to JSON after loading.
        Starts with an empty cache when nothing usable is found.
        """
        if filepath is None:
            filepath = str(self.cache_path)

        # Try JSON first (safer format)
        json_candidates = [self._json_path(filepath)]
        if not filepath.endswith('.pkl'):
            json_candidates.append(f"{filepath}.json")
        for json_filepath in json_candidates:
            if os.path.isfile(json_filepath):
                self.load_cache_json(json_filepath)
                return

        if not (filepath.endswith('.pkl') and os.path.exists(filepath)):
            print(f"No cache file found at {filepath}, starting with empty cache")
            return

        # Fall back to pickle for legacy files.
        # NOTE(review): unpickling is only as safe as the file's origin; the
        # restricted unpickler below rejects every global that is not a plain
        # builtin container or scalar type.
        try:
            import pickle

            class RestrictedUnpickler(pickle.Unpickler):
                """Restricted unpickler that only allows safe types"""
                ALLOWED_CLASSES = {
                    ('builtins', 'dict'),
                    ('builtins', 'list'),
                    ('builtins', 'str'),
                    ('builtins', 'int'),
                    ('builtins', 'float'),
                    ('builtins', 'bool'),
                    ('builtins', 'tuple'),
                    ('builtins', 'set'),
                    ('builtins', 'frozenset'),
                }

                def find_class(self, module: str, name: str) -> type:
                    if (module, name) not in self.ALLOWED_CLASSES:
                        raise pickle.UnpicklingError(
                            f"Forbidden class: {module}.{name}"
                        )
                    return super().find_class(module, name)

            with open(filepath, 'rb') as f:
                data = RestrictedUnpickler(f).load()

            self.cache = self._filter_valid_entries(data.get('cache', []))
            self.similarity_threshold = data.get('similarity_threshold', self.similarity_threshold)

            print(f"Semantic cache loaded from {filepath} ({len(self.cache)} entries)")
            print("Note: Converting legacy pickle cache to JSON format for security")

            # Auto-convert to JSON format for future use
            self.save_cache_json(self._json_path(filepath))

        except Exception as e:
            print(f"Error loading semantic cache: {e}")
            print("Starting with empty cache")
            self.cache = []

    def save_cache_json(self, filepath: Optional[str] = None) -> None:
        """
        Save cache to JSON format (secure and portable)

        The data is written to '<filepath>.tmp' and then moved over the
        target with os.replace, so a failed write leaves an existing cache
        file untouched. Errors are reported on stdout, not raised.
        """
        if filepath is None:
            filepath = self._json_path(str(self.cache_path))

        cache_data = {
            'cache': self.cache,
            'similarity_threshold': self.similarity_threshold,
            'cache_size': len(self.cache),
            'format_version': '1.0'
        }

        tmp_path = f"{filepath}.tmp"
        try:
            with open(tmp_path, 'w', encoding='utf-8') as f:
                json.dump(cache_data, f, indent=2)
            os.replace(tmp_path, filepath)
            print(f"Semantic cache saved to {filepath} ({len(self.cache)} entries)")
        except Exception as e:
            # Best effort: persistence problems must not break query handling
            print(f"Error saving cache to JSON: {e}")
            try:
                os.remove(tmp_path)
            except OSError:
                pass

    def load_cache_json(self, filepath: Optional[str] = None) -> None:
        """
        Load cache from JSON format

        Entries missing any of the 'query', 'vector' or 'result' keys are
        dropped. An unreadable or malformed file results in an empty cache.
        """
        if filepath is None:
            filepath = self._json_path(str(self.cache_path))

        if not os.path.exists(filepath):
            print(f"No JSON cache file found at {filepath}")
            return

        try:
            with open(filepath, 'r', encoding='utf-8') as f:
                data = json.load(f)

            self.cache = self._filter_valid_entries(data.get('cache', []))
            self.similarity_threshold = data.get('similarity_threshold', self.similarity_threshold)

            print(f"Semantic cache loaded from JSON: {filepath} ({len(self.cache)} entries)")

        except Exception as e:
            print(f"Error loading cache from JSON: {e}")
            self.cache = []

    def get_cache_stats(self) -> Dict[str, Any]:
        """
        Get cache statistics

        'cache_exists' and 'cache_size_bytes' describe the file actually on
        disk: the JSON file written by save_cache() if present, otherwise
        the file at cache_path itself.
        """
        primary = str(self.cache_path)
        cache_exists = False
        cache_size_bytes = 0
        for candidate in dict.fromkeys((self._json_path(primary), primary)):
            try:
                cache_size_bytes = os.path.getsize(candidate)
            except OSError:
                continue
            cache_exists = True
            break

        return {
            'total_entries': len(self.cache),
            'similarity_threshold': self.similarity_threshold,
            'cache_file': primary,
            'cache_exists': cache_exists,
            'cache_size_bytes': cache_size_bytes
        }

    def explain_query(self, query: str) -> Dict[str, Any]:
        """
        Analyze query without executing - returns cache similarity scores
        and potential cache hits for EXPLAIN command

        'would_hit_cache' is True exactly when get() would return a result,
        i.e. when at least one entry reaches the similarity threshold.
        """
        query_vec = self.vectorize(query)

        cache_analysis = []
        best_match = None
        best_similarity = 0.0

        for entry in self.cache:
            similarity = self.cosine_similarity(query_vec, entry['vector'])
            # Smart truncation for cached query display
            cached_query = entry['query']
            if len(cached_query) > 50:
                display_query = cached_query[:50] + '...'
            else:
                display_query = cached_query

            cache_analysis.append({
                'cached_query': display_query,
                'similarity': round(similarity, 4),
                'would_hit': similarity >= self.similarity_threshold
            })
            if similarity > best_similarity:
                best_similarity = similarity
                best_match = entry['query']

        would_hit_cache = any(item['would_hit'] for item in cache_analysis)

        # Sort by similarity descending
        cache_analysis.sort(key=lambda x: x['similarity'], reverse=True)

        # Smart truncation for best match
        if best_match and len(best_match) > 50:
            best_match_display = best_match[:50] + '...'
        else:
            best_match_display = best_match

        return {
            'query': query,
            'cache_entries_checked': len(self.cache),
            'similarity_threshold': self.similarity_threshold,
            'best_match': best_match_display,
            'best_similarity': round(best_similarity, 4),
            'would_hit_cache': would_hit_cache,
            'top_matches': cache_analysis[:5]  # Top 5 similar cached queries
        }

    def set_cache_expiration(self, max_age_hours: int = 24) -> None:
        """Placeholder for TTL support: only prints a notice, removes nothing"""
        # A real implementation needs timestamps on cache entries
        print(f"Cache expiration set to {max_age_hours} hours (not yet implemented)")

    def optimize_cache(self, max_entries: int = 1000) -> None:
        """
        Remove oldest entries if cache exceeds max size

        Keeps the last max_entries entries and persists the result via
        save_cache(). Does nothing when the cache is already small enough.
        Negative values are treated as 0.
        """
        max_entries = max(max_entries, 0)
        removed_count = len(self.cache) - max_entries
        if removed_count <= 0:
            return

        # Slice from the front: cache[-max_entries:] would keep everything
        # for max_entries == 0
        self.cache = self.cache[removed_count:]
        print(f"Cache optimized: removed {removed_count} oldest entries")
        self.save_cache()


class QueryOptimizer:
    """
    Reinforcement learning-based query optimizer
    Uses Q-learning to optimize query execution

    The Q-table maps a state key to a dict of action -> Q-value. States for
    queries are derived from the query length (see _state_key).
    """

    def __init__(self, learning_rate: float = 0.1, discount_factor: float = 0.9) -> None:
        """
        Args:
            learning_rate: step size used when moving a Q-value towards its
                new estimate in update().
            discount_factor: weight of the best next-state Q-value in update().
        """
        self.q_table: Dict[str, Dict[str, float]] = {}
        self.learning_rate = learning_rate
        self.discount_factor = discount_factor
        # Probability of picking a random action in get_action()
        self.epsilon = 0.1

    @staticmethod
    def _state_key(query: str) -> str:
        """Bucket a query into a state by its length in steps of 10 characters"""
        return f"query_type_{len(query) // 10}"

    def get_action(self, state: str, available_actions: List[str]) -> str:
        """
        Select action using epsilon-greedy strategy

        With probability epsilon a random action is returned; otherwise the
        action with the highest Q-value for the state (the first one wins a
        tie). An unseen state is added to the Q-table with all-zero values.

        Raises:
            ValueError: if available_actions is empty.
        """
        if not available_actions:
            raise ValueError("available_actions must not be empty")

        if np.random.random() < self.epsilon:
            # np.random.choice returns a numpy scalar; hand back a plain str
            return str(np.random.choice(available_actions))

        if state not in self.q_table:
            self.q_table[state] = {action: 0.0 for action in available_actions}

        state_values = self.q_table[state]
        return max(available_actions, key=lambda a: state_values.get(a, 0.0))

    def update(self, state: str, action: str, reward: float, next_state: str) -> None:
        """
        Update Q-values based on observed reward

        Applies Q(s, a) += learning_rate * (reward + discount_factor *
        max Q(next_state, .) - Q(s, a)), treating unknown states and actions
        as having a Q-value of 0.
        """
        action_values = self.q_table.setdefault(state, {})
        current_q = action_values.setdefault(action, 0.0)

        next_values = self.q_table.get(next_state)
        max_next_q = max(next_values.values()) if next_values else 0.0

        new_q = current_q + self.learning_rate * (reward + self.discount_factor * max_next_q - current_q)
        action_values[action] = new_q

        print(f"Updated Q({state}, {action}) = {new_q:.4f}")

    def feed_metrics(self, query: str, latency_ms: float) -> None:
        """
        Feed execution metrics to the optimizer

        The reward is the negated latency in seconds, recorded for the
        "execute" action of the query's state with "completed" as next state.
        """
        reward = -latency_ms / 1000.0
        self.update(self._state_key(query), "execute", reward, "completed")

    def explain_action(self, query: str, available_actions: List[str]) -> Dict[str, Any]:
        """
        Explain what action would be taken without executing.

        Returns Q-values and predicted action for EXPLAIN command.
        This method provides a read-only analysis of the optimizer's decision-making
        process without actually executing any action or updating the Q-table.

        Args:
            query: SQL query string
            available_actions: List of possible actions

        Returns:
            Dict containing:
                - state: state key string
                - q_values: Q-values (rounded to 4 places) for every available
                  action, followed by any other action already learned for
                  this state
                - best_action: available action with highest Q-value,
                  cut to 20 characters
                - epsilon: current exploration rate
                - would_explore: whether exploration is possible
                - explanation: human-readable explanation of optimizer behavior

        Raises:
            ValueError: if available_actions is empty.
        """
        if not available_actions:
            raise ValueError("available_actions must not be empty")

        state = self._state_key(query)
        learned = self.q_table.get(state, {})

        # Every available action gets a value, even if only some were learned
        q_values = {a: round(learned.get(a, 0.0), 4) for a in available_actions}
        for action, value in learned.items():
            q_values.setdefault(action, round(value, 4))

        best_action = max(available_actions, key=lambda a: q_values[a])

        # Defensive truncation for display (limit to 20 chars)
        best_action_display = best_action[:20]

        return {
            'state': state,
            'q_values': q_values,
            'best_action': best_action_display,
            'epsilon': self.epsilon,
            'would_explore': self.epsilon > 0,
            'explanation': f'With ε={self.epsilon:.4f}, agent would explore {self.epsilon*100:.1f}% of the time'
        }


def test_vectorization() -> Dict[str, Any]:
    """
    Test function for Rust integration

    Embeds one fixed SQL string with a fresh SemanticCache and reports the
    query, the first ten vector components and the vector length.
    """
    sample_sql = "SELECT * FROM users WHERE age > 25"
    embedding = SemanticCache().vectorize(sample_sql)

    summary: Dict[str, Any] = {'query': sample_sql}
    summary['vector'] = embedding[:10]
    summary['dimension'] = len(embedding)
    return summary


def explain_query_plan(query: str, cache: Optional[SemanticCache] = None,
                       optimizer: Optional[QueryOptimizer] = None) -> Dict[str, Any]:
    """
    Generate a complete EXPLAIN plan for a query
    Shows parsing, cache analysis, and RL agent predictions

    Args:
        query: SQL query string to analyze
        cache: cache to inspect; a new SemanticCache is created when omitted
        optimizer: optimizer to consult; a new QueryOptimizer is created
            when omitted

    Returns:
        Dict with the keys 'query', 'query_length', 'parsing',
        'cache_analysis', 'rl_agent' and 'execution_strategy'.
    """
    # Local import keeps this function self-contained; the module header
    # does not import re
    import re

    result = {
        'query': query,
        'query_length': len(query),
        'parsing': {},
        'cache_analysis': {},
        'rl_agent': {},
        'execution_strategy': {}
    }

    # 1. Query Parsing Analysis
    query_upper = query.upper().strip()
    statement_keywords = ('SELECT', 'INSERT', 'UPDATE', 'DELETE', 'CREATE')
    query_type = next(
        (kw for kw in statement_keywords if query_upper.startswith(kw)),
        'UNKNOWN'
    )

    def has_pattern(pattern: str) -> bool:
        """Whole-word search, so WHERE does not match inside SOMEWHERE"""
        return re.search(pattern, query_upper) is not None

    result['parsing'] = {
        'query_type': query_type,
        'query_length': len(query),
        'complexity_estimate': min(len(query) // 20, 10),
        'has_where_clause': has_pattern(r'\bWHERE\b'),
        'has_join': has_pattern(r'\bJOIN\b'),
        # Require the call parenthesis so column or table names such as
        # ACCOUNTS or ADMIN are not mistaken for COUNT(...) or MIN(...)
        'has_aggregation': has_pattern(r'\b(?:COUNT|SUM|AVG|MAX|MIN)\s*\('),
        'has_order_by': has_pattern(r'\bORDER\s+BY\b'),
        'has_group_by': has_pattern(r'\bGROUP\s+BY\b')
    }

    # 2. Cache Analysis
    if cache is None:
        cache = SemanticCache()
    result['cache_analysis'] = cache.explain_query(query)

    # 3. RL Agent Analysis
    if optimizer is None:
        optimizer = QueryOptimizer()

    available_actions = ['use_cache', 'bypass_cache', 'full_scan', 'index_scan']
    result['rl_agent'] = optimizer.explain_action(query, available_actions)

    # 4. Execution Strategy
    would_hit_cache = result['cache_analysis'].get('would_hit_cache', False)
    best_action = result['rl_agent'].get('best_action', 'full_scan')

    if would_hit_cache:
        strategy = 'CACHE_HIT'
        estimated_latency = '< 1ms'
    elif best_action == 'use_cache':
        strategy = 'CACHE_MISS_THEN_STORE'
        estimated_latency = '5-50ms'
    elif best_action == 'index_scan':
        strategy = 'INDEX_SCAN'
        estimated_latency = '1-10ms'
    else:
        strategy = 'FULL_SCAN'
        estimated_latency = '10-100ms'

    will_cache_result = query_type == 'SELECT' and not would_hit_cache

    # Keep the recommendation in line with will_cache_result
    if would_hit_cache:
        recommendation = 'Use cached result'
    elif will_cache_result:
        recommendation = 'Execute and cache'
    else:
        recommendation = 'Execute without caching'

    result['execution_strategy'] = {
        'strategy': strategy,
        'estimated_latency': estimated_latency,
        'will_cache_result': will_cache_result,
        'recommendation': recommendation
    }

    return result


def format_explain_output(explain_result: Dict[str, Any]) -> str:
    """
    Format EXPLAIN result as a readable table with defensive field width limits

    Args:
        explain_result: dict with the keys 'query', 'parsing',
            'cache_analysis', 'rl_agent' and 'execution_strategy', as
            produced by explain_query_plan().

    Returns:
        Multi-line string. Every box line (border or row) has the same
        width; rows are padded or cut to fit instead of relying on
        hand-counted spaces.
    """
    inner_width = 67  # characters between the left and right box edges

    def truncate(value: Any, max_len: int) -> str:
        """Truncate value to max length for box alignment"""
        s = str(value)
        if len(s) > max_len:
            return s[:max_len - 3] + "..."
        return s

    def box_top(title: str) -> str:
        """Top border carrying the section title"""
        return "┌─ " + title + " " + "─" * (inner_width - len(title) - 3) + "┐"

    def box_row(content: str) -> str:
        """One content row with a one-space margin, padded to the box width"""
        body = (" " + content)[:inner_width - 1]
        return "│" + body.ljust(inner_width) + "│"

    box_bottom = "└" + "─" * inner_width + "┘"

    lines = []
    lines.append("=" * 70)
    lines.append("QUERY EXECUTION PLAN")
    lines.append("=" * 70)

    # Smart query truncation
    lines.append(f"Query: {truncate(explain_result['query'], 60)}")
    lines.append("")

    # Parsing section
    p = explain_result['parsing']
    query_type = truncate(p['query_type'], 15)
    lines.append(box_top("PARSING"))
    lines.append(box_row(f"Type: {query_type:<15} Complexity: {p['complexity_estimate']}/10"))
    lines.append(box_row(
        f"WHERE: {str(p['has_where_clause']):<8} JOIN: {str(p['has_join']):<8} "
        f"AGG: {str(p['has_aggregation']):<8}"
    ))
    lines.append(box_bottom)
    lines.append("")

    # Cache section
    c = explain_result['cache_analysis']
    # Defensive limits: cache_entries_checked capped at 99999 for display
    entries_checked = min(c['cache_entries_checked'], 99999)
    lines.append(box_top("CACHE LOOKUP"))
    lines.append(box_row(f"Entries checked: {entries_checked:<5} Threshold: {c['similarity_threshold']:<6}"))
    lines.append(box_row(f"Best similarity: {c['best_similarity']:<6} Would hit: {str(c['would_hit_cache']):<6}"))
    if c['top_matches']:
        lines.append(box_row("Top matches:"))
        for match in c['top_matches'][:3]:
            hit = "✓" if match['would_hit'] else "✗"
            # Smart truncation for cached queries (limit to 45 chars)
            cached_query = truncate(match['cached_query'], 45)
            lines.append(box_row(f"  {hit} {match['similarity']:.4f} - {cached_query}"))
    lines.append(box_bottom)
    lines.append("")

    # RL Agent section
    r = explain_result['rl_agent']
    # Defensive truncation for state (30 chars) and best_action (20 chars)
    state_display = truncate(r['state'], 30)
    best_action_display = truncate(r['best_action'], 20)
    lines.append(box_top("RL AGENT"))
    lines.append(box_row(f"State: {state_display:<30} Epsilon: {r.get('epsilon', 0):<6}"))
    lines.append(box_row(f"Best action: {best_action_display}"))
    lines.append(box_row("Q-values:"))
    for action, qval in r['q_values'].items():
        # Truncate action names to 15 chars for alignment
        lines.append(box_row(f"  {truncate(action, 15):<15}: {qval:>8.4f}"))
    lines.append(box_bottom)
    lines.append("")

    # Execution strategy
    e = explain_result['execution_strategy']
    # Defensive truncation for strategy (20 chars) and recommendation (40 chars)
    strategy_display = truncate(e['strategy'], 20)
    recommendation_display = truncate(e['recommendation'], 40)
    lines.append(box_top("EXECUTION STRATEGY"))
    lines.append(box_row(f"Strategy: {strategy_display:<20} Est. latency: {e['estimated_latency']:<10}"))
    lines.append(box_row(f"Will cache: {str(e['will_cache_result'])}"))
    lines.append(box_row(f"Recommendation: {recommendation_display}"))
    lines.append(box_bottom)

    return "\n".join(lines)


def test_cache_persistence() -> Dict[str, Any]:
    """
    Test semantic cache persistence functionality

    Writes three entries through one SemanticCache, reloads them through a
    second instance, exercises JSON export and optimize_cache, then removes
    the files it created.

    Returns:
        Dict with 'test_passed' (True only when the reloaded cache has the
        same number of entries and every test query produced a cache hit),
        'entries_before_reload', 'entries_after_reload' and
        'persistence_working'.
    """
    print("\n" + "="*60)
    print("Testing Semantic Cache Persistence")
    print("="*60 + "\n")

    # Test 1: Create cache and add entries
    print("1. Creating cache and adding test entries...")
    cache1 = SemanticCache(cache_file="test_cache.pkl")
    # The constructor reloads whatever an earlier run left on disk; start
    # from an empty list so the entry counts below are meaningful
    cache1.cache.clear()

    test_queries = [
        ("SELECT * FROM users WHERE age > 25", "User data for age > 25"),
        ("SELECT name FROM products WHERE price < 100", "Product names under $100"),
        ("SELECT COUNT(*) FROM orders WHERE status = 'active'", "Active order count: 42")
    ]

    for query, result in test_queries:
        cache1.put(query, result)

    # Save cache after adding entries
    cache1.save_cache()

    stats1 = cache1.get_cache_stats()
    print(f"Cache stats after adding entries: {stats1}")

    # Test 2: Create new cache instance and verify persistence
    print("\n2. Creating new cache instance to test persistence...")
    cache2 = SemanticCache(cache_file="test_cache.pkl")

    stats2 = cache2.get_cache_stats()
    print(f"Cache stats after reload: {stats2}")

    # Test 3: Verify cache hits work after reload
    print("\n3. Testing cache hits after reload...")
    all_hits = True
    for query, expected_result in test_queries:
        cached_result = cache2.get(query)
        if cached_result:
            print(f"✓ Cache hit for: {query[:30]}...")
            print(f"  Result: {cached_result[:50]}...")
        else:
            all_hits = False
            print(f"✗ Cache miss for: {query[:30]}...")

    # Test 4: Test JSON export
    print("\n4. Testing JSON export...")
    export_path = "test_cache.json"
    cache2.save_cache_json(export_path)

    # Test 5: Test cache optimization
    print("\n5. Testing cache optimization...")
    cache2.optimize_cache(max_entries=2)

    # Cleanup
    print("\n6. Cleaning up test files...")
    cache2.clear()
    # Also remove the JSON files written above: the export in the working
    # directory and the JSON sibling of the cache file used by save_cache()
    leftovers = [export_path]
    primary = str(cache2.cache_path)
    if primary.endswith('.pkl'):
        leftovers.append(primary[:-len('.pkl')] + '.json')
    for leftover in leftovers:
        if os.path.exists(leftover):
            os.remove(leftover)

    persistence_working = stats1['total_entries'] == stats2['total_entries']
    return {
        'test_passed': persistence_working and all_hits,
        'entries_before_reload': stats1['total_entries'],
        'entries_after_reload': stats2['total_entries'],
        'persistence_working': persistence_working
    }


if __name__ == "__main__":
    # Manual smoke run: vectorization, persistence, then an EXPLAIN plan
    banner = "=" * 70

    print("Running vectorization test...")
    print(json.dumps(test_vectorization(), indent=2))

    print("\nRunning persistence test...")
    print(f"\nPersistence test result: {test_cache_persistence()}")

    # Test EXPLAIN functionality
    print(f"\n{banner}")
    print("Testing EXPLAIN Query Plan")
    print(banner)

    # Seed a cache so the plan has entries to compare against
    demo_cache = SemanticCache()
    seed_entries = (
        ("SELECT * FROM users WHERE age > 25", "User data result"),
        ("SELECT name FROM products WHERE price < 100", "Product names"),
    )
    for sql, payload in seed_entries:
        demo_cache.put(sql, payload)

    # Explain a query that is close to, but not identical with, a seeded one
    plan = explain_query_plan("SELECT * FROM users WHERE age > 30", demo_cache)
    print(format_explain_output(plan))