RAG-evaluator/quick_test.py at main · SDdev96/RAG-evaluator · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
#!/usr/bin/env python3
"""
Test rapido del sistema RAG per verificare che tutti i componenti funzionino
"""
import os
import sys
from pathlib import Path
from dotenv import load_dotenv

# Carica variabili d'ambiente
load_dotenv()

def test_imports():
    """Test degli import di tutti i moduli"""
    print("🔍 Testing imports...")

    try:
        from config.config import get_default_config
        print("✅ Config module")

        from src.document_processing import create_processor
        print("✅ Document processing module (Docling)")

        from src.chunking.semantic_chunker import create_semantic_chunker
        print("✅ Semantic chunking module")

        from src.query_handling.query_transformations import create_query_transformer
        print("✅ Query Transformations module")

        from src.retrieval.fusion_retriever import create_fusion_retriever
        print("✅ Fusion retrieval module")

        from src.generation.gemini_generator import create_gemini_generator
        print("✅ Gemini generation module")

        from src.pipeline.advanced_rag_pipeline import create_rag_pipeline
        print("✅ Pipeline module")

        from src.utils.logging_config import setup_logging
        from src.utils.helpers import validate_api_keys
        print("✅ Utils modules")

        return True

    except ImportError as e:
        print(f"❌ Import error: {e}")
        return False


def test_api_keys():
    """Test delle API keys"""
    print("\n🔑 Testing API keys...")

    from src.utils.helpers import validate_api_keys

    required_keys = ["GOOGLE_API_KEY"]
    validation = validate_api_keys(required_keys)

    all_valid = True
    for key, is_valid in validation.items():
        if is_valid:
            print(f"✅ {key} configurata")
        else:
            print(f"❌ {key} mancante")
            all_valid = False

    return all_valid


def test_configuration():
    """Test della configurazione"""
    print("\n⚙️ Testing configuration...")

    try:
        from config.config import get_default_config

        config = get_default_config()
        print(f"✅ Configurazione caricata")
        print(f"  - Document processing: {config.document_processing.input_dir}")
        print(f"  - Chunking method: {config.chunking.chunking_method} - {config.chunking.breakpoint_threshold_type}")
        print(f"  - Query transformations: decompose={config.query_transformations.enable_decompose}, rewrite={config.query_transformations.enable_rewrite}, expand={config.query_transformations.enable_expand}")
        print(f"  - Fusion weights: {config.fusion_retrieval.vector_weight}/{config.fusion_retrieval.bm25_weight}")
        print(f"  - Generation model: {config.generation.model_name}")

        return True

    except Exception as e:
        print(f"❌ Configuration error: {e}")
        return False


def test_document_processing():
    """Test del document processing"""
    print("\n📄 Testing document processing...")

    try:
        from src.document_processing import create_processor
        from config.config import DocumentProcessingConfig

        # Controlla se esiste il PDF di test
        pdf_path = Path("data/X.AMN.PNRR.U.001.07.00 Manuale utente IoT Control Plane.pdf")

        if not pdf_path.exists():
            print(f"⚠️ PDF di test non trovato: {pdf_path}")
            print("   Creando un documento di test...")

            # Crea un documento di test semplice
            test_doc_path = Path("data/test_document.txt")
            test_doc_path.parent.mkdir(exist_ok=True)

            with open(test_doc_path, 'w', encoding='utf-8') as f:
                f.write("""# Documento di Test per Sistema RAG

                    ## Introduzione
                    Questo è un documento di test per verificare il funzionamento del sistema RAG avanzato.

                    ## Configurazione Sistema
                    Per configurare il sistema IoT Control Plane, seguire questi passaggi:
                    1. Installare il software base
                    2. Configurare le credenziali di accesso
                    3. Verificare la connessione di rete

                    ## Risoluzione Problemi
                    In caso di errori di connessione:
                    - Verificare le impostazioni di rete
                    - Controllare le credenziali
                    - Riavviare il servizio se necessario

                    ## Monitoraggio
                    Il sistema fornisce strumenti di monitoraggio per:
                    - Stato delle connessioni
                    - Performance del sistema
                    - Log degli eventi
                    """)

            pdf_path = test_doc_path

        # Test del processor
        config = DocumentProcessingConfig()
        processor = create_processor(config)

        processed_doc = processor.process_document(str(pdf_path))

        print(f"✅ Documento processato: {processed_doc.metadata.get('title', 'Unknown')}")
        print(f"  - Contenuto: {len(processed_doc.content)} caratteri")
        print(f"  - Metodo: {processed_doc.metadata.get('processing_method', 'Unknown')}")

        return True, processed_doc

    except Exception as e:
        print(f"❌ Document processing error: {e}")
        return False, None


def test_semantic_chunking(processed_doc):
    """Test del semantic chunking"""
    print("\n🔪 Testing semantic chunking...")

    try:
        from src.chunking.semantic_chunker import create_semantic_chunker
        from config.config import ChunkingConfig, get_default_config
        from src.embeddings.provider import EmbeddingsProvider

        if not processed_doc:
            print("❌ Nessun documento processato disponibile")
            return False, []

        config = ChunkingConfig()
        # Inizializza provider centralizzato dagli defaults
        rag_cfg = get_default_config()
        provider = EmbeddingsProvider.get(rag_cfg.embeddings)
        chunker = create_semantic_chunker(config, embeddings_provider=provider)

        # Usa un testo più breve per il test se necessario
        test_content = processed_doc.content[:2000] if len(processed_doc.content) > 2000 else processed_doc.content

        chunks = chunker.chunk_text(test_content, {"source": "test"})

        print(f"✅ Creati {len(chunks)} chunks semantici")
        if chunks:
            print(f"  - Chunk medio: {sum(len(c.content) for c in chunks) // len(chunks)} caratteri")
            print(f"  - Metodo: {chunks[0].metadata.get('chunking_method', 'Unknown')}")

        return True, chunks

    except Exception as e:
        print(f"❌ Semantic chunking error: {e}")
        return False, []


def test_basic_pipeline():
    """Test base della pipeline senza API calls costose"""
    print("\n🔧 Testing basic pipeline initialization...")

    try:
        from src.pipeline.advanced_rag_pipeline import create_rag_pipeline
        from config.config import get_default_config

        config = get_default_config()

        # Modifica config per test più veloce
        config.query_transformations.max_transformations = 3  # Riduci per test

        pipeline = create_rag_pipeline(config)

        print("✅ Pipeline inizializzata correttamente")
        print(f"  - Document processor: {type(pipeline.doc_processor).__name__}")
        print(f"  - Chunker: {type(pipeline.chunker).__name__}")
        print(f"  - Query transformer: {type(pipeline.query_transformer).__name__}")
        print(f"  - Retriever: {type(pipeline.retriever).__name__}")
        print(f"  - Generator: {type(pipeline.generator).__name__}")

        return True, pipeline

    except Exception as e:
        print(f"❌ Pipeline initialization error: {e}")
        return False, None


def test_langfuse_chain_invoke():
    """Test minimale di integrazione Langfuse con una chain LangChain usando CallbackHandler.

    Crea una piccola catena (echo) e invoca chain.invoke con il callback di Langfuse.
    Se le credenziali Langfuse non sono configurate, il test viene segnalato come 'skipped'.
    """
    print("\n🧪 Testing Langfuse + LangChain chain.invoke...")
    try:
        from src.telemetry.langfuse_setup import init_langfuse
        from langchain_core.runnables import RunnableLambda
    except ImportError as e:
        print(f"❌ Import error (LangChain/Langfuse): {e}")
        return False, False

    # Inizializza Langfuse (client e handler)
    langfuse, handler = init_langfuse()
    if handler is None:
        print("ℹ️ Langfuse non configurato (manca LANGFUSE_PUBLIC_KEY/SECRET_KEY). Test saltato.")
        return True, False

    try:
        # Piccola chain di test: echo dell'input
        def _echo(inputs: dict):
            text = inputs.get("input", "")
            return {"output": f"Echo: {text}"}

        chain = RunnableLambda(_echo)

        # Invoca con il callback Langfuse
        result = chain.invoke({"input": "hello from quick_test"}, config={"callbacks": [handler]})
        ok = isinstance(result, dict) and "output" in result
        if ok:
            print(f"✅ chain.invoke eseguito. Output: {result['output']}")
            return True, True
        else:
            print("❌ chain.invoke non ha prodotto output atteso")
            return False, True
    except Exception as e:
        print(f"❌ Errore nell'invocazione chain.invoke con Langfuse: {e}")
        return False, True


def test_langfuse_gemini_langchain():
    """Test di integrazione Langfuse con il modello Gemini via LangChain.

    - Usa ChatGoogleGenerativeAI (pacchetto: langchain-google-genai)
    - Invia un prompt semplice e verifica la risposta
    - Collega il CallbackHandler di Langfuse alla invocazione
    Se le credenziali Langfuse non sono configurate, il test viene segnalato come 'skipped'.
    Se il pacchetto langchain-google-genai non è installato, il test fallisce in modo esplicito con suggerimento.
    """
    print("\n🧪 Testing Langfuse + LangChain Gemini (ChatGoogleGenerativeAI)...")
    try:
        from src.telemetry.langfuse_setup import init_langfuse
        from langchain_google_genai import ChatGoogleGenerativeAI
        from config.config import get_default_config
    except ImportError as e:
        print(f"❌ Import error: {e}")
        print("   Assicurati di avere installato 'langchain-google-genai'.")
        return False, False

    # Inizializza Langfuse (client e handler)
    langfuse, handler = init_langfuse()
    if handler is None:
        print("ℹ️ Langfuse non configurato (manca LANGFUSE_PUBLIC_KEY/SECRET_KEY). Test saltato.")
        return True, False

    # Crea il modello Gemini tramite LangChain usando la configurazione
    try:
        rag_cfg = get_default_config()
        gen_cfg = rag_cfg.generation
        model = ChatGoogleGenerativeAI(
            model=gen_cfg.model_name,
            temperature=gen_cfg.temperature,
            max_output_tokens=gen_cfg.max_tokens,
            top_p=gen_cfg.top_p,
            top_k=gen_cfg.top_k,
        )

        # Prompt semplice di test
        prompt = "Di' ciao dal quick_test con Langfuse!"

        # Invoca il modello con il callback di Langfuse
        result = model.invoke(prompt, config={"callbacks": [handler]})

        # result è un AIMessage; verifichiamo che abbia del contenuto
        content = getattr(result, "content", None)
        if content and isinstance(content, str) and content.strip():
            print(f"✅ Gemini LangChain invoke eseguito (model={gen_cfg.model_name}). Output: {content[:120]}...")
            return True, True
        else:
            print("❌ Nessun contenuto prodotto dal modello Gemini via LangChain")
            return False, True
    except Exception as e:
        print(f"❌ Errore nell'invocazione Gemini LangChain con Langfuse: {e}")
        return False, True

def main():
    """Test principale"""
    print("🚀 QUICK TEST - Sistema RAG Avanzato")
    print("=" * 50)

    # Test degli import
    if not test_imports():
        print("\n❌ Test fallito: problemi con gli import")
        sys.exit(1)

    # Test API keys
    api_keys_ok = test_api_keys()
    if not api_keys_ok:
        print("\n⚠️ API keys mancanti - alcuni test potrebbero fallire")

    # Test configurazione
    if not test_configuration():
        print("\n❌ Test fallito: problemi con la configurazione")
        sys.exit(1)

    # Test document processing
    doc_ok, processed_doc = test_document_processing()
    if not doc_ok:
        print("\n❌ Test fallito: problemi con document processing")
        sys.exit(1)

    # Test semantic chunking
    chunk_ok, chunks = test_semantic_chunking(processed_doc)
    if not chunk_ok:
        print("\n⚠️ Warning: problemi con semantic chunking")

    # Test basic pipeline
    pipeline_ok, pipeline = test_basic_pipeline()
    if not pipeline_ok:
        print("\n❌ Test fallito: problemi con la pipeline")
        sys.exit(1)

    # Prompt per eseguire i test Langfuse
    try:
        answer = input("\n❓ Do you want to test Langfuse? [y/n]: ").strip().lower()
    except Exception:
        answer = "n"

    # Inizializza i flag di default
    lf_invoke_ok, lf_configured = False, False
    lf_gemini_ok, lf_gemini_configured = False, False

    if answer == "y" :
        # Test Langfuse + chain.invoke (non bloccante se non configurato)
        lf_invoke_ok, lf_configured = test_langfuse_chain_invoke()

        # Test Langfuse + LangChain Gemini (non bloccante se non configurato)
        lf_gemini_ok, lf_gemini_configured = test_langfuse_gemini_langchain()
    else:
        print("\nℹ️ Test Langfuse saltati per scelta utente.")

    # Riepilogo
    print("\n" + "=" * 50)
    print("📊 RIEPILOGO TEST")
    print("=" * 50)
    print("✅ Import modules: OK")
    print(f"{'✅' if api_keys_ok else '⚠️'} API Keys: {'OK' if api_keys_ok else 'Parziale'}")
    print("✅ Configuration: OK")
    print("✅ Document Processing: OK")
    print("✅ Semantic Chunking: OK" if chunk_ok else "⚠️ Semantic Chunking: Issues")
    print("✅ Pipeline Initialization: OK")
    if answer == "y":
        if lf_configured:
            print("✅ Langfuse chain.invoke: OK" if lf_invoke_ok else "❌ Langfuse chain.invoke: Error")
        else:
            print("ℹ️ Langfuse chain.invoke: Non configurato (test saltato)")
        if lf_gemini_configured:
            print("✅ Langfuse + Gemini (LangChain): OK" if lf_gemini_ok else "❌ Langfuse + Gemini (LangChain): Error")
        else:
            print("ℹ️ Langfuse + Gemini (LangChain): Non configurato o dipendenze mancanti (test saltato)")
    else:
        print("ℹ️ Langfuse: test saltati per scelta utente")

    if api_keys_ok:
        print("\n🎉 Tutti i test superati! Il sistema è pronto per l'uso.")
        print("\nPer testare completamente il sistema:")
        print("  python main.py --docs data/ --interactive")
    else:
        print("\n⚠️ Test base superati, ma configura le API keys per funzionalità complete.")
        print("\nConfigura nel file .env:")
        print("  GOOGLE_API_KEY=your_key_here")
        print("  # Opzionale per Hugging Face (modelli privati o limiti più alti):")
        print("  HUGGINGFACEHUB_API_TOKEN=your_hf_token_here")

    print("\n📚 Per maggiori informazioni consulta il README.md")


if __name__ == "__main__":
    main()