# NOTE(review): removed non-source artifacts from a broken paste/export
# ("Spaces:" header and two "Runtime error" lines) — they were not part of the test module.
| """ | |
| Integration tests for RAG Pipeline application. | |
| Tests actual components without mocking for real confidence. | |
| """ | |
| import pytest | |
| import asyncio | |
| import time | |
| from fastapi.testclient import TestClient | |
| from app.main import app, rag_qa | |
| from app.pipeline import RAGPipeline | |
| # Test client | |
| client = TestClient(app) | |
class TestRealIntegration:
    """Integration tests using actual components (no mocks).

    Every test builds a real ``RAGPipeline`` from the ``developer-portfolio``
    preset, so these tests exercise dataset loading, embedding, retrieval,
    and (in the chat test) real outbound API calls.
    """

    def test_real_rag_pipeline_creation(self):
        """Test creating real RAG pipeline with actual dataset."""
        # This test uses real components but minimal dataset.
        pipeline = RAGPipeline.from_preset('developer-portfolio')

        # Verify real pipeline was created.
        assert pipeline is not None
        assert hasattr(pipeline, 'config')
        assert hasattr(pipeline, 'documents')
        assert len(pipeline.documents) > 0

        # Verify document structure.
        first_doc = pipeline.documents[0]
        assert hasattr(first_doc, 'content')
        assert hasattr(first_doc, 'meta')
        assert 'question' in first_doc.meta
        assert 'answer' in first_doc.meta

    def test_real_rag_question_answering(self):
        """Test actual RAG question answering."""
        pipeline = RAGPipeline.from_preset('developer-portfolio')

        # Ask a real question.
        question = "What is your current role?"
        result = pipeline.answer_question(question)

        # Verify we get a meaningful response.
        assert result is not None
        assert len(result) > 100  # Should be substantial
        assert 'role' in result.lower() or 'tech lead' in result.lower()

    def test_rag_qa_function_with_real_pipeline(self):
        """Test rag_qa function with actual loaded pipeline."""
        # Import and modify the global pipelines registry for this test.
        from app.main import pipelines
        original_pipelines = pipelines.copy()
        try:
            # Load a real pipeline and register it under the preset key.
            test_pipeline = RAGPipeline.from_preset('developer-portfolio')
            pipelines['developer-portfolio'] = test_pipeline

            # Test the rag_qa function.
            result = rag_qa("What is your experience?", "developer-portfolio")

            # Verify real results.
            assert result is not None
            assert len(result) > 50
            assert "still loading" not in result.lower()
        finally:
            # Restore original pipelines so other tests see a clean registry.
            pipelines.clear()
            pipelines.update(original_pipelines)

    def test_chat_endpoint_with_real_components(self):
        """Test chat endpoint with actual OpenRouter client."""
        # This test makes real API calls but uses simple requests.
        request_data = {
            "messages": [
                {"role": "user", "content": "Hello! Can you help me?"}
            ]
        }
        response = client.post("/chat", json=request_data)

        # Should get a response (may fail if API issues, but structure should be correct).
        assert response.status_code in [200, 500]  # 500 if API issues
        if response.status_code == 200:
            data = response.json()
            assert "response" in data
            assert "tool_calls" in data
            # For a simple greeting, probably no tool calls.
            assert isinstance(data["tool_calls"], (type(None), list))

    def test_dataset_loading_performance(self):
        """Test that dataset loading completes in reasonable time."""
        start_time = time.time()
        # Load pipeline and time it.
        pipeline = RAGPipeline.from_preset('developer-portfolio')
        load_time = time.time() - start_time

        # Should load in under 30 seconds (even with embeddings).
        assert load_time < 30.0
        assert len(pipeline.documents) > 0

        # Verify embedding machinery was created.
        assert hasattr(pipeline, 'document_store')
        assert hasattr(pipeline, 'retriever')

    def test_pipeline_document_structure(self):
        """Test that loaded documents have expected structure."""
        pipeline = RAGPipeline.from_preset('developer-portfolio')

        # Check document metadata.
        for doc in pipeline.documents[:5]:  # Check first 5 docs
            assert hasattr(doc, 'content')
            assert hasattr(doc, 'meta')
            assert doc.content is not None
            assert len(doc.content) > 0

            # Check expected metadata fields.
            meta = doc.meta
            assert isinstance(meta, dict)
            # Should have question and answer from the dataset.
            if 'question' in meta:
                assert isinstance(meta['question'], str)
            if 'answer' in meta:
                assert isinstance(meta['answer'], str)

    def test_multiple_different_questions(self):
        """Test pipeline with multiple different questions."""
        pipeline = RAGPipeline.from_preset('developer-portfolio')
        questions = [
            "What is your current role?",
            "What technologies do you use?",
            "Tell me about your experience"
        ]
        results = []
        for question in questions:
            result = pipeline.answer_question(question)
            results.append(result)

        # Should get different responses for different questions.
        assert len(results) == len(questions)

        # Results should be different (not identical).
        for i in range(len(results)):
            for j in range(i + 1, len(results)):
                # Allow some similarity but not exact matches
                # (word-overlap heuristic, not a true similarity metric).
                similarity = len(set(results[i].split()) & set(results[j].split()))
                assert similarity < len(results[i].split()) * 0.8  # Less than 80% similar

    def test_error_handling_with_real_pipeline(self):
        """Test error handling with real pipeline."""
        pipeline = RAGPipeline.from_preset('developer-portfolio')

        # Test with empty question — should be handled gracefully,
        # not raise, and still return a non-empty string.
        result = pipeline.answer_question("")
        assert result is not None
        assert len(result) > 0

    def test_config_access(self):
        """Test that pipeline configuration is accessible."""
        pipeline = RAGPipeline.from_preset('developer-portfolio')

        # Verify config properties exist.
        assert hasattr(pipeline, 'config')
        config = pipeline.config
        assert hasattr(config, 'name')
        assert hasattr(config, 'content_field')
        assert hasattr(config, 'prompt_template')

        # Verify specific config values for this preset.
        assert config.name == 'syntaxhacker/developer-portfolio-rag'
        assert config.content_field == 'answer'
        assert config.prompt_template is not None
class TestSystemIntegration:
    """Test system-level integration: app wiring, client config, tool schema."""

    def test_fastapi_app_startup(self):
        """Test that FastAPI app starts correctly."""
        # Test app import and basic structure.
        from app.main import app
        assert app is not None
        assert hasattr(app, 'routes')

        # Check that our endpoints are registered.
        route_paths = [route.path for route in app.routes]
        assert '/chat' in route_paths
        assert '/answer' in route_paths
        assert '/health' in route_paths
        assert '/datasets' in route_paths

    def test_openrouter_client_configuration(self):
        """Test OpenRouter client is properly configured."""
        from app.main import openrouter_client, MODEL_NAME
        assert openrouter_client is not None
        assert hasattr(openrouter_client, 'base_url')
        assert hasattr(openrouter_client, 'api_key')

        # Check model configuration.
        assert MODEL_NAME == "z-ai/glm-4.5-air:free"
        assert str(openrouter_client.base_url) == "https://openrouter.ai/api/v1/"

    def test_tools_configuration_structure(self):
        """Test that tools are properly configured for real use."""
        from app.main import TOOLS
        assert isinstance(TOOLS, list)
        assert len(TOOLS) > 0

        # Find the rag_qa tool entry and validate its JSON-schema structure.
        rag_tool = None
        for tool in TOOLS:
            if tool['function']['name'] == 'rag_qa':
                rag_tool = tool
                break
        assert rag_tool is not None
        assert 'parameters' in rag_tool['function']
        assert 'properties' in rag_tool['function']['parameters']
        assert 'question' in rag_tool['function']['parameters']['properties']
| if __name__ == "__main__": | |
| pytest.main([__file__, "-v", "-s"]) |