# ltu-chat / app.py
import streamlit as st
import os
import logging
from typing import List
from haystack import Document  # retrieved docs are Haystack Documents (.content, .meta)
from data_processor import load_json_data, process_documents, split_documents
from rag_pipeline import RAGPipeline
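# Interface assumed for RAGPipeline (inferred from its use in this file, not
# verified against rag_pipeline.py):
#   RAGPipeline(embedding_model_name, llm_model_name, qdrant_path)
#   index_documents(docs)                 - embed and store chunked documents
#   query(prompt, top_k=...) -> dict      - returns {"answer": str, "documents": [...]}
#   get_document_count() -> int           - number of documents in the vector store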
# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# Constants
DATA_PATH = "ltu_programme_data.json"
QDRANT_PATH = "./qdrant_data"
EMBEDDING_MODEL = "BAAI/bge-en-icl"
LLM_MODEL = "meta-llama/Llama-3.3-70B-Instruct"
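# Assumption: EMBEDDING_MODEL produces 4096-dimensional vectors (bge-en-icl is
# Mistral-7B-based), matching embedding_dim=4096 in check_documents_indexed() below.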
# Initialize session state
if "messages" not in st.session_state:
    st.session_state.messages = []
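# st.cache_resource creates this object once per server process and shares it
# across reruns and sessions, so the models and Qdrant client are not
# re-instantiated on every interaction.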
@st.cache_resource
def get_rag_pipeline():
    """Create and cache the RAG pipeline."""
    return RAGPipeline(
        embedding_model_name=EMBEDDING_MODEL,
        llm_model_name=LLM_MODEL,
        qdrant_path=QDRANT_PATH,
    )
def load_and_index_documents(rag_pipeline: RAGPipeline) -> bool:
    """Load, process, chunk, and index documents. Returns True on success."""
    if not os.path.exists(DATA_PATH):
        st.error(f"Data file not found: {DATA_PATH}")
        return False

    with st.spinner("Loading and processing documents..."):
        # Load data
        data = load_json_data(DATA_PATH)
        if not data:
            st.error("Failed to load data")
            return False

        # Process documents
        processed_docs = process_documents(data)
        if not processed_docs:
            st.error("Failed to process documents")
            return False

        # Split into chunks (chunk_size=1000, overlap=100) so information at
        # chunk boundaries is not lost
        chunked_docs = split_documents(processed_docs, chunk_size=1000, overlap=100)
        if not chunked_docs:
            st.error("Failed to split documents")
            return False

    # Index documents
    with st.spinner(f"Indexing {len(chunked_docs)} document chunks..."):
        rag_pipeline.index_documents(chunked_docs)

    return True
def display_document_sources(documents: List[Document]):
    """Display the sources (URL and excerpt) of the retrieved documents."""
    if documents:
        with st.expander("View Sources"):
            for i, doc in enumerate(documents):
                st.markdown(f"**Source {i+1}**: [{doc.meta.get('url', 'Unknown')}]({doc.meta.get('url', '#')})")
                st.markdown(f"**Excerpt**: {doc.content[:200]}...")
                st.markdown("---")
def check_documents_indexed(qdrant_path: str) -> int:
    """Return the number of documents already indexed in Qdrant (0 on any error)."""
    try:
        from haystack_integrations.document_stores.qdrant import QdrantDocumentStore

        # Open the existing store; embedding_dim must match the model used at
        # indexing time, and recreate_index=False preserves the existing data
        document_store = QdrantDocumentStore(
            path=qdrant_path,
            embedding_dim=4096,
            recreate_index=False,
            index="ltu_documents",
        )
        # An empty filter matches every document, so its length is the total count
        document_count = len(document_store.filter_documents({}))
        return document_count
    except Exception:
        # If Qdrant is not initialized yet (or the path is missing), report 0
        return 0
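# Note: main() below uses rag_pipeline.get_document_count() rather than this
# helper; opening a second QdrantDocumentStore on the same local path can
# conflict with the store already held by the pipeline, since local Qdrant
# locks its storage directory to a single client.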
def main():
    # Set page config
    st.set_page_config(
        page_title="LTU Chat - QA App",
        page_icon="πŸŽ“",
        layout="wide"
    )

    # Header
    st.title("πŸŽ“ LTU Chat - QA App")
    st.markdown("""
Ask questions about LTU programmes and get answers powered by AI.
This app uses RAG (Retrieval Augmented Generation) to provide accurate information.
""")

    rag_pipeline = get_rag_pipeline()

    # Sidebar
    with st.sidebar:
        st.header("Settings")
        # Check if documents are already indexed
        documents_indexed = rag_pipeline.get_document_count()
        if not documents_indexed:
            if st.button("Index Documents"):
                success = load_and_index_documents(rag_pipeline)
                if success:
                    st.success("Documents indexed successfully!")
                    # Refresh the documents_indexed status
                    documents_indexed = True
                    # Get document count
                    count = rag_pipeline.get_document_count()
                    st.info(f"Indexed {count} document chunks in the vector store.")
        else:
            st.success(f"{documents_indexed} documents are indexed and ready!")

        top_k = st.slider("Number of documents to retrieve", min_value=1, max_value=10, value=5)

        # Work in progress
        st.title("Work in progress")
        st.toggle("Hybrid retrieval", disabled=True)
        st.toggle("Self RAG", disabled=True)
        st.toggle("Query Expansion", disabled=True)
        st.toggle("Graph RAG", disabled=True)
        st.toggle("Prompt engineering (CoT, Step-Back Prompt, Active Prompt)", disabled=True)
    # Display chat messages
    for message in st.session_state.messages:
        with st.chat_message(message["role"]):
            st.markdown(message["content"])
            if message.get("documents"):
                display_document_sources(message["documents"])

    # Chat input
    if prompt := st.chat_input("Ask a question about LTU programmes"):
        # Add user message to chat history
        st.session_state.messages.append({"role": "user", "content": prompt})

        # Display user message
        with st.chat_message("user"):
            st.markdown(prompt)

        # Generate response
        if rag_pipeline and documents_indexed:
            with st.chat_message("assistant"):
                with st.spinner("Thinking..."):
                    # Query the RAG pipeline
                    result = rag_pipeline.query(prompt, top_k=top_k)

                    # Display the answer
                    st.markdown(result["answer"])

                    # Display sources
                    if result.get("documents"):
                        display_document_sources(result["documents"])

                    # Add assistant message to chat history
                    st.session_state.messages.append({
                        "role": "assistant",
                        "content": result["answer"],
                        "documents": result.get("documents", [])
                    })
        else:
            with st.chat_message("assistant"):
                if not rag_pipeline:
                    error_message = "Please initialize the RAG pipeline first."
                else:
                    error_message = "Please index documents first."
                st.error(error_message)
                st.session_state.messages.append({"role": "assistant", "content": error_message})
if __name__ == "__main__":
    main()
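# Run locally with: streamlit run app.py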