import faiss
import pickle
import os
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
from langchain.llms import HuggingFacePipeline
from langchain.vectorstores import FAISS as LangChainFAISS
from langchain.docstore import InMemoryDocstore
from langchain.schema import Document
from langchain.chains import RetrievalQA
from langchain.embeddings import HuggingFaceEmbeddings
import gradio as gr
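# NOTE: these import paths target the pre-0.1 LangChain layout; newer releases moved
# HuggingFacePipeline, FAISS, and HuggingFaceEmbeddings into langchain_community
# (and later langchain_huggingface), so pin an older langchain version to reuse this script as-is.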
# Paths (relative to app root)
vector_path = "vector_store_faiss_chroma/faiss_index.index"
metadata_path = "vector_store_faiss_chroma/metadata.pkl"
#model_path = "HuggingFaceModels/falcon-1b-instruct"
#model_path = "tiiuae/Falcon3-1B-Instruct"
#model_path = "TinyLlama/TinyLlama-1.1B-Chat-v1.0"
#model_path = "mistralai/Mistral-7B-Instruct-v0.1"
#model_path = "microsoft/phi-2"
model_path = "tiiuae/falcon-rw-1b"
# Load the FAISS index
faiss_index = faiss.read_index(vector_path)
# Load metadata (text chunks)
with open(metadata_path, "rb") as f:
    metadata = pickle.load(f)
# Rebuild LangChain Documents
docs = [Document(page_content=doc["page_content"]) for doc in metadata]
# Link documents to FAISS vectors
docstore = InMemoryDocstore({str(i): docs[i] for i in range(len(docs))})
id_map = {i: str(i) for i in range(len(docs))}
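# This mapping assumes the metadata list is stored in the same order as the vectors
# in the FAISS index, so vector position i resolves to docstore key str(i).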
# Load the tokenizer and model
tokenizer = AutoTokenizer.from_pretrained(model_path)
model = AutoModelForCausalLM.from_pretrained(model_path)
# Create a generation pipeline
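# return_full_text=False returns only the newly generated tokens (not the prompt),
# and max_new_tokens caps the length of each answer.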
text_generator_pipeline = pipeline(
    model=model,
    tokenizer=tokenizer,
    task="text-generation",
    return_full_text=False,
    max_new_tokens=128,
    do_sample=True,  # temperature has no effect unless sampling is enabled
    temperature=0.2,
)
# Wrap it as a LangChain LLM
llm = HuggingFacePipeline(pipeline=text_generator_pipeline)
# Re-declare embedding function
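# This must be the same embedding model used when the FAISS index was built,
# otherwise query vectors will not live in the same space as the stored chunk vectors.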
embed_fn = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
# Create vectorstore and retriever
vectorstore_faiss = LangChainFAISS(
    index=faiss_index,
    docstore=docstore,
    index_to_docstore_id=id_map,
    embedding_function=embed_fn  # used to embed incoming queries at search time
)
# Create a retriever that returns top-k most relevant chunks
retriever = vectorstore_faiss.as_retriever(search_kwargs={"k": 2})
# Create the RAG pipeline (Retriever + LLM)
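# chain_type="stuff" concatenates all retrieved chunks into a single prompt, and
# return_source_documents=True exposes those chunks so the UI can cite them.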
qa_chain = RetrievalQA.from_chain_type(
    llm=llm,
    chain_type="stuff",
    retriever=retriever,
    return_source_documents=True
)
# Chatbot function: takes a user question and returns the generated answer
def ask_rag(query):
    result = qa_chain({"query": query})
    answer = result["result"]
    # Optional: include sources (limited to 2)
    sources = result.get("source_documents", [])
    source_texts = "\n\n".join(
        [f"Source {i+1}:\n{doc.page_content[:300]}..." for i, doc in enumerate(sources[:2])]
    )
    return f"Answer:\n{answer}\n\nSources:\n{source_texts}"
# Gradio UI components
gr.Interface(
    fn=ask_rag,
    inputs=gr.Textbox(lines=2, placeholder="Ask me about UCT admissions, housing, fees..."),
    outputs="text",
    title="University of Cape Town Course Advisor Chatbot",
    description="""
Ask any academic-related question about the University of Cape Town: admissions, programs, housing, fees, or wellness services.
This chatbot uses a Retrieval-Augmented Generation (RAG) pipeline powered by:
- FAISS for semantic search
- Falcon RW 1B for natural language answers
- LangChain for orchestration
Developed by **Serge Tsimba**, Data Science Consultant at **Amdari**/Canada.
Available 24/7. Start by asking: "How can international students apply to UCT?"
""",
    allow_flagging="never"
).launch()