CNIQA_AGENTIC_101824v2

Runtime error

File size: 9,654 Bytes

import gradio as gr
from gradio_pdf import PDF
from gradio_client import Client, handle_file
import os

# Define your Hugging Face token (make sure to set it as an environment variable)
HF_TOKEN = os.getenv("HF_TOKEN")  # Replace with your actual token if not using an environment variable

# Initialize the Gradio Client for the specified API
client = Client("on1onmangoes/cnianswer101724v4", hf_token=HF_TOKEN)


client_name = ['primo','secondo','terzo','quarto4', 'quinto5', 'secondo6', 'sesto6', 'settimo7','ottavo8','nono9']



def stream_chat_with_rag(
    message: str,
    history: list,
    client_name: str,
    system_prompt: str,
    num_retrieved_docs: int = 10,
    num_docs_final: int = 9,
    temperature: float = 0, 
    max_new_tokens: int = 1024, 
    top_p: float = 1.0, 
    top_k: int = 20, 
    penalty: float = 1.2,
):
    print(f"Message: {message}")
    print(f"History: {history}")

    # Build the conversation prompt including system prompt and history
    conversation = f"{system_prompt}\n\nFor Client: {client_name}\n"
    
    # Add previous conversation history
    for user_input, assistant_response in history:
        conversation += f"User: {user_input}\nAssistant: {assistant_response}\n"
    
    # Add the current user message
    conversation += f"User: {message}\nAssistant:"

    # Call the API with the user's message
    question = message
    #answer = client.predict(question=question, api_name="/run_graph")
    answer = client.predict(question=question,selected_document=client_name, api_name="/get_answer")

    # Debugging: Print the raw response
    print("Raw answer from API:")
    print(answer)

    # Format the assistant's answer and the relevant documents separately
    formatted_answer = format_answer_string(answer)

    # Update the conversation history with the new message and answer
    history.append((message, formatted_answer))

    # Return the formatted answer
    return formatted_answer


def format_answer_string(answer: str):
    """
    This function extracts and formats the assistant's response before document metadata.
    Anything after the marker `[(` (where documents are listed) is ignored.
    """
    # Step 1: Split the response at the start of the document metadata
    split_marker = "[("
    if split_marker in answer:
        # Everything before the marker is the relevant answer
        answer_before_docs = answer.split(split_marker)[0]
    else:
        # If no documents metadata, return the entire answer
        answer_before_docs = answer
    
    # Step 2: Clean up formatting by replacing escaped newline characters
    formatted_answer = answer_before_docs.replace("\\n", "\n").strip()
    
    # Step 3: Remove potential starting and ending artifacts like (' and ,) if present
    if formatted_answer.startswith("(\"") and formatted_answer.endswith("\","):
        formatted_answer = formatted_answer[2:-2].strip()

    # Optional: Add a prefix for clarity
    formatted_answer = "Co-Pilot: " + formatted_answer
    
    return formatted_answer

def format_relevant_documents(relevant_docs: list):
    """
    This function formats the relevant document metadata and content for readable output.
    It extracts the heading, page number, and a snippet of the content from each document.
    """
    formatted_docs = "Relevant Documents:\n\n"
    
    for idx, (doc, score) in enumerate(relevant_docs):
        # Extract the relevant metadata
        heading = doc.metadata.get('heading', 'Unnamed Document')
        page_number = int(doc.metadata.get('page_number', -1))
        source = doc.metadata.get('source', 'Unknown Source')
        confidence = round(score, 4)  # Rounding the score for cleaner output
        
        # Add the formatted details to the output string
        formatted_docs += f"Document {idx + 1}:\n"
        formatted_docs += f"  - Heading: {heading}\n"
        formatted_docs += f"  - Page Number: {page_number}\n"
        formatted_docs += f"  - Source: {source}\n"
        formatted_docs += f"  - Confidence Score: {confidence}\n"
        
        # Optionally include a snippet from the content
        content_snippet = doc.page_content[:200]  # Take the first 200 characters for preview
        formatted_docs += f"  - Content Snippet: {content_snippet}...\n\n"

    return formatted_docs.strip()


# ------------------------------------- Core CNI APP ----------------------------------------------------------------------------------
# Function to handle PDF processing API call
def process_pdf(pdf_file, client_name):
    return client.predict(
        pdf_file=handle_file(pdf_file),
        #client_name=client_name,  # Hardcoded client name
        api_name="/process_pdf"
    )[1]  # Return only the result string

# # Function to handle search API call
# def search_api(query):
#     return client.predict(query=query, api_name="/search_with_confidence")

# Function to handle RAG API call
def rag_api(question, client_name):
    return client.predict(question=question,selected_document=client_name, api_name="/get_answer")

def delete_index():
    result = client.predict(api_name="/delete_index")
    return result


#-------------------------------------- View PDF ----------------------------------------------------------------------------------
def view_pdf(pdf):
    result = client.predict(api_name="/view_pdf_name")
    return result


#-------------------------------------- UX & Gradio -------------------------------------------------------------------------------

# CSS for custom styling
CSS = """
# chat-container {
    height: 100vh;
}
"""


    


# Title for the application
TITLE = "<h1 style='text-align:center;'>CNI RAG AGENTIC v0.2</h1>"

# Create the Gradio Blocks interface
with gr.Blocks(css=CSS) as demo:
    gr.HTML(TITLE)
    with gr.Tab("Chat"):
        chatbot = gr.Chatbot()  # Create a chatbot interface
        chat_interface = gr.ChatInterface(
            fn=stream_chat_with_rag,
            chatbot=chatbot,
            additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False, render=False),
            additional_inputs=[
                gr.Dropdown(client_name,value="primo",label="Select Client", render=False,allow_custom_value=True),
                gr.Textbox(
                    value="You are an expert assistant",
                    label="System Prompt",
                    render=False,
                ),
                gr.Slider(
                    minimum=1,
                    maximum=10,
                    step=1,
                    value=10,
                    label="Number of Initial Documents to Retrieve",
                    render=False,
                ),
                gr.Slider(
                    minimum=1,
                    maximum=10,
                    step=1,
                    value=9,
                    label="Number of Final Documents to Retrieve",
                    render=False,
                ),
                gr.Slider(
                    minimum=0.2,
                    maximum=1,
                    step=0.1,
                    value=0,
                    label="Temperature",
                    render=False,
                ),
                gr.Slider(
                    minimum=128,
                    maximum=8192,
                    step=1,
                    value=1024,
                    label="Max new tokens",
                    render=False,
                ),
                gr.Slider(
                    minimum=0.0,
                    maximum=1.0,
                    step=0.1,
                    value=1.0,
                    label="Top P",
                    render=False,
                ),
                gr.Slider(
                    minimum=1,
                    maximum=20,
                    step=1,
                    value=20,
                    label="Top K",
                    render=False,
                ),
                gr.Slider(
                    minimum=0.0,
                    maximum=2.0,
                    step=0.1,
                    value=1.2,
                    label="Repetition Penalty",
                    render=False,
                ),
            ],
        )


    with gr.Tab("Process PDF"):
        pdf_input = gr.File(label="Upload PDF File")
        #select_client_dropdown = gr.Dropdown(client_name, value="rosariarossi", label="Select or Type Client", allow_custom_value=True)
        pdf_output = gr.Textbox(label="PDF Result", interactive=False)
    
        pdf_button = gr.Button("Process PDF")
        pdf_button.click(
            process_pdf,
            inputs=[pdf_input],  # Pass both PDF and client name is not required 
            outputs=pdf_output
        )

    with gr.Tab("Answer with RAG"):
        question_input = gr.Textbox(label="Enter Question for RAG")
        answer_with_rag_select_client_dropdown = gr.Dropdown(client_name, value="primo", label="Select or Type Client", allow_custom_value=True)
        rag_output = gr.Textbox(label="RAG Answer Result", interactive=False)

        rag_button = gr.Button("Get Answer")
        rag_button.click(
            rag_api,
            inputs=[question_input,answer_with_rag_select_client_dropdown ],
            outputs=rag_output
        )
    with gr.Tab(label="Manage Files"):
        with gr.Column():
            delete_index_button = gr.Button("Delete All Files")
            delete_index_textout = gr.Textbox(label="Deleted Files and Refresh Result")
            delete_index_button.click(fn=delete_index, inputs=[],outputs=[delete_index_textout])

# Launch the app
if __name__ == "__main__":
    demo.launch()