Spaces:
Runtime error
Runtime error
import gradio as gr | |
from sentence_transformers import SentenceTransformer, util | |
from transformers import pipeline, GPT2Tokenizer | |
import os | |
# Define paths and models | |
filename = "output_country_details.txt" # Adjust the filename as needed | |
retrieval_model_name = 'output/sentence-transformer-finetuned/' | |
gpt2_model_name = "gpt2" # GPT-2 model | |
tokenizer = GPT2Tokenizer.from_pretrained("gpt2") | |
# Load models | |
try: | |
retrieval_model = SentenceTransformer(retrieval_model_name) | |
gpt_model = pipeline("text-generation", model=gpt2_model_name) | |
print("Models loaded successfully.") | |
except Exception as e: | |
print(f"Failed to load models: {e}") | |
# Load and preprocess text from the country details file | |
def load_and_preprocess_text(filename): | |
try: | |
with open(filename, 'r', encoding='utf-8') as file: | |
segments = [line.strip() for line in file if line.strip()] | |
print("Text loaded and preprocessed successfully.") | |
return segments | |
except Exception as e: | |
print(f"Failed to load or preprocess text: {e}") | |
return [] | |
segments = load_and_preprocess_text(filename) | |
def find_relevant_segment(user_query, segments): | |
try: | |
query_embedding = retrieval_model.encode(user_query) | |
segment_embeddings = retrieval_model.encode(segments) | |
similarities = util.pytorch_cos_sim(query_embedding, segment_embeddings)[0] | |
best_idx = similarities.argmax() | |
print("Relevant segment found:", segments[best_idx]) | |
return segments[best_idx] | |
except Exception as e: | |
print(f"Error finding relevant segment: {e}") | |
return "" | |
def generate_response(user_query, relevant_segment): | |
try: | |
# Construct the prompt with the user query | |
prompt = f"Thank you for your question! this is an additional fact about your topic: {relevant_segment}" | |
# Generate response with adjusted max_length for completeness | |
max_tokens = len(tokenizer(prompt)['input_ids']) + 50 | |
response = gpt_model(prompt, max_length=max_tokens, temperature=0.25)[0]['generated_text'] | |
# Clean and format the response | |
response_cleaned = clean_up_response(response, relevant_segment) | |
return response_cleaned | |
except Exception as e: | |
print(f"Error generating response: {e}") | |
return "" | |
def clean_up_response(response, segments): | |
# Split the response into sentences | |
sentences = response.split('.') | |
# Remove empty sentences and any repetitive parts | |
cleaned_sentences = [] | |
for sentence in sentences: | |
if sentence.strip() and sentence.strip() not in segments and sentence.strip() not in cleaned_sentences: | |
cleaned_sentences.append(sentence.strip()) | |
# Join the sentences back together | |
cleaned_response = '. '.join(cleaned_sentences).strip() | |
# Check if the last sentence ends with a complete sentence | |
if cleaned_response and not cleaned_response.endswith((".", "!", "?")): | |
cleaned_response += "." | |
return cleaned_response | |
# Define the welcome message with markdown for formatting and larger fonts | |
welcome_message = """ | |
# Welcome to VISABOT! | |
## Your AI-driven visa assistant for all travel-related queries. | |
""" | |
# Define topics and countries with flag emojis | |
topics = """ | |
### Feel Free to ask me anything from the topics below! | |
- Visa issuance | |
- Documents needed | |
- Application process | |
- Processing time | |
- Recommended Vaccines | |
- Health Risks | |
- Healthcare Facilities | |
- Currency Information | |
- Embassy Information | |
- Allowed stay | |
""" | |
countries = """ | |
### Our chatbot can currently answer questions for these countries! | |
- π¨π³ China | |
- π«π· France | |
- π¬πΉ Guatemala | |
- π±π§ Lebanon | |
- π²π½ Mexico | |
- π΅π Philippines | |
- π·πΈ Serbia | |
- πΈπ± Sierra Leone | |
- πΏπ¦ South Africa | |
- π»π³ Vietnam | |
""" | |
# Define the Gradio app interface | |
def query_model(question): | |
if question == "": # If there's no input, the bot will display the greeting message. | |
return welcome_message | |
relevant_segment = find_relevant_segment(question, segments) | |
response = generate_response(question, relevant_segment) | |
return response | |
# Create Gradio Blocks interface for custom layout | |
with gr.Blocks() as demo: | |
gr.Markdown(welcome_message) # Display the welcome message with large fonts | |
with gr.Row(): | |
with gr.Column(): | |
gr.Markdown(topics) # Display the topics on the left | |
with gr.Column(): | |
gr.Markdown(countries) # Display the countries with flag emojis on the right | |
with gr.Row(): | |
img = gr.Image(os.path.join(os.getcwd(), "final.png"), width=500) # Adjust width as needed | |
with gr.Row(): | |
with gr.Column(): | |
question = gr.Textbox(label="Your question", placeholder="What do you want to ask about?") | |
answer = gr.Textbox(label="VisaBot Response", placeholder="VisaBot will respond here...", interactive=False, lines=10) | |
submit_button = gr.Button("Submit") | |
submit_button.click(fn=query_model, inputs=question, outputs=answer) | |
# Launch the app | |
demo.launch() | |