Spaces:

JaphetHernandez
/

Prueba_1

Running

App Files Community

JaphetHernandez committed on Oct 27

Commit

d37a28d

•

1 Parent(s): ddf9df9

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -12

app.py CHANGED Viewed

@@ -18,7 +18,7 @@ pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, max_length=
 llm_pipeline = HuggingFacePipeline(pipeline=pipe)
 # Interfaz de Streamlit
-st.title("Cosine Similarity with Llama 3.1")
 # Subir archivo CSV
 uploaded_file = st.file_uploader("Sube un archivo CSV con la columna 'job_title':", type=["csv"])
@@ -31,19 +31,23 @@ if uploaded_file is not None:
         query = 'aspiring human resources specialist'
         job_titles = df['job_title'].tolist()
-        # Definir el prompt para el LLM
         prompt = (
-            f"You are given a query and a list of job titles. Your task is to calculate the cosine similarity "
-            f"between the query and each job title. The query is: '{query}'. For each job title, provide the similarity "
-            f"score as a new column in the dataframe, called 'Score'. Return the dataframe with job titles and scores.\n"
-            f"Job Titles: {job_titles}\n"
-            f"Output format:\n"
             f"1. Job Title: [Job Title], Score: [Cosine Similarity Score]\n"
             f"2. Job Title: [Job Title], Score: [Cosine Similarity Score]\n"
-            f"..."
         )
-        # Mostrar el prompt inicial
         st.write("Prompt enviado al LLM:")
         st.write(prompt)
@@ -51,12 +55,12 @@ if uploaded_file is not None:
         if st.button("Generar puntajes de similitud"):
             with st.spinner("Calculando similitudes con Llama 3.1..."):
                 try:
-                    response = llm_pipeline(prompt)
                     st.write("Respuesta del modelo:")
                     st.write(response)
-                    # Simular la asignación de puntajes en la columna 'Score' (ya que el modelo no ejecuta cálculos reales)
-                    df['Score'] = [0.95] * len(df)  # Este paso es solo ilustrativo
                     # Mostrar el dataframe actualizado
                     st.write("DataFrame con los puntajes de similitud:")
@@ -65,3 +69,4 @@ if uploaded_file is not None:
                     st.error(f"Error durante la generación: {e}")
     else:
         st.error("La columna 'job_title' no se encuentra en el archivo CSV.")

 llm_pipeline = HuggingFacePipeline(pipeline=pipe)
 # Interfaz de Streamlit
+st.title("Cosine Similarity Simulation with Llama 3.1")
 # Subir archivo CSV
 uploaded_file = st.file_uploader("Sube un archivo CSV con la columna 'job_title':", type=["csv"])
         query = 'aspiring human resources specialist'
         job_titles = df['job_title'].tolist()
+        # Definir el prompt para simular la similitud de coseno
         prompt = (
+            f"You are an AI model trained to calculate semantic similarity using cosine similarity scores. "
+            f"The query is: '{query}'. You will compare this query to a list of job titles and estimate the cosine similarity score "
+            f"based on the semantic meaning. For each job title, assign a similarity score between 0 and 1. "
+            f"Output the results in the following format:\n\n"
             f"1. Job Title: [Job Title], Score: [Cosine Similarity Score]\n"
             f"2. Job Title: [Job Title], Score: [Cosine Similarity Score]\n"
+            f"...\n\n"
+            f"Job Titles:\n"
         )
+        # Agregar los títulos de trabajo al prompt
+        for i, title in enumerate(job_titles, 1):
+            prompt += f"{i}. {title}\n"
+        # Mostrar el prompt en la interfaz
         st.write("Prompt enviado al LLM:")
         st.write(prompt)
         if st.button("Generar puntajes de similitud"):
             with st.spinner("Calculando similitudes con Llama 3.1..."):
                 try:
+                    response = llm_pipeline(prompt)[0]['generated_text']
                     st.write("Respuesta del modelo:")
                     st.write(response)
+                    # Placeholder: fill 'Score' with a fixed value; the model response is displayed above but not parsed into scores
+                    df['Score'] = [0.95] * len(df)  # Simulación para la demostración
                     # Mostrar el dataframe actualizado
                     st.write("DataFrame con los puntajes de similitud:")
                     st.error(f"Error durante la generación: {e}")
     else:
         st.error("La columna 'job_title' no se encuentra en el archivo CSV.")