Spaces:
Sleeping
Sleeping
import models as md | |
import pandas as pd | |
class Keywords: | |
def __init__(self, title_element:str): | |
self.title_element = [] | |
self.kw_model = md.load_keyword_model() | |
def get_keywords(self, text_chunks_lib:dict) -> list: | |
kw_dict = dict() | |
text_chunk_counter = 0 | |
for key in text_chunks_lib: | |
keywords_list = [] | |
for text_chunk in text_chunks_lib[key]: | |
text_chunk_counter += 1 | |
keywords_list += md.keyword_gen(self.kw_model, text_chunk) | |
kw_dict[key] = dict(keywords_list) | |
# Display as a dataframe | |
kw_df0 = pd.DataFrame.from_dict(kw_dict).reset_index() | |
kw_df0.rename(columns={'index': 'keyword'}, inplace=True) | |
kw_df = pd.melt(kw_df0, id_vars=['keyword'], var_name='title', value_name='score').dropna() | |
kw_column_list = ['keyword', 'score'] | |
kw_df = kw_df[kw_df['score'] > 0.25][kw_column_list].sort_values(['score'], ascending=False).reset_index().drop(columns='index') | |
return kw_df['keyword'] |