File size: 1,877 Bytes
06b4325
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
class config():

    sample_texts_path = 'data/sample_text.csv'

    logo_path = 'images/tum-logo.png'
    main_title = 'Topic Modeling for Summarization'
    lecture_title = 'Machine Learning for Natural Language Processing Applications (IN2106)'

    input_text = 'Enter Some Text:'
    button_text = 'Generate new sample text'
    

    topic_modelling_title = 'Topic Modelling:'
    topic_modelling_answers = ('BERTopic','LDA','CTM','NMF','Top2Vec')

    segmenter_title = 'Segmentizer:'
    segmenter_answers = ('Nltk','Spacy','Stanza')

    summarizer_title = 'Summarizer:'
    summarizer_answers = ('Bart','T5-base','Prophetnet','Pegasus')

    generate_text = 'Generate topic based summaries'

    output_title = 'Select topics you want to see summaries of:'


    warning_len_input_text = 'The length of the input text is not enough to create topic awareness summaries! or change parameters!'
    filter_threshold_summaries = True
    threshold_error = 'X -> not possible to generate a summary due to ''threshold'

    # model parameters
    MIN_NUM_SENTENCES_FOR_SUMMARY_CREATION = 2
    PATH_20_NEWS_CLUSTERID_LABEL_WORDS = 'data/_20news_df_output_clusterId_label_words.csv'

    PATH_20_NEWS_CLUSTERID_LABEL_WORDS_CTM = 'data/_20news_df_output_doc_topic_CTM_LIST.csv'
    PATH_20_NEWS_CLUSTERID_LABEL_WORDS_LDA = 'data/_20news_df_output_doc_topic_LDA_LIST.csv'
    PATH_20_NEWS_CLUSTERID_LABEL_WORDS_NMF = 'data/_20news_df_output_doc_topic_NMF_LIST.csv'
    PATH_20_NEWS_CLUSTERID_LABEL_WORDS_TOP2VEC = 'data/_20news_df_output_doc_topic_Top2Vec_LIST.csv'

    # model paths
    nltk_path = 'models/nltkUtilsObj.pkl'
    sent_trans_path = 'models/sentTransfModelUtilsObj.pkl'

    pegasus_model_path = 'models/pegasus_model'
    bart_model_path = 'models/bart_model'
    t5_model_path = 'models/t5_model'
    prophetnet_model_path = 'models/prophetnet_model'