; Lexical search settings.
; All values are plain strings; numeric ones must contain only the number
; so the consumer can cast them (no trailing text after the value).
[lexical_search]
; presumably the number of top-ranked results to keep -- confirm against consumer
TOP_K = 20
; unit used when splitting documents into passages
SPLIT_BY = sentence
; presumably passage size and overlap, counted in SPLIT_BY units -- confirm
SPLIT_LENGTH = 3
SPLIT_OVERLAP = 0
; Semantic search settings (retriever + reader).
; All values are plain strings; numeric ones must contain only the number
; so the consumer can cast them (no trailing text after the value).
[semantic_search]
; presumably how many passages the retriever returns -- confirm against consumer
RETRIEVER_TOP_K = 10
; presumably the maximum token length fed to the retriever model -- confirm
MAX_SEQ_LENGTH = 64
; retriever model identifier; must match the model name exactly
RETRIEVER = msmarco-bert-base-dot-v5
; loader/format used for the retriever model
RETRIEVER_FORMAT = sentence_transformers
; NOTE(review): looks like the index of the layer embeddings are taken from
; (-1 presumably meaning the last layer) -- confirm
RETRIEVER_EMB_LAYER = -1
; reader model identifier; must match the model name exactly
READER = deepset/tinyroberta-squad2
; presumably how many answers the reader returns -- confirm
READER_TOP_K = 5
; NOTE(review): presumably a minimum score cut-off for results -- confirm
THRESHOLD = 0.1
; unit used when splitting documents into passages
SPLIT_BY = sentence
; presumably passage size and overlap, counted in SPLIT_BY units -- confirm
SPLIT_LENGTH = 3
SPLIT_OVERLAP = 0
; SDG classification settings.
; All values are plain strings; numeric ones must contain only the number
; so the consumer can cast them (no trailing text after the value).
[sdg]
; NOTE(review): presumably the minimum classifier score for a label to be kept -- confirm
THRESHOLD = 0.85
; classifier model identifier; must match the model name exactly
MODEL = jonas/sdg_classifier_osdg
; unit used when splitting documents into passages
SPLIT_BY = word
; 0/1 flag; presumably 1 strips punctuation before classification -- confirm
REMOVE_PUNC = 0
; presumably passage size and overlap, counted in SPLIT_BY units -- confirm
SPLIT_LENGTH = 120
SPLIT_OVERLAP = 10
; 0/1 flag; presumably 1 keeps word-based splits from cutting through a sentence -- confirm
RESPECT_SENTENCE_BOUNDARY = 1
; NOTE(review): other sections spell similar keys TOP_K / TOP_N; this name is
; kept unchanged because the consumer looks it up by key -- confirm before renaming
TOP_KEY = 15
; Preprocessor settings.
; All values are plain strings; numeric ones must contain only the number
; so the consumer can cast them (no trailing text after the value).
[preprocessor]
; presumably the overlap used when splitting by word, in words -- confirm against consumer
SPLIT_OVERLAP_WORD = 10
; presumably the overlap used when splitting by sentence, in sentences -- confirm
SPLIT_OVERLAP_SENTENCE = 1
; TF-IDF settings.
; Values are plain strings; the number must not be followed by any other text
; so the consumer can cast it.
[tfidf]
; presumably the number of top-scoring terms/results to keep -- confirm against consumer
TOP_N = 20