; Settings for the lexical search feature.
; NOTE(review): key meanings below are inferred from their names; confirm
; against the code that reads this file.
[lexical_search]
; Presumably the maximum number of results returned per query.
TOP_K = 20
; Presumably the minimum score a result must reach to be kept.
; TODO confirm the score scale this is compared against.
THRESHOLD = 0.1
; Document-splitting parameters: the unit to split on, the number of units
; per chunk, and the number of units shared between consecutive chunks.
; As written: chunks of 3 sentences with no overlap (assuming those semantics).
SPLIT_BY = sentence
SPLIT_LENGTH = 3
SPLIT_OVERLAP = 0

; Settings for the semantic search feature (retriever + reader models).
; NOTE(review): key meanings below are inferred from their names; confirm
; against the code that reads this file.
[semantic_search]
; Presumably the number of candidate passages the retriever hands on.
RETRIEVER_TOP_K = 10
; Presumably the maximum input length for the retriever model.
; TODO confirm the unit (tokens?) and whether longer inputs are truncated.
MAX_SEQ_LENGTH = 64
; Retriever model name and the format/library it is loaded with.
RETRIEVER = msmarco-bert-base-dot-v5
RETRIEVER_FORMAT = sentence_transformers
; Presumably selects which model layer embeddings are taken from; -1 looks
; like "last layer" — TODO confirm.
RETRIEVER_EMB_LAYER = -1
; Reader model identifier (looks like a model-hub id of the form owner/name).
READER = deepset/tinyroberta-squad2
; Presumably the maximum number of answers the reader returns.
READER_TOP_K = 5
; Presumably the minimum score a result must reach to be kept.
; TODO confirm the score scale this is compared against.
THRESHOLD = 0.1
; Document-splitting parameters: the unit to split on, the number of units
; per chunk, and the number of units shared between consecutive chunks.
; As written: chunks of 3 sentences with no overlap (assuming those semantics).
SPLIT_BY = sentence
SPLIT_LENGTH = 3
SPLIT_OVERLAP = 0

; Settings for the SDG classifier.
; NOTE(review): key meanings below are inferred from their names; confirm
; against the code that reads this file.
[sdg]
; Presumably the minimum classifier score for a prediction to be kept.
; Much stricter than the 0.1 used by the search sections of this file;
; TODO confirm the two are not meant to share a scale.
THRESHOLD = 0.85
; Classifier model identifier (looks like a model-hub id of the form owner/name).
MODEL = jonas/sdg_classifier_osdg
; Document-splitting parameters: the unit to split on, the number of units
; per chunk, and the number of units shared between consecutive chunks.
; As written: chunks of 110 words overlapping by 10 words (assuming those semantics).
SPLIT_BY = word
SPLIT_LENGTH = 110
SPLIT_OVERLAP = 10

; Settings for the document preprocessor.
; NOTE(review): these look like overlap values chosen by split unit (word vs.
; sentence). The word value matches SPLIT_OVERLAP in [sdg], but the sentence
; value (1) differs from the SPLIT_OVERLAP = 0 in [lexical_search] and
; [semantic_search]. Which setting takes precedence is not visible in this
; file — confirm against the code that reads it.
[preprocessor]
; Presumably the overlap, in words, when splitting by word.
SPLIT_OVERLAP_WORD = 10
; Presumably the overlap, in sentences, when splitting by sentence.
SPLIT_OVERLAP_SENTENCE = 1