; littercockpit-demo / paramconfig.cfg
; Duplicated from GIZ/SDSN-demo (revision e1b1d60); file size 938 bytes.
; Settings for the lexical search feature.
; NOTE(review): the code that reads this section is not part of this file; key
; meanings below are inferred from the key names -- confirm against the consumer.
[lexical_search]
; Presumably the number of top-ranked results to return.
TOP_K = 20
; Unit used when splitting documents into passages (here: word).
SPLIT_BY = word
; Passage size, presumably counted in SPLIT_BY units (i.e. 120 words).
SPLIT_LENGTH = 120
; Overlap between consecutive passages. This section uses 0, whereas
; [semantic_search], [sdg] and [coherence] all use 10.
SPLIT_OVERLAP = 0
; 0/1 flag; presumably 0 leaves punctuation in the text -- TODO confirm.
REMOVE_PUNC = 0
; Settings for the semantic search feature (a retriever model plus a reader model).
; NOTE(review): the code that reads this section is not part of this file; key
; meanings below are inferred from the key names -- confirm against the consumer.
[semantic_search]
; Presumably the number of passages the retriever hands on.
RETRIEVER_TOP_K = 10
; Presumably the maximum input sequence length for the retriever model;
; should agree with the limit of the model named in RETRIEVER -- TODO confirm.
MAX_SEQ_LENGTH = 384
; Identifier of the retriever (embedding) model.
RETRIEVER = all-mpnet-base-v2
; Format/loader used for the retriever model.
RETRIEVER_FORMAT = sentence_transformers
; Presumably the size of the embedding vectors; must match the RETRIEVER model's
; output dimension -- verify whenever RETRIEVER is changed.
EMBEDDING_DIM = 768
; Presumably selects the model layer embeddings are taken from; -1 looks like
; "last layer" -- TODO confirm.
RETRIEVER_EMB_LAYER = -1
; Identifier of the reader model.
READER = deepset/tinyroberta-squad2
; Presumably the number of answers the reader returns overall.
READER_TOP_K = 10
; Presumably the number of answers kept per retrieved passage.
READER_TOP_K_PER_CANDIDATE = 1
; Unit used when splitting documents into passages (here: word).
SPLIT_BY = word
; Passage size, presumably counted in SPLIT_BY units (i.e. 120 words).
SPLIT_LENGTH = 120
; Overlap between consecutive passages, presumably in SPLIT_BY units.
SPLIT_OVERLAP = 10
; 0/1 flag; presumably 1 avoids cutting passages in the middle of a sentence.
RESPECT_SENTENCE_BOUNDARY = 1
; 0/1 flag; presumably 0 leaves punctuation in the text -- TODO confirm.
REMOVE_PUNC = 0
; Settings for the "sdg" feature, which uses the model named in MODEL.
; NOTE(review): the code that reads this section is not part of this file; key
; meanings below are inferred from the key names -- confirm against the consumer.
[sdg]
; Presumably the minimum model score for a prediction to be kept -- TODO confirm.
THRESHOLD = 0.85
; Identifier of the model used by this feature.
MODEL = jonas/bert-base-uncased-finetuned-sdg
; Unit used when splitting documents into passages (here: word).
SPLIT_BY = word
; 0/1 flag; presumably 0 leaves punctuation in the text -- TODO confirm.
REMOVE_PUNC = 0
; Passage size, presumably counted in SPLIT_BY units (i.e. 120 words).
SPLIT_LENGTH = 120
; Overlap between consecutive passages, presumably in SPLIT_BY units.
SPLIT_OVERLAP = 10
; 0/1 flag; presumably 1 avoids cutting passages in the middle of a sentence.
RESPECT_SENTENCE_BOUNDARY = 1
; NOTE(review): spelled TOP_KEY, not TOP_K as in [lexical_search]. This may be
; intentional (e.g. a count of top keywords) -- check the consuming code before
; renaming, since the reader looks the key up by this exact name.
TOP_KEY = 15
; Settings for the "coherence" feature, which uses a retriever (embedding) model.
; NOTE(review): the code that reads this section is not part of this file; key
; meanings below are inferred from the key names -- confirm against the consumer.
[coherence]
; Presumably the number of passages the retriever hands on.
RETRIEVER_TOP_K = 10
; Presumably the maximum input sequence length for the retriever model;
; should agree with the limit of the model named in RETRIEVER -- TODO confirm.
MAX_SEQ_LENGTH = 512
; Identifier of the retriever (embedding) model.
RETRIEVER = msmarco-distilbert-dot-v5
; Format/loader used for the retriever model.
RETRIEVER_FORMAT = sentence_transformers
; Presumably selects the model layer embeddings are taken from; -1 looks like
; "last layer" -- TODO confirm.
RETRIEVER_EMB_LAYER = -1
; Presumably the size of the embedding vectors; must match the RETRIEVER model's
; output dimension -- verify whenever RETRIEVER is changed.
EMBEDDING_DIM = 768
; Presumably the minimum similarity score for a match to be kept -- TODO confirm.
THRESHOLD = 0.55
; Unit used when splitting documents into passages (here: word).
SPLIT_BY = word
; Passage size, presumably counted in SPLIT_BY units (i.e. 120 words).
SPLIT_LENGTH = 120
; Overlap between consecutive passages, presumably in SPLIT_BY units.
SPLIT_OVERLAP = 10
; 0/1 flag; presumably 1 avoids cutting passages in the middle of a sentence.
RESPECT_SENTENCE_BOUNDARY = 1
; 0/1 flag; presumably 0 leaves punctuation in the text -- TODO confirm.
REMOVE_PUNC = 0