-
Notifications
You must be signed in to change notification settings - Fork 14
Expand file tree
/
Copy pathconfig.toml
More file actions
49 lines (42 loc) · 1.99 KB
/
config.toml
File metadata and controls
49 lines (42 loc) · 1.99 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
[[llm_providers]]
# LLM API 服务提供商,可配置多个
name = "localhost"
base_url = "http://192.168.1.9:8888/v1/"
api_key = "lm_studio"
[entity_extract.llm]
# 设置用于实体提取的LLM模型
provider = "localhost" # 服务提供商
model = "deepseek-r1-distill-llama-8b" # 模型名称
[rdf_build.llm]
# 设置用于RDF构建的LLM模型
provider = "localhost" # 服务提供商
model = "deepseek-r1-distill-llama-8b" # 模型名称
[embedding]
# 设置用于文本嵌入的Embedding模型
provider = "localhost" # 服务提供商
model = "text-embedding-bge-m3" # 模型名称
dimension = 1024 # 嵌入维度
[rag.params]
# RAG参数配置
synonym_search_top_k = 10 # 同义词搜索TopK
synonym_threshold = 0.8 # 同义词阈值(相似度高于此阈值的词语会被认为是同义词)
[qa.llm]
# 设置用于QA的LLM模型
provider = "localhost" # 服务提供商
model = "deepseek-r1-distill-llama-8b" # 模型名称
[qa.params]
# QA参数配置
relation_search_top_k = 10 # 关系搜索TopK
relation_threshold = 0.5 # 关系阈值(相似度高于此阈值的关系会被认为是相关的关系)
paragraph_search_top_k = 1000 # 段落搜索TopK(不能过小,可能影响搜索结果)
paragraph_node_weight = 0.05 # 段落节点权重(在图搜索&PPR计算中的权重,当搜索仅使用DPR时,此参数不起作用)
ent_filter_top_k = 10 # 实体过滤TopK
ppr_damping = 0.8 # PPR阻尼系数
res_top_k = 3 # 最终提供的文段TopK
[persistence]
# 持久化配置(存储中间数据,防止重复计算)
data_root_path = "data" # 数据根目录
raw_data_path = "data/import.json" # 原始数据路径
openie_data_path = "data/openie.json" # OpenIE数据路径
embedding_data_dir = "data/embedding" # 嵌入数据目录
rag_data_dir = "data/rag" # RAG数据目录