Skip to content

Commit c8ada4c

Browse files
wip: add protein_qa generation
1 parent 97cdde3 commit c8ada4c

File tree

1 file changed

+18
-0
lines changed

1 file changed

+18
-0
lines changed
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
# Configuration for protein_qa generation; sections: read, split, search, quiz_and_judge, partition, generate.
read: # input reading configuration
2+
input_file: resources/input_examples/protein_demo.json # path to the input file; supported formats: json, jsonl, txt, pdf. See resources/input_examples for examples
3+
split: # text splitting configuration
4+
chunk_size: 1024 # chunk size for text splitting
5+
chunk_overlap: 100 # overlap between consecutive chunks for text splitting
6+
search: # web search configuration
7+
enabled: false # whether to enable web search
8+
search_types: ["google"] # search engine types; supported: google, bing, uniprot, wikipedia
9+
quiz_and_judge: # quiz the LLM and judge whether it has mastered the knowledge points
10+
enabled: false # whether to enable the quiz_and_judge step
11+
partition: # graph partition configuration
12+
method: anchor_bfs # partition method
13+
method_params: # parameters for the selected partition method
14+
anchor_type: protein # node type used to select anchor nodes
15+
max_units_per_community: 10 # presumably the max number of units (nodes/edges) per community — TODO confirm; 10 is not an atomic (one-unit) partition
16+
generate: # generation configuration
17+
mode: protein_qa # generation mode: atomic, aggregated, multi_hop, cot, vqa, protein_qa
18+
data_format: ChatML # data format options: Alpaca, Sharegpt, ChatML

0 commit comments

Comments
 (0)