Skip to content

Commit c42cd24

Browse files
style: change configs order
1 parent da90335 commit c42cd24

4 files changed

Lines changed: 12 additions & 12 deletions

File tree

graphgen/configs/aggregated_config.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,12 +3,12 @@ read:
3 3
split:
4 4
chunk_size: 1024 # chunk size for text splitting
5 5
chunk_overlap: 100 # chunk overlap for text splitting
6-
output_data_type: aggregated # atomic, aggregated, multi_hop, cot
7-
output_data_format: ChatML # Alpaca, Sharegpt, ChatML
8-
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
9 6
search: # web search configuration
10 7
enabled: false # whether to enable web search
11 8
search_types: ["google"] # search engine types, support: google, bing, uniprot, wikipedia
9+
output_data_type: aggregated # atomic, aggregated, multi_hop, cot
10+
output_data_format: ChatML # Alpaca, Sharegpt, ChatML
11+
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
12 12
quiz_and_judge_strategy: # quiz and test whether the LLM masters the knowledge points
13 13
enabled: true
14 14
quiz_samples: 2 # number of quiz samples to generate

graphgen/configs/atomic_config.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,12 +3,12 @@ read:
3 3
split:
4 4
chunk_size: 1024 # chunk size for text splitting
5 5
chunk_overlap: 100 # chunk overlap for text splitting
6-
output_data_type: atomic # atomic, aggregated, multi_hop, cot
7-
output_data_format: Alpaca # Alpaca, Sharegpt, ChatML
8-
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
9 6
search: # web search configuration
10 7
enabled: false # whether to enable web search
11 8
search_types: ["google"] # search engine types, support: google, bing, uniprot, wikipedia
9+
output_data_type: atomic # atomic, aggregated, multi_hop, cot
10+
output_data_format: Alpaca # Alpaca, Sharegpt, ChatML
11+
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
12 12
quiz_and_judge_strategy: # quiz and test whether the LLM masters the knowledge points
13 13
enabled: true
14 14
quiz_samples: 2 # number of quiz samples to generate

graphgen/configs/cot_config.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,12 +3,12 @@ read:
3 3
split:
4 4
chunk_size: 1024 # chunk size for text splitting
5 5
chunk_overlap: 100 # chunk overlap for text splitting
6-
output_data_type: cot # atomic, aggregated, multi_hop, cot
7-
output_data_format: Sharegpt # Alpaca, Sharegpt, ChatML
8-
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
9 6
search: # web search configuration
10 7
enabled: false # whether to enable web search
11 8
search_types: ["google"] # search engine types, support: google, bing, uniprot, wikipedia
9+
output_data_type: cot # atomic, aggregated, multi_hop, cot
10+
output_data_format: Sharegpt # Alpaca, Sharegpt, ChatML
11+
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
12 12
method_params:
13 13
method: leiden
14 14
max_size: 20 # Maximum size of communities

graphgen/configs/multi_hop_config.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3,12 +3,12 @@ read:
3 3
split:
4 4
chunk_size: 1024 # chunk size for text splitting
5 5
chunk_overlap: 100 # chunk overlap for text splitting
6-
output_data_type: multi_hop # atomic, aggregated, multi_hop, cot
7-
output_data_format: ChatML # Alpaca, Sharegpt, ChatML
8-
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
9 6
search: # web search configuration
10 7
enabled: false # whether to enable web search
11 8
search_types: ["google"] # search engine types, support: google, bing, uniprot, wikipedia
9+
output_data_type: multi_hop # atomic, aggregated, multi_hop, cot
10+
output_data_format: ChatML # Alpaca, Sharegpt, ChatML
11+
tokenizer: cl100k_base # tokenizer for counting tokens, support tiktoken tokenizer names and local tokenizer path
12 12
quiz_and_judge_strategy: # quiz and test whether the LLM masters the knowledge points
13 13
enabled: false
14 14
quiz_samples: 2 # number of quiz samples to generate

0 commit comments

Comments
 (0)