# Configuration for question categorization using generated capabilities extraction.

# Input data locations and dataset selection.
data_cfg:
  # Path to the generated capabilities directory containing capabilities.
  generated_dir: /projects/DeepLesion/projects/automated_capability_evaluation/artifacts/capabilities_gpt-claude-math/math

  # Dataset selection.
  # Supported dataset_name values: "gsm8k", "math"
  dataset_name: gsm8k
  # For gsm8k: path to the combined JSONL file.
  # For math: root directory with JSON files (searched recursively).
  dataset_path: /projects/DeepLesion/projects/automated_capability_evaluation/static_datasets/math/gsm8k-main/test.jsonl

  # Path to the existing Wikipedia categorization results (not used in generated mode).
  # NOTE(review): the key name and value look like a directory, while the original
  # comment called it a "results file" -- confirm which one the consumer expects.
  wikipedia_dir: /projects/DeepLesion/projects/automated_capability_evaluation/wikipedia/pages

# How areas and capabilities are obtained.
categorization_cfg:
  # Method to use for extracting areas and capabilities.
  # Options: "generated" (extract from capability.json files)
  #       or "wikipedia" (use predefined Wikipedia categorization)
  extraction_method: "generated"

# LLM used to categorize questions.
llm_cfg:
  # LLM model name for categorization.
  # model_name: "Qwen2.5-14B-Instruct"
  model_name: "Qwen2.5-7B-Instruct"
  # LLM model provider.
  model_provider: "local"

# Where categorization results are written.
output_cfg:
  # Directory to save the categorization results.
  results_dir: /projects/DeepLesion/projects/automated_capability_evaluation/results/GSM8K
  # Name of the output file.
  output_filename: gsm8k_vs_generated.json

# Run-time processing behaviour.
processing_cfg:
  # Save a checkpoint every N questions.
  save_every_n: 20

# Defaults list containing only this file itself
# (presumably Hydra's config-composition list -- confirm against the loader).
defaults:
  - _self_