Skip to content

Commit 6504e50

Browse files
committed
Added static vs generated code
1 parent e948a34 commit 6504e50

File tree

2 files changed

+577
-0
lines changed

2 files changed

+577
-0
lines changed
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
# Configuration for question categorization using generated capabilities extraction
2+
data_cfg:
3+
# Path to the directory containing the generated capabilities
4+
generated_dir: /projects/DeepLesion/projects/automated_capability_evaluation/artifacts/capabilities_gpt-claude-math/math
5+
6+
# Dataset selection
7+
# Supported dataset_name values: "gsm8k", "math"
8+
dataset_name: gsm8k
9+
# For gsm8k: path to the combined JSONL file; for math: root directory of JSON files (searched recursively)
10+
dataset_path: /projects/DeepLesion/projects/automated_capability_evaluation/static_datasets/math/gsm8k-main/test.jsonl
11+
12+
# Path to the directory holding the existing Wikipedia categorization pages (not used in generated mode)
13+
wikipedia_dir: /projects/DeepLesion/projects/automated_capability_evaluation/wikipedia/pages
14+
15+
categorization_cfg:
16+
# Method to use for extracting areas and capabilities
17+
# Options: "generated" (extract from capability.json files) or "wikipedia" (use predefined Wikipedia categorization)
18+
extraction_method: "generated"
19+
20+
llm_cfg:
21+
# LLM model name for categorization
22+
# model_name: "Qwen2.5-14B-Instruct"
23+
model_name: "Qwen2.5-7B-Instruct"
24+
# LLM model provider
25+
model_provider: "local"
26+
27+
28+
output_cfg:
29+
# Directory to save the categorization results
30+
results_dir: /projects/DeepLesion/projects/automated_capability_evaluation/results/GSM8K
31+
# Name of the output file
32+
output_filename: gsm8k_vs_generated.json
33+
34+
processing_cfg:
35+
# Save checkpoint every N questions
36+
save_every_n: 20
37+
38+
defaults:
39+
- _self_
40+

0 commit comments

Comments
 (0)