-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcase.yaml.example
More file actions
35 lines (28 loc) · 900 Bytes
/
case.yaml.example
File metadata and controls
35 lines (28 loc) · 900 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# CaseStack case configuration
# Copy this to case.yaml and customize for your document set.
# Case identity: replace these placeholder values with your own.
name: "My Case"
# NOTE(review): presumably a short URL/filesystem-safe identifier — confirm
# against the loader before using spaces or uppercase here.
slug: "my-case"
description: "Description of this document collection"

# Where raw documents live (PDFs, images, audio/video)
documents_dir: "./documents"
# Processing options
# The settings below must stay indented under `ocr`; at column 0 they would
# become unrelated top-level keys and `ocr` itself would be null.
ocr:
  backend: "pymupdf"  # "docling", "pymupdf", or "both"
  workers: 4
# Entity extraction settings (nested under `entities`).
entities:
  spacy_model: "en_core_web_sm"
  types: ["PERSON", "ORG", "GPE", "DATE", "MONEY", "PHONE", "EMAIL_ADDR"]
  # Optional: path to a JSON person registry for fuzzy matching.
  # Uncomment in place so the keys remain children of `entities`.
  # registry: "./data/persons-registry.json"
  # fuzzy_threshold: 85
# Deduplication settings (nested under `dedup`).
dedup:
  threshold: 0.90
  # Bates number prefixes for dedup overlap detection (optional)
  # bates_prefixes: ["EFTA", "DOJ"]
# Serving
serve:
  port: 8001
  title: "My Case — Document Database"
  # Optional example: `enabled` and `openrouter_api_key_env` are children of
  # `ask_proxy`; the env key holds the NAME of an environment variable, so the
  # API key itself never has to be written into this file.
  # NOTE(review): assumed to nest under `serve` — confirm against the loader.
  # ask_proxy:
  #   enabled: true
  #   openrouter_api_key_env: "OPENROUTER_API_KEY"