Skip to content

Commit 51435df

Browse files
authored
feat: adding clingen curation data (#55)
1 parent 2a5e76a commit 51435df

File tree

13 files changed

+60
-5
lines changed

13 files changed

+60
-5
lines changed

.github/workflows/main.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ jobs:
3131
environment-file: environment.yml
3232
init-shell: bash
3333
cache-environment: true
34-
post-cleanup: 'all'
34+
post-cleanup: none # breaks otherwise
3535

3636
- name: Check formating
3737
run: |
@@ -65,7 +65,7 @@ jobs:
6565
environment-file: environment.yml
6666
init-shell: bash
6767
cache-environment: true
68-
post-cleanup: 'all'
68+
post-cleanup: none # breaks otherwise
6969

7070
- name: Install python package
7171
run: |

Snakefile

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -85,6 +85,7 @@ rule all:
8585
# == work directory =====================================================================
8686
#
8787
# genes
88+
f"work/download/genes/clingen/{DV.clingen_gene}/clingen.csv",
8889
f"work/genes/dbnsfp/{DV.dbnsfp}/genes.tsv.gz",
8990
f"work/genes/ensembl/{DV.ensembl}/ensembl_xlink.tsv",
9091
f"work/genes/enst_ensg/grch37/{DV.ensembl_37}/enst_ensg.tsv",
@@ -317,6 +318,7 @@ rule all:
317318
include: "rules/work/misc/hpo.smk"
318319
# Gene-related rules.
319320
include: "rules/work/genes/dbnsfp.smk"
321+
include: "rules/work/genes/clingen.smk"
320322
include: "rules/work/genes/ensembl.smk"
321323
include: "rules/work/genes/gnomad.smk"
322324
include: "rules/work/genes/hgnc.smk"

download_urls.yml

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,9 @@
1+
- comment: The curation activity summary report is built in real-time.
2+
url: https://search.clinicalgenome.org/kb/reports/curation-activity-summary-report
3+
4+
- comment: ClinGen variant summary is built in real-time
5+
url: http://erepo.clinicalgenome.org/evrepo/api/classifications/all?format=tabbed
6+
17
- url: https://github.com/bihealth/annonars-data-clinvar/releases/download/clinvar-weekly-20230625/clinvar-strucvar-grch37-2023-0625+0.6.3.tar.gz
28
excerpt_strategy:
39
strategy: no-excerpt

excerpt-data/0a27656c7f2ba08a/all

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:8dbeb7d6578a59b07d5296ba8f8d0f729f51dfd005cd7c3466a4c683e7a4d91c
3+
size 156424
Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:cce44490e7ce19c99ae46d09281eca6645ca05c05bfe32c8ff87b88a25ca856c
3+
size 77
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:d76098d2d3712096592a4a0f78d2aad039cae1e68b60ea802edd52d4edc4ae85
3-
size 6733
2+
oid sha256:85689d642c36284f0bb17567eb9b10f7b001bed8e6d912ed97f728fcacd5b316
3+
size 34848332
Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:56ea2a537b3b1afdd7426268eec5cbb3154a38101015aff61592689472d36f52
3+
size 1810278
Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
version https://git-lfs.github.com/spec/v1
2+
oid sha256:25fee8c5e5004815bdf7fee7462711e0a9bb7b42b547f437dd58767fd640a6f2
3+
size 78

rules/output/annonars/genes.smk

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@
44
rule output_annonars_genes: # -- build annonars genes RocksDB file
55
input:
66
acmg_sf="data/acmg_sf/{v_acmg_sf}/acmg_sf.tsv",
7+
clingen="work/download/genes/clingen/{date}/clingen.csv",
78
gnomad_constraints="work/genes/gnomad/{v_gnomad_constraints}/gnomad_constraints.tsv",
89
dbnsfp="work/genes/dbnsfp/{v_dbnsfp}/genes.tsv.gz",
910
hgnc="work/genes/hgnc/{date}/hgnc_info.jsonl",
@@ -25,9 +26,15 @@ rule output_annonars_genes: # -- build annonars genes RocksDB file
2526
v_annonars=RE_VERSION,
2627
shell:
2728
r"""
29+
export TMPDIR=$(mktemp -d)
30+
trap "rm -rf $TMPDIR" EXIT
31+
32+
tail -n +4 {input.clingen} > $TMPDIR/clingen.csv
33+
2834
annonars gene import \
2935
--path-out-rocksdb $(dirname {output.rocksdb_identity}) \
3036
--path-in-acmg {input.acmg_sf} \
37+
--path-in-clingen $TMPDIR/clingen.csv \
3138
--path-in-gnomad-constraints {input.gnomad_constraints} \
3239
--path-in-dbnsfp {input.dbnsfp} \
3340
--path-in-hgnc {input.hgnc} \

rules/output/annonars/genes.spec.yaml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,8 @@ dc.source:
2222
x-created-from:
2323
- name: ACMG SF Gene List
2424
version: {{ v_acmg_sf }}
25+
- name: ClinGen Gene Curation
26+
version: {{ today }}
2527
- name: gnomAD constraints
2628
version: {{ v_gnomad_constraints }}
2729
- name: dbNSFP

0 commit comments

Comments
 (0)