Skip to content

Commit 1226f7a

Browse files
authored
Merge pull request #82 from umccr/patch1-pd
Grab correct cancer gene panel somatic_panel-v24.03.0.tsv
2 parents c16f9a2 + cead7f1 commit 1226f7a

16 files changed

+73
-1330
lines changed

.pre-commit-config.yaml

+2-2
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
# R specific hooks: https://github.com/lorenzwalthert/precommit
33
repos:
44
- repo: https://github.com/lorenzwalthert/precommit
5-
rev: v0.3.2
5+
rev: v0.4.3
66
hooks:
77
- id: style-files
88
args: [--style_pkg=styler, --style_fun=tidyverse_style]
@@ -14,7 +14,7 @@ repos:
1414
- id: use-tidy-description
1515
- id: readme-rmd-rendered
1616
- repo: https://github.com/pre-commit/pre-commit-hooks
17-
rev: v4.2.0
17+
rev: v4.6.0
1818
hooks:
1919
- id: check-added-large-files
2020
args: ['--maxkb=200']

R/purple.R

+3-3
Original file line numberDiff line numberDiff line change
@@ -51,7 +51,7 @@ purple_cnv_som_gene_read <- function(x) {
5151
#'
5252
#' @examples
5353
#' x <- system.file("extdata/purple/purple.cnv.gene.tsv", package = "gpgr")
54-
#' g <- system.file("extdata/ref/umccr_cancer_genes_v24.03.0.tsv", package = "gpgr")
54+
#' g <- system.file("extdata/ref/somatic_panel-v24.03.0.tsv", package = "gpgr")
5555
#' (pp <- purple_cnv_som_gene_process(x, g))
5656
#' @testexamples
5757
#' expect_equal(colnames(pp$tab)[ncol(pp$tab)], "minRegSupportStartEndMethod")
@@ -60,11 +60,11 @@ purple_cnv_som_gene_read <- function(x) {
6060
purple_cnv_som_gene_process <- function(x, g = NULL) {
6161
purple_cnv_gene <- purple_cnv_som_gene_read(x)
6262
if (is.null(g)) {
63-
g <- system.file("extdata/ref/umccr_cancer_genes_v24.03.0.tsv", package = "gpgr")
63+
g <- system.file("extdata/ref/somatic_panel-v24.03.0.tsv", package = "gpgr")
6464
}
6565
genes <-
6666
readr::read_tsv(g, col_types = readr::cols(
67-
ensembl_gene_symbol = "c", oncogene = "l", tumorsuppressor = "l"
67+
ensembl_gene_symbol = "c", oncogene = "l", tsgene = "l"
6868
)) |>
6969
dplyr::select(symbol = "ensembl_gene_symbol", "oncogene", "tsgene")
7070
oncogenes <- genes |>

R/sv.R

+1-1
Original file line numberDiff line numberDiff line change
@@ -186,7 +186,7 @@ join_breakpoint_entries <- function(x) {
186186
# Group by GRIDSS identifier (clipping trailing h/o [h: High, o: lOwer])
187187
bps <- x |>
188188
tidyr::separate("ID", into = c("BND_group", "BND_mate"), sep = -1, convert = TRUE, remove = FALSE) |>
189-
dplyr::group_by(BND_group)
189+
dplyr::group_by(.data$BND_group)
190190

191191
# Set a sequential breakpoint identifier
192192
bps_groups <- bps |> dplyr::n_groups()

README.Rmd

+3-3
Original file line numberDiff line numberDiff line change
@@ -47,10 +47,10 @@ conda install r-gpgr -c umccr -c conda-forge -c bioconda
4747
(<https://github.com/hartwigmedical/hmftools/tree/master/purple>).
4848
See vignette at <https://umccr.github.io/gpgr/articles/purple.html>.
4949

50-
### 🐍 umccrise {#id_-umccrise}
50+
### sash {#id_-sash}
5151

52-
- Generate a HTML report with results from the `umccrise` DRAGEN tumor/normal
53-
post-processing workflow from UMCCR - <https://github.com/umccr/umccrise>.
52+
- Generate a HTML report with results from the `sash` WGS post-processing workflow
53+
- <https://github.com/scwatts/sash>.
5454
See the [CLI](#cli) section below for options.
5555

5656
## 🥳 Developers {#id_-developers}

README.md

+37-50
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,10 @@
11

22
- [📚 gpgr - Genomics Platform Group
3-
Reporting](#-gpgr---genomics-platform-group-reporting)
3+
Reporting](#books-gpgr---genomics-platform-group-reporting)
44
- [Installation](#installation)
55
- [Main modules](#main-modules)
6-
- [🕸 LINX](#id_-linx)
76
- [🔮 PURPLE](#id_-purple)
8-
- [🐍 umccrise](#id_-umccrise)
7+
- [sash](#id_-sash)
98
- [🥳 Developers](#id_-developers)
109
- [💻 CLI](#id_-cli)
1110

@@ -37,28 +36,19 @@ conda install r-gpgr -c umccr -c conda-forge -c bioconda
3736

3837
## Main modules
3938

40-
### 🕸 LINX
41-
42-
- Generate a HTML report with results from the `LINX` structural variant
43-
visualisation tool from the Hartwig Medical Foundation
44-
(<https://github.com/hartwigmedical/hmftools/tree/master/linx>). See
45-
the [CLI](#cli) section below for options.
46-
- For useful functions for reading/processing `LINX` results, see the
47-
vignette at <https://umccr.github.io/gpgr/articles/linx.html>.
48-
4939
### 🔮 PURPLE
5040

5141
- Read and process output files from the `PURPLE` purity/copy number
5242
estimator tool from the Hartwig Medical Foundation
5343
(<https://github.com/hartwigmedical/hmftools/tree/master/purple>). See
5444
vignette at <https://umccr.github.io/gpgr/articles/purple.html>.
5545

56-
### 🐍 umccrise
46+
### sash
5747

58-
- Generate a HTML report with results from the `umccrise` DRAGEN
59-
tumor/normal post-processing workflow from UMCCR -
60-
<https://github.com/umccr/umccrise>. See the [CLI](#cli) section below
61-
for options.
48+
- Generate a HTML report with results from the `sash` WGS
49+
post-processing workflow
50+
- <https://github.com/scwatts/sash>. See the [CLI](#cli) section below
51+
for options.
6252

6353
## 🥳 Developers
6454

@@ -80,52 +70,40 @@ export PATH="${gpgr_cli}:${PATH}"
8070
```
8171

8272
gpgr.R --version
83-
gpgr.R 1.4.3
73+
gpgr.R 2.1.0
8474

8575
#-----------------------------------#
8676
gpgr.R --help
87-
usage: gpgr.R [-h] [-v] {linx,canrep} ...
77+
usage: gpgr.R [-h] [-v] {canrep} ...
8878

8979
UMCCR Genomics Platform Group Reporting
9080

9181
positional arguments:
92-
{linx,canrep} sub-command help
93-
linx UMCCR LINX Report.
82+
{canrep} sub-command help
9483
canrep UMCCR Cancer Report.
9584

9685
options:
9786
-h, --help show this help message and exit
9887
-v, --version show program's version number and exit
9988

100-
#-----------------------------------#
101-
#------- LINX Report -------#
102-
gpgr.R linx --help
103-
usage: gpgr.R linx [-h] --sample SAMPLE --plot PLOT --table TABLE [--out OUT]
104-
[--quiet]
105-
106-
options:
107-
-h, --help show this help message and exit
108-
--sample SAMPLE Sample name.
109-
--plot PLOT Path to LINX plot directory.
110-
--table TABLE Path to LINX table directory.
111-
--out OUT HTML output file name [def: linx_{sample}.html].
112-
--quiet Suppress log printing during rendering.
113-
11489
#-----------------------------------#
11590
#------- Cancer Report -------#
11691
gpgr.R canrep --help
11792
usage: gpgr.R canrep [-h] --af_global AF_GLOBAL --af_keygenes AF_KEYGENES
118-
--batch_name BATCH_NAME --conda_list CONDA_LIST --img_dir
119-
IMG_DIR --key_genes KEY_GENES --somatic_snv_summary
120-
SOMATIC_SNV_SUMMARY --somatic_snv_vcf SOMATIC_SNV_VCF
93+
--batch_name BATCH_NAME [--conda_list CONDA_LIST]
94+
--img_dir IMG_DIR --key_genes KEY_GENES --oncokb_genes
95+
ONCOKB_GENES --somatic_snv_vcf SOMATIC_SNV_VCF
96+
--somatic_snv_summary SOMATIC_SNV_SUMMARY
12197
--somatic_sv_tsv SOMATIC_SV_TSV --somatic_sv_vcf
12298
SOMATIC_SV_VCF --purple_som_gene_cnv PURPLE_SOM_GENE_CNV
123-
--purple_som_cnv PURPLE_SOM_CNV --purple_purity
124-
PURPLE_PURITY --purple_qc PURPLE_QC --purple_som_snv_vcf
125-
PURPLE_SOM_SNV_VCF --oncoviral_present_viruses
126-
ONCOVIRAL_PRESENT_VIRUSES --oncoviral_breakpoints_tsv
127-
ONCOVIRAL_BREAKPOINTS_TSV [--out_file OUT_FILE] [--quiet]
128-
--result_outdir RESULT_OUTDIR --tumor_name TUMOR_NAME
99+
--purple_som_cnv_ann PURPLE_SOM_CNV_ANN --purple_som_cnv
100+
PURPLE_SOM_CNV --purple_purity PURPLE_PURITY --purple_qc
101+
PURPLE_QC --purple_som_snv_vcf PURPLE_SOM_SNV_VCF
102+
--virusbreakend_tsv VIRUSBREAKEND_TSV --virusbreakend_vcf
103+
VIRUSBREAKEND_VCF --dragen_hrd DRAGEN_HRD
104+
--bcftools_stats BCFTOOLS_STATS [--out_file OUT_FILE]
105+
[--quiet] --result_outdir RESULT_OUTDIR --tumor_name
106+
TUMOR_NAME
129107

130108
options:
131109
-h, --help show this help message and exit
@@ -140,16 +118,21 @@ export PATH="${gpgr_cli}:${PATH}"
140118
--img_dir IMG_DIR Path to directory containing PURPLE plots.
141119
--key_genes KEY_GENES
142120
Path to UMCCR cancer gene file.
143-
--somatic_snv_summary SOMATIC_SNV_SUMMARY
144-
Path to `somatic_snv_summary.json`.
121+
--oncokb_genes ONCOKB_GENES
122+
Path to OncoKB database file.
145123
--somatic_snv_vcf SOMATIC_SNV_VCF
146124
Path to `somatic-PASS.vcf.gz` SNV VCF.
125+
--somatic_snv_summary SOMATIC_SNV_SUMMARY
126+
Path to `somatic_snv_summary.json` JSON.
147127
--somatic_sv_tsv SOMATIC_SV_TSV
148128
Path to `manta.tsv` TSV file.
149129
--somatic_sv_vcf SOMATIC_SV_VCF
150130
Path to `manta.vcf.gz` VCF file.
151131
--purple_som_gene_cnv PURPLE_SOM_GENE_CNV
152132
Path to `purple.cnv.gene.tsv`.
133+
--purple_som_cnv_ann PURPLE_SOM_CNV_ANN
134+
Path to annotated and prioritised
135+
`purple.cnv.somatic.tsv`.
153136
--purple_som_cnv PURPLE_SOM_CNV
154137
Path to `purple.cnv.somatic.tsv`.
155138
--purple_purity PURPLE_PURITY
@@ -158,10 +141,14 @@ export PATH="${gpgr_cli}:${PATH}"
158141
Path to `purple.qc`.
159142
--purple_som_snv_vcf PURPLE_SOM_SNV_VCF
160143
Path to `purple.somatic.vcf.gz`.
161-
--oncoviral_present_viruses ONCOVIRAL_PRESENT_VIRUSES
162-
Path to `oncoviruses/present_viruses.txt`.
163-
--oncoviral_breakpoints_tsv ONCOVIRAL_BREAKPOINTS_TSV
164-
Path to `oncoviruses/oncoviral_breakpoints.tsv`.
144+
--virusbreakend_tsv VIRUSBREAKEND_TSV
145+
Path to VIRUSBreakend summary file.
146+
--virusbreakend_vcf VIRUSBREAKEND_VCF
147+
Path to VIRUSBreakend VCF file.
148+
--dragen_hrd DRAGEN_HRD
149+
Path to DRAGEN HRD file
150+
--bcftools_stats BCFTOOLS_STATS
151+
Path to bcftools stats file
165152
--out_file OUT_FILE Path to output HTML file (needs '.html' suffix) [def:
166153
{tumor_name}_cancer_report.html].
167154
--quiet Suppress log printing during rendering.
+2-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
outs:
2-
- md5: b7e6e168bb07e3dc3bcab9934cda9094
3-
size: 482
2+
- md5: 37113a19fbacef8079824f7802f8ee4d
3+
size: 468
44
path: purple.purity.tsv
55
hash: md5

inst/extdata/purple/purple.qc.dvc

+2-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
outs:
2-
- md5: c10f44c2a7dc2b29cd2971efc94e0b0d
3-
size: 228
2+
- md5: 2ec1cbc0a2c173f8154de718e82afb5d
3+
size: 246
44
path: purple.qc
55
hash: md5

inst/extdata/ref/.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -1 +1,2 @@
11
/umccr_cancer_genes_v24.03.0.tsv
2+
/somatic_panel-v24.03.0.tsv
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
outs:
2+
- md5: 5ada82f5b399519a6ed34d5449a343f4
3+
size: 50539
4+
hash: md5
5+
path: somatic_panel-v24.03.0.tsv

0 commit comments

Comments
 (0)