Skip to content

Commit ac22a9f

Browse files
authored
Merge pull request #122 from icgc-argo/payload-gen-variant-calling@0.5.0
[release]
2 parents 1066cd6 + 4ad9464 commit ac22a9f

8 files changed

Lines changed: 55 additions & 32 deletions

payload-gen-variant-calling/main.nf

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
/* this block is auto-generated based on info from pkg.json where */
2626
/* changes can be made if needed, do NOT modify this block manually */
2727
nextflow.enable.dsl = 2
28-
version = '0.4.0' // package version
28+
version = '0.5.0'
2929

3030
container = [
3131
'ghcr.io': 'ghcr.io/icgc-argo/data-processing-utility-tools.payload-gen-variant-calling'

payload-gen-variant-calling/main.py

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -33,21 +33,21 @@
3333

3434

3535
variant_type_to_data_type_etc = {
36-
'snv': ['Simple Nucleotide Variation', ['Raw SNV Calls', None], ['CaVEMan'], ['GATK:Mutect2']], # dataCategory, [dataType, data_subtype], analysis_tools
36+
'snv': ['Simple Nucleotide Variation', ['Raw SNV Calls', None], ['CaVEMan'], ['GATK:Mutect2']], # dataCategory, [dataType, data_subtypes], analysis_tools
3737
'indel': ['Simple Nucleotide Variation', ['Raw InDel Calls', None], ['Pindel'], ['GATK:Mutect2']],
3838
'cnv': ['Copy Number Variation', ['Raw CNV Calls', None], ['ASCAT']],
3939
'sv': ['Structural Variation', ['Raw SV Calls', None], ['BRASS']],
4040
'caveman-supplement': ['Simple Nucleotide Variation', ['SNV Supplement', None], ['CaVEMan']],
4141
'pindel-supplement': ['Simple Nucleotide Variation', ['InDel Supplement', None], ['Pindel']],
4242
'ascat-supplement': ['Copy Number Variation', ['CNV Supplement', None], ['ASCAT']],
4343
'brass-supplement': ['Structural Variation', ['SV Supplement', None], ['BRASS']],
44-
'timings-supplement': ['Quality Control Metrics', ['Analysis QC', 'Runtime Stats'], None, None],
45-
'bas_metrics': ['Quality Control Metrics', ['Aligned Reads QC', 'Alignment Metrics'], ['Sanger:bam_stats']],
46-
'contamination_metrics': ['Quality Control Metrics', ['Analysis QC', 'Cross Sample Contamination'], ['Sanger:verifyBamHomChk'], ['GATK:CalculateContamination']],
47-
'ascat_metrics': ['Quality Control Metrics', ['Analysis QC', 'Ploidy and Purity Estimation'], ['ASCAT']],
48-
'genotyped_gender_metrics': ['Quality Control Metrics', ['Analysis QC', 'Genotyping Stats'], ['Sanger:compareBamGenotypes']],
49-
'mutect_filtering_metrics': ['Quality Control Metrics', ['Analysis QC', 'Variant Filtering Stats'], [], ['GATK:FilterMutectCalls']],
50-
'mutect_callable_metrics': ['Quality Control Metrics', ['Analysis QC', 'Variant Callable Stats'], [], ['GATK:Mutect2']],
44+
'timings-supplement': ['Quality Control Metrics', ['Analysis QC', ['Runtime Stats']], None, None],
45+
'bas_metrics': ['Quality Control Metrics', ['Aligned Reads QC', ['Alignment Metrics']], ['Sanger:bam_stats']],
46+
'contamination_metrics': ['Quality Control Metrics', ['Analysis QC', ['Cross Sample Contamination']], ['Sanger:verifyBamHomChk'], ['GATK:CalculateContamination']],
47+
'ascat_metrics': ['Quality Control Metrics', ['Analysis QC', ['Ploidy', 'Tumour Purity']], ['ASCAT']],
48+
'genotyped_gender_metrics': ['Quality Control Metrics', ['Analysis QC', ['Genotyping Stats']], ['Sanger:compareBamGenotypes']],
49+
'mutect_filtering_metrics': ['Quality Control Metrics', ['Analysis QC', ['Variant Filtering Stats']], [], ['GATK:FilterMutectCalls']],
50+
'mutect_callable_metrics': ['Quality Control Metrics', ['Analysis QC', ['Variant Callable Stats']], [], ['GATK:Mutect2']],
5151
}
5252

5353
workflow_full_name = {
@@ -151,22 +151,22 @@ def get_files_info(file_to_upload, wf_short_name, wf_version, somatic_or_germli
151151

152152
file_info['info'] = {
153153
'data_category': variant_type_to_data_type_etc[variant_type][0],
154-
'data_subtype': None
154+
'data_subtypes': None
155155
}
156156

157157
extra_info = {}
158158
if new_fname.endswith('.vcf.gz'):
159159
file_info['dataType'] = variant_type_to_data_type_etc[variant_type][1][0]
160-
file_info['info']['data_subtype'] = variant_type_to_data_type_etc[variant_type][1][1]
160+
file_info['info']['data_subtypes'] = variant_type_to_data_type_etc[variant_type][1][1]
161161
elif new_fname.endswith('.vcf.gz.tbi'):
162162
file_info['dataType'] = 'VCF Index'
163163
elif new_fname.endswith('.tgz'):
164164
if new_fname.endswith('-supplement.tgz'):
165165
file_info['dataType'] = variant_type_to_data_type_etc[variant_type][1][0]
166-
file_info['info']['data_subtype'] = variant_type_to_data_type_etc[variant_type][1][1]
166+
file_info['info']['data_subtypes'] = variant_type_to_data_type_etc[variant_type][1][1]
167167
elif new_fname.endswith('_metrics.tgz'):
168168
file_info['dataType'] = variant_type_to_data_type_etc[variant_type][1][0]
169-
file_info['info']['data_subtype'] = variant_type_to_data_type_etc[variant_type][1][1]
169+
file_info['info']['data_subtypes'] = variant_type_to_data_type_etc[variant_type][1][1]
170170
else:
171171
sys.exit('Error: unknown file type "%s"' % file_to_upload)
172172

payload-gen-variant-calling/pkg.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
{
22
"name": "payload-gen-variant-calling",
3-
"version": "0.4.0",
3+
"version": "0.5.0",
44
"description": "A tool to generate SONG payloads for variant calling workflows",
55
"main": "main.nf",
66
"deprecated": false,
@@ -33,4 +33,4 @@
3333
"license": "GNU Affero General Public License v3",
3434
"bugReport": "https://github.com/icgc-argo/data-processing-utility-tools/issues",
3535
"homepage": "https://github.com/icgc-argo/data-processing-utility-tools#readme"
36-
}
36+
}

tests/data/1a7df8db-cb54-43e1-952f-3c458a14800a.variant_calling.payload.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@
3535
"fileAccess": "controlled",
3636
"info": {
3737
"data_category": "Simple Nucleotide Variation",
38-
"data_subtype": null,
38+
"data_subtypes": null,
3939
"analysis_tools": [
4040
"CaVEMan"
4141
]
@@ -50,7 +50,7 @@
5050
"fileAccess": "controlled",
5151
"info": {
5252
"data_category": "Simple Nucleotide Variation",
53-
"data_subtype": null,
53+
"data_subtypes": null,
5454
"analysis_tools": [
5555
"CaVEMan"
5656
]

tests/data/66f84b1e-dad1-4981-916e-07e62ff53410.variant_calling_supplement.payload.json

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,9 @@
3535
"fileAccess": "controlled",
3636
"info": {
3737
"data_category": "Quality Control Metrics",
38-
"data_subtype": "Runtime Stats",
38+
"data_subtypes": [
39+
"Runtime Stats"
40+
],
3941
"analysis_tools": null,
4042
"description": "Files contain timing information for different processing steps",
4143
"files": [
@@ -66,7 +68,7 @@
6668
"fileAccess": "controlled",
6769
"info": {
6870
"data_category": "Simple Nucleotide Variation",
69-
"data_subtype": null,
71+
"data_subtypes": null,
7072
"analysis_tools": [
7173
"CaVEMan"
7274
],
@@ -98,7 +100,7 @@
98100
"fileAccess": "controlled",
99101
"info": {
100102
"data_category": "Simple Nucleotide Variation",
101-
"data_subtype": null,
103+
"data_subtypes": null,
102104
"analysis_tools": [
103105
"Pindel"
104106
],

tests/data/735a4c34-c928-4f03-957b-fe808df68f63.qc_metrics.payload.json

Lines changed: 12 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,9 @@
3535
"fileAccess": "controlled",
3636
"info": {
3737
"data_category": "Quality Control Metrics",
38-
"data_subtype": "Cross Sample Contamination",
38+
"data_subtypes": [
39+
"Cross Sample Contamination"
40+
],
3941
"analysis_tools": [
4042
"GATK:CalculateContamination"
4143
],
@@ -61,7 +63,9 @@
6163
"fileAccess": "controlled",
6264
"info": {
6365
"data_category": "Quality Control Metrics",
64-
"data_subtype": "Cross Sample Contamination",
66+
"data_subtypes": [
67+
"Cross Sample Contamination"
68+
],
6569
"analysis_tools": [
6670
"GATK:CalculateContamination"
6771
],
@@ -87,7 +91,9 @@
8791
"fileAccess": "controlled",
8892
"info": {
8993
"data_category": "Quality Control Metrics",
90-
"data_subtype": "Variant Filtering Stats",
94+
"data_subtypes": [
95+
"Variant Filtering Stats"
96+
],
9197
"analysis_tools": [
9298
"GATK:FilterMutectCalls"
9399
],
@@ -162,7 +168,9 @@
162168
"fileAccess": "controlled",
163169
"info": {
164170
"data_category": "Quality Control Metrics",
165-
"data_subtype": "Variant Callable Stats",
171+
"data_subtypes": [
172+
"Variant Callable Stats"
173+
],
166174
"analysis_tools": [
167175
"GATK:Mutect2"
168176
],

tests/data/d354c4b2-db32-41f0-973f-db1306a99a84.qc_metrics.payload.json

Lines changed: 19 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,9 @@
3232
"fileAccess": "controlled",
3333
"info": {
3434
"data_category": "Quality Control Metrics",
35-
"data_subtype": "Cross Sample Contamination",
35+
"data_subtypes": [
36+
"Cross Sample Contamination"
37+
],
3638
"analysis_tools": [
3739
"Sanger:verifyBamHomChk"
3840
],
@@ -64,7 +66,9 @@
6466
"fileAccess": "controlled",
6567
"info": {
6668
"data_category": "Quality Control Metrics",
67-
"data_subtype": "Cross Sample Contamination",
69+
"data_subtypes": [
70+
"Cross Sample Contamination"
71+
],
6872
"analysis_tools": [
6973
"Sanger:verifyBamHomChk"
7074
],
@@ -96,7 +100,9 @@
96100
"fileAccess": "controlled",
97101
"info": {
98102
"data_category": "Quality Control Metrics",
99-
"data_subtype": "Alignment Metrics",
103+
"data_subtypes": [
104+
"Alignment Metrics"
105+
],
100106
"analysis_tools": [
101107
"Sanger:bam_stats"
102108
],
@@ -115,7 +121,9 @@
115121
"fileAccess": "controlled",
116122
"info": {
117123
"data_category": "Quality Control Metrics",
118-
"data_subtype": "Alignment Metrics",
124+
"data_subtypes": [
125+
"Alignment Metrics"
126+
],
119127
"analysis_tools": [
120128
"Sanger:bam_stats"
121129
],
@@ -134,7 +142,10 @@
134142
"fileAccess": "controlled",
135143
"info": {
136144
"data_category": "Quality Control Metrics",
137-
"data_subtype": "Ploidy and Purity Estimation",
145+
"data_subtypes": [
146+
"Ploidy",
147+
"Tumour Purity"
148+
],
138149
"analysis_tools": [
139150
"ASCAT"
140151
],
@@ -162,7 +173,9 @@
162173
"fileAccess": "controlled",
163174
"info": {
164175
"data_category": "Quality Control Metrics",
165-
"data_subtype": "Genotyping Stats",
176+
"data_subtypes": [
177+
"Genotyping Stats"
178+
],
166179
"analysis_tools": [
167180
"Sanger:compareBamGenotypes"
168181
],

tests/data/f7ca0bd4-53a7-4663-b7b6-1b3d414e0018.variant_calling.payload.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@
3535
"fileAccess": "controlled",
3636
"info": {
3737
"data_category": "Simple Nucleotide Variation",
38-
"data_subtype": null,
38+
"data_subtypes": null,
3939
"analysis_tools": [
4040
"GATK:Mutect2"
4141
]
@@ -50,7 +50,7 @@
5050
"fileAccess": "controlled",
5151
"info": {
5252
"data_category": "Simple Nucleotide Variation",
53-
"data_subtype": null,
53+
"data_subtypes": null,
5454
"analysis_tools": [
5555
"GATK:Mutect2"
5656
]

0 commit comments

Comments
 (0)