-
Notifications
You must be signed in to change notification settings - Fork 428
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Joint Germline subworkflow haplotypecaller -> Vqsr #595
Changes from 7 commits
19e5e0e
cd8d767
03909c9
c22a64f
028ad1a
57c2dff
ea8dd93
d6cc403
b78ad1c
37aa902
d49a5ac
d574b0c
dd7445f
06c66ad
8686dfb
f9fcb65
6e5e8dd
9a29759
aa110ab
fa41fa0
17924d0
50de0de
7947ce0
3463c56
1c48729
b835c37
d45423f
ed5ccea
3de8f7f
b2fd565
bfaf48d
cb25481
8fd7ff9
4eac972
ced2398
66a7f00
0ea9747
0717286
37e5e77
1db8bc8
ff6b530
aa7127a
5be916a
21182a3
9eebd71
69feebd
20a7e2e
3cbe260
e9fb076
6ea35cc
8d7235d
13f9bd7
e75a7f3
fb7c594
04b3191
9e31397
fc0c251
2e9a724
748947d
7e3a11e
77eb3d6
3fe7927
acb9fce
c793d5f
87f3405
ef8f526
72b4bc8
e5b1703
d6c006e
c94e00b
0dd0976
717e271
da17db9
4b9bd9f
9bae10f
b77a116
468dedb
e919d09
46bc423
f057709
4d50caf
c707f7c
ac0a1f5
a6d6e9a
7f5a916
1fc9e2a
d842fe0
73e84db
9fa1a5c
b0c32c7
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -18,6 +18,7 @@ params { | |
chr_dir = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Sequence/Chromosomes" | ||
dbsnp = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/dbsnp_138.b37.vcf" | ||
dbsnp_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/dbsnp_138.b37.vcf.idx" | ||
dbsnp_vqsr = 'dbsnp,known=false,training=true,truth=false,prior=2 dbsnp_138.b37.vcf' | ||
dict = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Sequence/WholeGenomeFasta/human_g1k_v37_decoy.dict" | ||
fasta = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Sequence/WholeGenomeFasta/human_g1k_v37_decoy.fasta" | ||
fasta_fai = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Sequence/WholeGenomeFasta/human_g1k_v37_decoy.fasta.fai" | ||
|
@@ -26,12 +27,30 @@ params { | |
intervals = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/intervals/wgs_calling_regions_Sarek.list" | ||
known_indels = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/{1000G_phase1,Mills_and_1000G_gold_standard}.indels.b37.vcf" | ||
known_indels_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/{1000G_phase1,Mills_and_1000G_gold_standard}.indels.b37.vcf.idx" | ||
known_indels_mills_vqsr = 'mills,known=false,training=true,truth=true,prior=12 Mills_and_1000G_gold_standard.indels.b37.vcf' | ||
known_indels_1000g_vqsr = '1000G,known=false,training=true,truth=true,prior=10 1000G_phase1.indels.b37.vcf' | ||
mappability = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/Control-FREEC/out100m2_hg19.gem" | ||
res_1000g = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/1000G_phase1.snps.high_confidence.b37.vcf.gz" | ||
res_1000g_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh37/Annotation/GATKBundle/1000G_phase1.snps.high_confidence.b37.vcf.idx.gz" | ||
res_1000g_vqsr = '1000G,known=false,training=true,truth=true,prior=10 1000G_phase1.snps.high_confidence.b37.vcf.gz' | ||
snpeff_db = 'GRCh37.75' | ||
snpeff_genome = 'GRCh37' | ||
vep_cache_version = 104 | ||
vep_genome = 'GRCh37' | ||
vep_species = 'homo_sapiens' | ||
|
||
// resources for GATK joint germline variant recalibration | ||
RESOURCE_SNP = [ | ||
[ res_1000g, dbsnp ], | ||
[ res_1000g, dbsnp_tbi ], | ||
[ res_1000g_vqsr, dbsnp_vqsr ] | ||
] | ||
resource_INDEL = [ | ||
[ known_indels, dbsnp ], | ||
[ known_indels_tbi, dbsnp_tbi ], | ||
[ known_indels_mills_vqsr, known_indels_1000g_vqsr, dbsnp_vqsr ] | ||
] | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I like that, but I feel like it should be done in the sarek script or in the joint germline variant calling workflow instead There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I would then have to use less descriptive names as for hg19 and hg38 the files are slightly different. So the naming convention has to match regardless of the genome There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. what about something like |
||
|
||
} | ||
'GATK.GRCh38' { | ||
ac_loci = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/ASCAT/1000G_phase3_GRCh38_maf0.3.loci" | ||
|
@@ -42,6 +61,7 @@ params { | |
chr_dir = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Sequence/Chromosomes" | ||
dbsnp = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/dbsnp_146.hg38.vcf.gz" | ||
dbsnp_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/dbsnp_146.hg38.vcf.gz.tbi" | ||
dbsnp_vqsr = 'dbsnp,known=false,training=true,truth=false,prior=2 dbsnp_146.hg38.vcf.gz' | ||
dict = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Sequence/WholeGenomeFasta/Homo_sapiens_assembly38.dict" | ||
fasta = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Sequence/WholeGenomeFasta/Homo_sapiens_assembly38.fasta" | ||
fasta_fai = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Sequence/WholeGenomeFasta/Homo_sapiens_assembly38.fasta.fai" | ||
|
@@ -50,14 +70,31 @@ params { | |
intervals = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/intervals/wgs_calling_regions.hg38.bed" | ||
known_indels = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/{Mills_and_1000G_gold_standard.indels.hg38,beta/Homo_sapiens_assembly38.known_indels}.vcf.gz" | ||
known_indels_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/{Mills_and_1000G_gold_standard.indels.hg38,beta/Homo_sapiens_assembly38.known_indels}.vcf.gz.tbi" | ||
known_indels_mills_vqsr = 'mills,known=false,training=true,truth=true,prior=12 Mills_and_1000G_gold_standard.indels.hg38.vcf.gz' | ||
known_indels_gatk_vqsr = 'gatk,known=false,training=true,truth=true,prior=10 Homo_sapiens_assembly38.known_indels.vcf.gz' | ||
mappability = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/Control-FREEC/out100m2_hg38.gem" | ||
pon = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/1000g_pon.hg38.vcf.gz" | ||
pon_tbi = "${params.igenomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/1000g_pon.hg38.vcf.gz.tbi" | ||
res_1000g_omni = "${params.genomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/1000G_omni2.5.hg38.vcf.gz" | ||
res_1000g_omni_tbi = "${params.genomes_base}/Homo_sapiens/GATK/GRCh38/Annotation/GATKBundle/1000G_omni2.5.hg38.vcf.gz.tbi" | ||
res_1000g_omni_vqsr = 'omni,known=false,training=true,truth=false,prior=12.0 1000G_omni2.5.hg38.vcf.gz' | ||
snpeff_db = 'GRCh38.99' | ||
snpeff_genome = 'GRCh38' | ||
vep_cache_version = 104 | ||
vep_genome = 'GRCh38' | ||
vep_species = 'homo_sapiens' | ||
|
||
nickhsmith marked this conversation as resolved.
Show resolved
Hide resolved
|
||
// resources for GATK joint germline variant recalibration | ||
resource_SNP = [ | ||
[ res_1000g_omni, dbsnp ], | ||
[ res_1000g_omni, dbsnp_tbi ], | ||
[ res_1000g_omni_vqsr, dbsnp_vqsr ] | ||
] | ||
resource_INDEL = [ | ||
[ known_indels, dbsnp ], | ||
[ known_indels_tbi, dbsnp_tbi ], | ||
[ known_indels_mills_vqsr, known_indels_gatk_vqsr, dbsnp_vqsr ] | ||
] | ||
} | ||
'Ensembl.GRCh37' { | ||
bwa = "${params.igenomes_base}/Homo_sapiens/Ensembl/GRCh37/Sequence/BWAIndex/version0.6.0/" | ||
|
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I'd prefer having args in the modules.config, and avoiding adding extra files in igenomes.config
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
that doesn't fit with the nf-core/module styling as this is expected to be an inputted value