You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

workflow.wdl 8.0KB

5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
4 vuotta sitten
5 vuotta sitten
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315
  1. import "./tasks/mapping.wdl" as mapping
  2. import "./tasks/Dedup.wdl" as Dedup
  3. import "./tasks/deduped_Metrics.wdl" as deduped_Metrics
  4. import "./tasks/sentieon.wdl" as sentieon
  5. import "./tasks/Realigner.wdl" as Realigner
  6. import "./tasks/BQSR.wdl" as BQSR
  7. import "./tasks/Haplotyper_gVCF.wdl" as Haplotyper_gVCF
  8. import "./tasks/GVCFtyper.wdl" as GVCFtyper
  9. import "./tasks/split_gvcf_files.wdl" as split_gvcf_files
  10. import "./tasks/benchmark.wdl" as benchmark
  11. import "./tasks/multiqc.wdl" as multiqc
  12. import "./tasks/merge_sentieon_metrics.wdl" as merge_sentieon_metrics
  13. import "./tasks/extract_tables.wdl" as extract_tables
  14. import "./tasks/mendelian.wdl" as mendelian
  15. import "./tasks/merge_mendelian.wdl" as merge_mendelian
  16. import "./tasks/quartet_mendelian.wdl" as quartet_mendelian
  17. import "./tasks/fastqc.wdl" as fastqc
  18. import "./tasks/fastqscreen.wdl" as fastqscreen
  19. import "./tasks/D5_D6.wdl" as D5_D6
  20. import "./tasks/merge_family.wdl" as merge_family
  21. workflow {{ project_name }} {
  22. File inputSamplesFile
  23. Array[Array[File]] inputSamples = read_tsv(inputSamplesFile)
  24. String SENTIEON_INSTALL_DIR
  25. String SENTIEON_LICENSE
  26. String SENTIEONdocker
  27. String FASTQCdocker
  28. String FASTQSCREENdocker
  29. String QUALIMAPdocker
  30. String BENCHMARKdocker
  31. String MENDELIANdocker
  32. String DIYdocker
  33. String MULTIQCdocker
  34. String fasta
  35. File ref_dir
  36. File dbmills_dir
  37. String db_mills
  38. File dbsnp_dir
  39. String dbsnp
  40. File sdf
  41. File screen_ref_dir
  42. File fastq_screen_conf
  43. File benchmarking_dir
  44. String project
  45. String disk_size
  46. String BIGcluster_config
  47. String SMALLcluster_config
  48. scatter (quartet in inputSamples){
  49. call mapping.mapping as mapping {
  50. input:
  51. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  52. SENTIEON_LICENSE=SENTIEON_LICENSE,
  53. group=quartet[2],
  54. sample=quartet[2],
  55. pl="ILLUMINAL",
  56. fasta=fasta,
  57. ref_dir=ref_dir,
  58. fastq_1=quartet[0],
  59. fastq_2=quartet[1],
  60. docker=SENTIEONdocker,
  61. disk_size=disk_size,
  62. cluster_config=BIGcluster_config
  63. }
  64. call fastqc.fastqc as fastqc {
  65. input:
  66. read1=quartet[0],
  67. read2=quartet[1],
  68. docker=FASTQCdocker,
  69. cluster_config=BIGcluster_config,
  70. disk_size=disk_size
  71. }
  72. call fastqscreen.fastq_screen as fastqscreen {
  73. input:
  74. read1=quartet[0],
  75. read2=quartet[1],
  76. screen_ref_dir=screen_ref_dir,
  77. fastq_screen_conf=fastq_screen_conf,
  78. docker=FASTQSCREENdocker,
  79. cluster_config=BIGcluster_config,
  80. disk_size=disk_size
  81. }
  82. call Dedup.Dedup as Dedup {
  83. input:
  84. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  85. sorted_bam=mapping.sorted_bam,
  86. sorted_bam_index=mapping.sorted_bam_index,
  87. sample=quartet[2],
  88. docker=SENTIEONdocker,
  89. disk_size=disk_size,
  90. cluster_config=BIGcluster_config
  91. }
  92. call deduped_Metrics.deduped_Metrics as deduped_Metrics {
  93. input:
  94. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  95. fasta=fasta,
  96. ref_dir=ref_dir,
  97. Dedup_bam=Dedup.Dedup_bam,
  98. Dedup_bam_index=Dedup.Dedup_bam_index,
  99. sample=quartet[2],
  100. docker=SENTIEONdocker,
  101. disk_size=disk_size,
  102. cluster_config=BIGcluster_config
  103. }
  104. call sentieon.sentieon as sentieon {
  105. input:
  106. quality_yield=deduped_Metrics.deduped_QualityYield,
  107. wgs_metrics_algo=deduped_Metrics.deduped_wgsmetrics,
  108. aln_metrics=deduped_Metrics.dedeuped_aln_metrics,
  109. is_metrics=deduped_Metrics.deduped_is_metrics,
  110. sample=quartet[2],
  111. docker=SENTIEONdocker,
  112. cluster_config=SMALLcluster_config,
  113. disk_size=disk_size
  114. }
  115. call Realigner.Realigner as Realigner {
  116. input:
  117. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  118. fasta=fasta,
  119. ref_dir=ref_dir,
  120. Dedup_bam=Dedup.Dedup_bam,
  121. Dedup_bam_index=Dedup.Dedup_bam_index,
  122. db_mills=db_mills,
  123. dbmills_dir=dbmills_dir,
  124. sample=quartet[2],
  125. docker=SENTIEONdocker,
  126. disk_size=disk_size,
  127. cluster_config=BIGcluster_config
  128. }
  129. call BQSR.BQSR as BQSR {
  130. input:
  131. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  132. fasta=fasta,
  133. ref_dir=ref_dir,
  134. realigned_bam=Realigner.realigner_bam,
  135. realigned_bam_index=Realigner.realigner_bam_index,
  136. db_mills=db_mills,
  137. dbmills_dir=dbmills_dir,
  138. dbsnp=dbsnp,
  139. dbsnp_dir=dbsnp_dir,
  140. sample=quartet[2],
  141. docker=SENTIEONdocker,
  142. disk_size=disk_size,
  143. cluster_config=BIGcluster_config
  144. }
  145. call Haplotyper_gVCF.Haplotyper_gVCF as Haplotyper_gVCF {
  146. input:
  147. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  148. fasta=fasta,
  149. ref_dir=ref_dir,
  150. recaled_bam=BQSR.recaled_bam,
  151. recaled_bam_index=BQSR.recaled_bam_index,
  152. sample=quartet[2],
  153. docker=SENTIEONdocker,
  154. disk_size=disk_size,
  155. cluster_config=BIGcluster_config
  156. }
  157. }
  158. call GVCFtyper.GVCFtyper as GVCFtyper {
  159. input:
  160. ref_dir=ref_dir,
  161. SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
  162. fasta=fasta,
  163. vcf=Haplotyper_gVCF.vcf,
  164. vcf_idx=Haplotyper_gVCF.vcf_idx,
  165. project=project,
  166. docker=SENTIEONdocker,
  167. cluster_config=BIGcluster_config,
  168. disk_size=disk_size
  169. }
  170. call split_gvcf_files.split_gvcf_files as split_gvcf_files {
  171. input:
  172. gvcf=GVCFtyper.gvcf,
  173. docker=DIYdocker,
  174. project=project,
  175. cluster_config=SMALLcluster_config,
  176. disk_size=disk_size
  177. }
  178. Array[File] single_gvcf = split_gvcf_files.splited_vcf
  179. scatter (idx in range(length(single_gvcf))) {
  180. call benchmark.benchmark as benchmark {
  181. input:
  182. vcf=single_gvcf[idx],
  183. benchmarking_dir=benchmarking_dir,
  184. sdf=sdf,
  185. project=project,
  186. docker=BENCHMARKdocker,
  187. cluster_config=BIGcluster_config,
  188. disk_size=disk_size,
  189. }
  190. }
  191. call multiqc.multiqc as multiqc {
  192. input:
  193. read1_zip=fastqc.read1_zip,
  194. read2_zip=fastqc.read2_zip,
  195. txt1=fastqscreen.txt1,
  196. txt2=fastqscreen.txt2,
  197. docker=MULTIQCdocker,
  198. cluster_config=SMALLcluster_config,
  199. disk_size=disk_size
  200. }
  201. call merge_sentieon_metrics.merge_sentieon_metrics as merge_sentieon_metrics {
  202. input:
  203. quality_yield_header=sentieon.quality_yield_header,
  204. wgs_metrics_algo_header=sentieon.wgs_metrics_algo_header,
  205. aln_metrics_header=sentieon.aln_metrics_header,
  206. is_metrics_header=sentieon.is_metrics_header,
  207. quality_yield_data=sentieon.quality_yield_data,
  208. wgs_metrics_algo_data=sentieon.wgs_metrics_algo_data,
  209. aln_metrics_data=sentieon.aln_metrics_data,
  210. is_metrics_data=sentieon.is_metrics_data,
  211. project=project,
  212. docker=MULTIQCdocker,
  213. cluster_config=SMALLcluster_config,
  214. disk_size=disk_size
  215. }
  216. call extract_tables.extract_tables as extract_tables {
  217. input:
  218. quality_yield_summary=merge_sentieon_metrics.quality_yield_summary,
  219. wgs_metrics_summary=merge_sentieon_metrics.wgs_metrics_summary,
  220. aln_metrics_summary=merge_sentieon_metrics.aln_metrics_summary,
  221. is_metrics_summary=merge_sentieon_metrics.is_metrics_summary,
  222. fastqc=multiqc.fastqc,
  223. fastqscreen=multiqc.fastqscreen,
  224. project=project,
  225. docker=DIYdocker,
  226. cluster_config=SMALLcluster_config,
  227. disk_size=disk_size
  228. }
  229. Boolean sister_tag = read_boolean(split_gvcf_files.sister_tag)
  230. Boolean quartet_tag = read_boolean(split_gvcf_files.quartet_tag)
  231. if (sister_tag) {
  232. call D5_D6.D5_D6 as D5_D6 {
  233. input:
  234. splited_vcf=split_gvcf_files.splited_vcf,
  235. project=project,
  236. docker=DIYdocker,
  237. cluster_config=SMALLcluster_config,
  238. disk_size=disk_size,
  239. }
  240. }
  241. if (quartet_tag) {
  242. call merge_family.merge_family as merge_family {
  243. input:
  244. splited_vcf=split_gvcf_files.splited_vcf,
  245. project=project,
  246. docker=DIYdocker,
  247. cluster_config=SMALLcluster_config,
  248. disk_size=disk_size,
  249. }
  250. Array[File] family_vcfs = merge_family.family_vcf
  251. scatter (idx in range(length(family_vcfs))) {
  252. call mendelian.mendelian as mendelian {
  253. input:
  254. family_vcf=family_vcfs[idx],
  255. ref_dir=ref_dir,
  256. fasta=fasta,
  257. docker=MENDELIANdocker,
  258. cluster_config=BIGcluster_config,
  259. disk_size=disk_size
  260. }
  261. call merge_mendelian.merge_mendelian as merge_mendelian {
  262. input:
  263. D5_trio_vcf=mendelian.D5_trio_vcf,
  264. D6_trio_vcf=mendelian.D6_trio_vcf,
  265. family_vcf=family_vcfs[idx],
  266. docker=DIYdocker,
  267. cluster_config=SMALLcluster_config,
  268. disk_size=disk_size
  269. }
  270. }
  271. call quartet_mendelian.quartet_mendelian as quartet_mendelian {
  272. input:
  273. project_mendelian_summary=merge_mendelian.project_mendelian_summary,
  274. project=project,
  275. docker=DIYdocker,
  276. cluster_config=SMALLcluster_config,
  277. disk_size=disk_size
  278. }
  279. }
  280. }