Nevar pievienot vairāk kā 25 tēmas. Tēmai ir jāsākas ar burtu vai ciparu, tā var saturēt domu zīmes ('-') un var būt līdz 35 simboliem gara.

314 rindas
8.0KB

  1. import "./tasks/mapping.wdl" as mapping
  2. import "./tasks/Dedup.wdl" as Dedup
  3. import "./tasks/qualimap.wdl" as qualimap
  4. import "./tasks/deduped_Metrics.wdl" as deduped_Metrics
  5. import "./tasks/sentieon.wdl" as sentieon
  6. import "./tasks/Realigner.wdl" as Realigner
  7. import "./tasks/BQSR.wdl" as BQSR
  8. import "./tasks/Haplotyper_gVCF.wdl" as Haplotyper_gVCF
  9. import "./tasks/GVCFtyper.wdl" as GVCFtyper
  10. import "./tasks/split_gvcf_files.wdl" as split_gvcf_files
  11. import "./tasks/benchmark.wdl" as benchmark
  12. import "./tasks/merge_sentieon_metrics.wdl" as merge_sentieon_metrics
  13. import "./tasks/extract_tables.wdl" as extract_tables
  14. import "./tasks/mendelian.wdl" as mendelian
  15. import "./tasks/merge_mendelian.wdl" as merge_mendelian
  16. import "./tasks/quartet_mendelian.wdl" as quartet_mendelian
  17. import "./tasks/fastqc.wdl" as fastqc
  18. import "./tasks/fastqscreen.wdl" as fastqscreen
  19. import "./tasks/D5_D6.wdl" as D5_D6
  20. import "./tasks/merge_family.wdl" as merge_family
  # Workflow overview (stage names follow the imported task aliases; what each
  # task actually does is defined in ./tasks/*.wdl, not in this file):
  #   1. Scatter over the rows of the samples table and, per row, call
  #      mapping, fastqc, fastq_screen, Dedup, qualimap, deduped_Metrics,
  #      sentieon, Realigner, BQSR and Haplotyper_gVCF.
  #   2. Feed the gathered Haplotyper_gVCF outputs to GVCFtyper, then split the
  #      result with split_gvcf_files.
  #   3. Scatter benchmark over the split VCFs.
  #   4. Merge the per-row sentieon metrics and extract summary tables.
  #   5. Conditionally run D5_D6 (sister_tag) and the merge_family / mendelian /
  #      merge_mendelian / quartet_mendelian chain (quartet_tag).
  #
  # `{{ project_name }}` is a template placeholder, not WDL syntax; it must be
  # rendered to a concrete identifier before this file is parsed.
  #
  # NOTE(review): no `version` statement and bare workflow-level declarations,
  # so this looks like WDL draft-2 -- confirm before porting to 1.0+.
  workflow {{ project_name }} {
    # Samples table: read with read_tsv; each row is used below as
    #   row[0] -> fastq_1 / read1, row[1] -> fastq_2 / read2,
    #   row[2] -> sample and read group.
    File inputSamplesFile
    Array[Array[File]] inputSamples = read_tsv(inputSamplesFile)

    # Sentieon installation / licence settings forwarded to the tasks.
    String SENTIEON_INSTALL_DIR
    String SENTIEON_LICENSE

    # One docker value per tool family, passed as `docker=` to the calls.
    String SENTIEONdocker
    String FASTQCdocker
    String FASTQSCREENdocker
    String QUALIMAPdocker
    String BENCHMARKdocker
    String MENDELIANdocker
    String DIYdocker
    String MULTIQCdocker

    # Reference and known-sites resources (a directory File plus a name String).
    String fasta
    File ref_dir
    File dbmills_dir
    String db_mills
    File dbsnp_dir
    String dbsnp
    File screen_ref_dir
    File fastq_screen_conf
    File benchmarking_dir

    # Project label and runtime sizing forwarded to the tasks.
    String project
    String disk_size
    String BIGcluster_config
    String SMALLcluster_config

    # ---- Per-row processing -------------------------------------------------
    scatter (quartet in inputSamples) {
      call mapping.mapping as mapping {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          SENTIEON_LICENSE=SENTIEON_LICENSE,
          # Group and sample both come from the third TSV column.
          group=quartet[2],
          sample=quartet[2],
          # Fixed: was "ILLUMINAL", which is not a platform value defined by
          # the SAM specification. Presumably this ends up in the @RG PL tag
          # inside the mapping task -- confirm against tasks/mapping.wdl.
          pl="ILLUMINA",
          fasta=fasta,
          ref_dir=ref_dir,
          fastq_1=quartet[0],
          fastq_2=quartet[1],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      call fastqc.fastqc as fastqc {
        input:
          read1=quartet[0],
          read2=quartet[1],
          docker=FASTQCdocker,
          cluster_config=BIGcluster_config,
          disk_size=disk_size
      }

      call fastqscreen.fastq_screen as fastqscreen {
        input:
          read1=quartet[0],
          read2=quartet[1],
          screen_ref_dir=screen_ref_dir,
          fastq_screen_conf=fastq_screen_conf,
          docker=FASTQSCREENdocker,
          cluster_config=BIGcluster_config,
          disk_size=disk_size
      }

      # Consumes the sorted BAM and index produced by the mapping call.
      call Dedup.Dedup as Dedup {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          sorted_bam=mapping.sorted_bam,
          sorted_bam_index=mapping.sorted_bam_index,
          sample=quartet[2],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      # qualimap, deduped_Metrics and Realigner all read the Dedup BAM/index.
      call qualimap.qualimap as qualimap {
        input:
          bam=Dedup.Dedup_bam,
          bai=Dedup.Dedup_bam_index,
          docker=QUALIMAPdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      call deduped_Metrics.deduped_Metrics as deduped_Metrics {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          fasta=fasta,
          ref_dir=ref_dir,
          Dedup_bam=Dedup.Dedup_bam,
          Dedup_bam_index=Dedup.Dedup_bam_index,
          sample=quartet[2],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      call sentieon.sentieon as sentieon {
        input:
          quality_yield=deduped_Metrics.deduped_QualityYield,
          wgs_metrics_algo=deduped_Metrics.deduped_wgsmetrics,
          # NOTE(review): "dedeuped" is spelled this way here; it must match the
          # output name declared in tasks/deduped_Metrics.wdl, so it is left
          # untouched -- rename in both places together if it is a typo.
          aln_metrics=deduped_Metrics.dedeuped_aln_metrics,
          is_metrics=deduped_Metrics.deduped_is_metrics,
          sample=quartet[2],
          docker=SENTIEONdocker,
          cluster_config=SMALLcluster_config,
          disk_size=disk_size
      }

      call Realigner.Realigner as Realigner {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          fasta=fasta,
          ref_dir=ref_dir,
          Dedup_bam=Dedup.Dedup_bam,
          Dedup_bam_index=Dedup.Dedup_bam_index,
          db_mills=db_mills,
          dbmills_dir=dbmills_dir,
          sample=quartet[2],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      # Consumes the Realigner BAM/index plus both known-sites resources.
      call BQSR.BQSR as BQSR {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          fasta=fasta,
          ref_dir=ref_dir,
          realigned_bam=Realigner.realigner_bam,
          realigned_bam_index=Realigner.realigner_bam_index,
          db_mills=db_mills,
          dbmills_dir=dbmills_dir,
          dbsnp=dbsnp,
          dbsnp_dir=dbsnp_dir,
          sample=quartet[2],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }

      # Consumes the BQSR BAM/index.
      call Haplotyper_gVCF.Haplotyper_gVCF as Haplotyper_gVCF {
        input:
          SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
          fasta=fasta,
          ref_dir=ref_dir,
          recaled_bam=BQSR.recaled_bam,
          recaled_bam_index=BQSR.recaled_bam_index,
          sample=quartet[2],
          docker=SENTIEONdocker,
          disk_size=disk_size,
          cluster_config=BIGcluster_config
      }
    }

    # ---- Project-level genotyping ------------------------------------------
    # Outside the scatter, Haplotyper_gVCF.vcf / vcf_idx are the gathered
    # per-row outputs (one element per row of the samples table).
    call GVCFtyper.GVCFtyper as GVCFtyper {
      input:
        ref_dir=ref_dir,
        SENTIEON_INSTALL_DIR=SENTIEON_INSTALL_DIR,
        fasta=fasta,
        vcf=Haplotyper_gVCF.vcf,
        vcf_idx=Haplotyper_gVCF.vcf_idx,
        project=project,
        docker=SENTIEONdocker,
        cluster_config=BIGcluster_config,
        disk_size=disk_size
    }

    call split_gvcf_files.split_gvcf_files as split_gvcf_files {
      input:
        gvcf=GVCFtyper.gvcf,
        docker=DIYdocker,
        project=project,
        cluster_config=SMALLcluster_config,
        disk_size=disk_size
    }

    # ---- Benchmark each split VCF ------------------------------------------
    Array[File] single_gvcf = split_gvcf_files.splited_vcf

    scatter (idx in range(length(single_gvcf))) {
      call benchmark.benchmark as benchmark {
        input:
          vcf=single_gvcf[idx],
          benchmarking_dir=benchmarking_dir,
          ref_dir=ref_dir,
          fasta=fasta,
          docker=BENCHMARKdocker,
          cluster_config=BIGcluster_config,
          disk_size=disk_size
      }
    }

    # ---- Metrics merging and table extraction ------------------------------
    # All sentieon.* inputs here are the gathered outputs of the per-row scatter.
    call merge_sentieon_metrics.merge_sentieon_metrics as merge_sentieon_metrics {
      input:
        quality_yield_header=sentieon.quality_yield_header,
        wgs_metrics_algo_header=sentieon.wgs_metrics_algo_header,
        aln_metrics_header=sentieon.aln_metrics_header,
        is_metrics_header=sentieon.is_metrics_header,
        quality_yield_data=sentieon.quality_yield_data,
        wgs_metrics_algo_data=sentieon.wgs_metrics_algo_data,
        aln_metrics_data=sentieon.aln_metrics_data,
        is_metrics_data=sentieon.is_metrics_data,
        project=project,
        docker=MULTIQCdocker,
        cluster_config=SMALLcluster_config,
        disk_size=disk_size
    }

    call extract_tables.extract_tables as extract_tables {
      input:
        quality_yield_summary=merge_sentieon_metrics.quality_yield_summary,
        wgs_metrics_summary=merge_sentieon_metrics.wgs_metrics_summary,
        aln_metrics_summary=merge_sentieon_metrics.aln_metrics_summary,
        is_metrics_summary=merge_sentieon_metrics.is_metrics_summary,
        # NOTE(review): `multiqc` is neither imported nor called in the visible
        # part of this file, so these three references cannot resolve as
        # written. A multiqc call (and its import) has to be added; its task
        # interface is not visible here, so it is not guessed at.
        fastqc=multiqc.fastqc,
        fastqscreen=multiqc.fastqscreen,
        hap=multiqc.hap,
        project=project,
        docker=DIYdocker,
        cluster_config=SMALLcluster_config,
        disk_size=disk_size
    }

    # ---- Conditional family analysis ---------------------------------------
    # Both flags are parsed from files emitted by split_gvcf_files.
    Boolean sister_tag = read_boolean(split_gvcf_files.sister_tag)
    Boolean quartet_tag = read_boolean(split_gvcf_files.quartet_tag)

    if (sister_tag) {
      call D5_D6.D5_D6 as D5_D6 {
        input:
          splited_vcf=split_gvcf_files.splited_vcf,
          project=project,
          docker=DIYdocker,
          cluster_config=SMALLcluster_config,
          # Trailing comma after the last input removed, matching every other
          # call in this workflow.
          disk_size=disk_size
      }
    }

    if (quartet_tag) {
      call merge_family.merge_family as merge_family {
        input:
          splited_vcf=split_gvcf_files.splited_vcf,
          project=project,
          docker=DIYdocker,
          cluster_config=SMALLcluster_config,
          # Trailing comma after the last input removed (see D5_D6 above for
          # the same change).
          disk_size=disk_size
      }

      Array[File] family_vcfs = merge_family.family_vcf

      # Per family VCF: run mendelian, then merge its two trio outputs.
      scatter (idx in range(length(family_vcfs))) {
        call mendelian.mendelian as mendelian {
          input:
            family_vcf=family_vcfs[idx],
            ref_dir=ref_dir,
            fasta=fasta,
            docker=MENDELIANdocker,
            cluster_config=BIGcluster_config,
            disk_size=disk_size
        }

        call merge_mendelian.merge_mendelian as merge_mendelian {
          input:
            D5_trio_vcf=mendelian.D5_trio_vcf,
            D6_trio_vcf=mendelian.D6_trio_vcf,
            family_vcf=family_vcfs[idx],
            docker=DIYdocker,
            cluster_config=SMALLcluster_config,
            disk_size=disk_size
        }
      }

      # Outside the scatter, merge_mendelian.project_mendelian_summary is the
      # gathered array of per-family summaries.
      call quartet_mendelian.quartet_mendelian as quartet_mendelian {
        input:
          project_mendelian_summary=merge_mendelian.project_mendelian_summary,
          project=project,
          docker=DIYdocker,
          cluster_config=SMALLcluster_config,
          disk_size=disk_size
      }
    }
  }