Germline & Somatic short variant discovery (SNVs + Indels) for WGS & WES.
Nelze vybrat více než 25 témat. Téma musí začínat písmenem nebo číslem, může obsahovat pomlčky („-“) a může být dlouhé až 35 znaků.

93 lines
2.5KB

  # TNseq: runs the Sentieon driver twice to produce a raw and a filtered
  # somatic VCF for one sample.
  #
  #   Pass 1: TNhaplotyper2 + OrientationBias + ContaminationModel
  #   Pass 2: TNfilter, consuming the three outputs of pass 1
  #
  # Mode selection:
  #   * normal_recaled_bam supplied  -> tumor/normal mode, files tagged "TN"
  #   * normal_recaled_bam omitted   -> tumor-only mode,   files tagged "T"
  #
  # Inputs:
  #   sample                    prefix used for every output file name
  #   SENTIEON_INSTALL_DIR      directory that contains bin/sentieon
  #   SENTIEON_LICENSE          exported verbatim as $SENTIEON_LICENSE
  #   tumor_recaled_bam(+index) tumor alignment; the index is declared only so
  #                             that it is localized next to the BAM
  #   normal_recaled_bam(+index) optional matched-normal alignment
  #   tumor_name / normal_name  sample names passed to --tumor_sample /
  #                             --normal_sample (normal_name is ignored in
  #                             tumor-only mode)
  #   ref_dir, fasta            reference is read from ref_dir/fasta
  #   germline_resource(+tbi)   VCF passed to --germline_vcf and to
  #                             ContaminationModel --vcf
  #   regions                   optional interval file (--interval)
  #   interval_padding          optional padding; only used together with regions
  #   pon_vcf                   optional panel of normals (--pon); it is indexed
  #                             with "sentieon util vcfindex" before use
  #   docker, cluster_config, disk_size   runtime settings
  task TNseq {
    String sample
    String SENTIEON_INSTALL_DIR
    String SENTIEON_LICENSE

    File tumor_recaled_bam
    File tumor_recaled_bam_index
    File? normal_recaled_bam
    File? normal_recaled_bam_index
    String tumor_name
    String normal_name

    File ref_dir
    String fasta
    File germline_resource
    File germline_resource_tbi
    File? regions
    Int? interval_padding
    File? pon_vcf

    String docker
    String cluster_config
    String disk_size

    # The mode tag must be a WDL value (not only a shell variable) because the
    # output section below interpolates it into the expected file names.
    String typ = if defined(normal_recaled_bam) then "TN" else "T"

    command <<<
      set -o pipefail
      set -e
      export SENTIEON_LICENSE=${SENTIEON_LICENSE}
      nt=$(nproc)

      # Optional placeholders render as an empty string when the input is
      # not supplied, so -n is a safe "was it provided?" test.
      if [ -n "${regions}" ]; then
        # The padding flag is emitted only when a padding value exists;
        # otherwise a bare flag would swallow the next driver argument.
        INTERVAL="--interval ${regions} ${'--interval_padding ' + interval_padding}"
      else
        INTERVAL=""
      fi

      if [ -n "${pon_vcf}" ]; then
        PON="--pon ${pon_vcf}"
        ${SENTIEON_INSTALL_DIR}/bin/sentieon util vcfindex ${pon_vcf}
      else
        PON=""
      fi

      if [ -n "${normal_recaled_bam}" ]; then
        INPUT="-i ${tumor_recaled_bam} -i ${normal_recaled_bam}"
        SAMPLE="--tumor_sample ${tumor_name} --normal_sample ${normal_name}"
      else
        INPUT="-i ${tumor_recaled_bam}"
        SAMPLE="--tumor_sample ${tumor_name}"
      fi

      # Pass 1: variant calling plus the orientation-bias and contamination
      # models that the filter step needs.
      ${SENTIEON_INSTALL_DIR}/bin/sentieon driver -t $nt -r ${ref_dir}/${fasta} \
        $INPUT $INTERVAL \
        --algo TNhaplotyper2 $SAMPLE \
        --germline_vcf ${germline_resource} \
        $PON \
        ${sample}.TNseq.${typ}.vcf \
        --algo OrientationBias --tumor_sample ${tumor_name} \
        ${sample}.orientation \
        --algo ContaminationModel $SAMPLE \
        --vcf ${germline_resource} \
        --tumor_segments ${sample}.contamination.segments \
        ${sample}.contamination

      # Pass 2: filter the raw calls using the models from pass 1.
      ${SENTIEON_INSTALL_DIR}/bin/sentieon driver -t $nt \
        -r ${ref_dir}/${fasta} \
        --algo TNfilter $SAMPLE \
        -v ${sample}.TNseq.${typ}.vcf \
        --contamination ${sample}.contamination \
        --tumor_segments ${sample}.contamination.segments \
        --orientation_priors ${sample}.orientation \
        ${sample}.TNseq.${typ}.filter.vcf
    >>>

    runtime {
      docker: docker
      cluster: cluster_config
      systemDisk: "cloud_ssd 40"
      dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
      File TNseq_filter_vcf = "${sample}.TNseq.${typ}.filter.vcf"
      File TNseq_filter_vcf_index = "${sample}.TNseq.${typ}.filter.vcf.idx"
      File TNseq_vcf = "${sample}.TNseq.${typ}.vcf"
      File TNseq_vcf_index = "${sample}.TNseq.${typ}.vcf.idx"
      File contamination = "${sample}.contamination"
      File contamination_segments = "${sample}.contamination.segments"
      File orientation = "${sample}.orientation"
    }
  }