Nie możesz wybrać więcej niż 25 tematów. Tematy muszą się zaczynać od litery lub cyfry, mogą zawierać myślniki ('-') i mogą mieć do 35 znaków.

VQSR.wdl 3.1KB

5 lat temu
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869
  # VQSR: two-pass variant quality score recalibration using the Sentieon driver.
  #
  # Pass 1 builds a SNP recalibration model (VarCal) on the input VCF and applies
  # it (ApplyVarCal). Pass 2 builds an INDEL model on the same input VCF and
  # applies it to the SNP-recalibrated VCF from pass 1. A plot is rendered for
  # each model. The only declared output is the VCF written by pass 2.
  task VQSR {
    # Installation prefix; the binary is invoked as <SENTIEON_INSTALL_DIR>/bin/sentieon.
    String SENTIEON_INSTALL_DIR
    # Reference FASTA file name, resolved relative to ref_dir.
    String fasta
    # Input VCF to recalibrate.
    File vcf
    # Not referenced in the command; presumably declared so the index is
    # localized next to vcf -- TODO confirm.
    File vcf_index
    # Directory that contains the reference FASTA.
    File ref_dir
    # Resource VCFs, passed verbatim to --resource.
    # NOTE(review): unlike fasta they are not prefixed with a directory, so they
    # are assumed to be paths that resolve inside the container -- confirm.
    String dbsnp
    String dbsnp_Mill
    String dbsnp_1000G_omni
    String dbsnp_hapmap
    String dbsnp_1000G_phase1
    # Prefix for every file this task writes.
    String sample
    String docker
    String cluster_config
    String disk_size

    command <<<
      set -o pipefail
      set -e
      # NOTE(review): the license server address is hard-coded; consider turning
      # it into a task input so the task can run against another server.
      export SENTIEON_LICENSE=192.168.0.55:8990

      sentieon="${SENTIEON_INSTALL_DIR}/bin/sentieon"
      reference="${ref_dir}/${fasta}"

      # ------------------------------ SNP pass ------------------------------
      resource_text="--resource ${dbsnp_1000G_phase1} \
        --resource_param 1000G,known=false,training=true,truth=false,prior=10.0 "
      resource_text="$resource_text --resource ${dbsnp_1000G_omni} \
        --resource_param omni,known=false,training=true,truth=true,prior=12.0 "
      resource_text="$resource_text --resource ${dbsnp} \
        --resource_param dbsnp,known=true,training=false,truth=false,prior=2.0 "
      resource_text="$resource_text --resource ${dbsnp_hapmap} \
        --resource_param hapmap,known=false,training=true,truth=true,prior=15.0"

      # Start from an empty string so a value inherited from the environment
      # cannot leak into the command line.
      annotate_text=""
      for annotation in DP QD FS SOR MQ MQRankSum ReadPosRankSum; do
        annotate_text="$annotate_text --annotation $annotation"
      done

      # resource_text and annotate_text are expanded unquoted on purpose: each
      # one holds several whitespace-separated arguments.
      "$sentieon" driver -r "$reference" --algo VarCal -v "${vcf}" \
        $resource_text $annotate_text \
        --var_type SNP \
        --plot_file "${sample}.vqsrSNP.hc.plotfile" \
        --tranches_file "${sample}.vqsrSNP.hc.tranches" \
        "${sample}.vqsrSNP.hc.recal"

      "$sentieon" driver -r "$reference" --algo ApplyVarCal -v "${vcf}" \
        --var_type SNP \
        --tranches_file "${sample}.vqsrSNP.hc.tranches" \
        --sensitivity 99.0 \
        --recal "${sample}.vqsrSNP.hc.recal" \
        "${sample}.vqsrSNP.hc.recaled.vcf.gz"

      "$sentieon" plot vqsr -o "${sample}.vqsrSNP.pdf" "${sample}.vqsrSNP.hc.plotfile"

      # ----------------------------- INDEL pass -----------------------------
      # Begin a fresh resource list. Appending to the SNP list would feed the
      # SNP training sets (and dbSNP a second time) into the INDEL model.
      resource_text="--resource ${dbsnp_Mill} \
        --resource_param Mills,known=false,training=true,truth=true,prior=12.0 "
      resource_text="$resource_text --resource ${dbsnp} \
        --resource_param dbsnp,known=true,training=false,truth=false,prior=2.0 "

      annotate_text=""
      for annotation in QD DP FS SOR MQ ReadPosRankSum; do
        annotate_text="$annotate_text --annotation $annotation"
      done

      "$sentieon" driver -r "$reference" --algo VarCal -v "${vcf}" \
        $resource_text $annotate_text \
        --var_type INDEL \
        --plot_file "${sample}.vqsrINDEL.hc.plotfile" \
        --max_gaussians 4 \
        --tranches_file "${sample}.vqsrINDEL.hc.tranches" \
        "${sample}.vqsrINDEL.hc.recal"

      # The INDEL model is applied on top of the SNP-recalibrated VCF, so the
      # result carries both recalibrations.
      "$sentieon" driver -r "$reference" --algo ApplyVarCal \
        -v "${sample}.vqsrSNP.hc.recaled.vcf.gz" \
        --var_type INDEL \
        --recal "${sample}.vqsrINDEL.hc.recal" \
        --tranches_file "${sample}.vqsrINDEL.hc.tranches" \
        --sensitivity 99.0 \
        "${sample}.vqsrSNPINDEL.hc.recaled.vcf.gz"

      "$sentieon" plot vqsr -o "${sample}.vqsrINDEL.VQSR.pdf" "${sample}.vqsrINDEL.hc.plotfile"
    >>>

    runtime {
      dockerTag:docker
      cluster: cluster_config
      systemDisk: "cloud_ssd 40"
      dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
      # VCF produced by the INDEL ApplyVarCal step (SNP + INDEL recalibrated).
      File filtered_vcf = "${sample}.vqsrSNPINDEL.hc.recaled.vcf.gz"
    }
  }