Nie możesz wybrać więcej niż 25 tematów. Tematy muszą się zaczynać od litery lub cyfry, mogą zawierać myślniki ('-') i mogą mieć do 35 znaków.

71 lines
2.6KB

  task BQSR {
    # Base quality score recalibration of a realigned BAM.
    #
    # The command section runs three tools in order:
    #   1. `gatk BaseRecalibrator` -> <sample>_recal_data.table
    #   2. `gatk ApplyBQSR`        -> <sample>.sorted.deduped.realigned.recaled.bam
    #   3. `samtools index`        -> <sample>.sorted.deduped.realigned.recaled.bam.bai
    #
    # Inputs
    #   ref_dir / fasta        joined as <ref_dir>/<fasta> and passed to -R
    #   dbsnp_dir / dbsnp      joined and passed as the first --known-sites
    #   dbmills_dir / db_mills joined and passed as the second --known-sites
    #   realigned_bam          BAM passed to -I of both GATK steps
    #   realigned_bam_index    not referenced by the command; presumably declared
    #                          so the engine stages the index next to the BAM
    #                          (TODO confirm)
    #   docker                 value of the runtime `docker` key
    #   cluster_config         value of the runtime `cluster` key
    #   disk_size              spliced into the runtime `dataDisk` string
    #
    # Outputs
    #   recaled_bam            BAM written by ApplyBQSR
    #   recaled_bam_index      index written by `samtools index`

    File ref_dir
    File dbsnp_dir
    File dbmills_dir
    String fasta
    String dbsnp
    String db_mills
    File realigned_bam
    File realigned_bam_index
    # Sample name = BAM file name with the fixed pipeline suffix stripped.
    String sample = basename(realigned_bam,".sorted.deduped.realigned.bam")
    String docker
    String cluster_config
    String disk_size

    # ---- Disabled alternatives, kept for reference --------------------------
    # These lines are deliberately kept OUTSIDE the command section: in this
    # (draft-2 style) WDL, ${...} placeholders inside a command are expanded by
    # the engine even when they sit behind a shell '#', and SENTIEON_INSTALL_DIR
    # is not declared by this task.
    #
    # Sentieon implementation:
    #   export SENTIEON_LICENSE=192.168.0.55:8990
    #   nt=$(nproc)
    #   ${SENTIEON_INSTALL_DIR}/bin/sentieon driver -r ${ref_dir}/${fasta} -t $nt -i ${realigned_bam} --algo QualCal -k ${dbsnp_dir}/${dbsnp} -k ${dbmills_dir}/${db_mills} ${sample}_recal_data.table
    #   ${SENTIEON_INSTALL_DIR}/bin/sentieon driver -r ${ref_dir}/${fasta} -t $nt -i ${realigned_bam} -q ${sample}_recal_data.table --algo QualCal -k ${dbsnp_dir}/${dbsnp} -k ${dbmills_dir}/${db_mills} ${sample}_recal_data.table.post --algo ReadWriter ${sample}.sorted.deduped.realigned.recaled.bam
    #   ${SENTIEON_INSTALL_DIR}/bin/sentieon driver -t $nt --algo QualCal --plot --before ${sample}_recal_data.table --after ${sample}_recal_data.table.post ${sample}_recal_data.csv
    #   ${SENTIEON_INSTALL_DIR}/bin/sentieon plot QualCal -o ${sample}_bqsrreport.pdf ${sample}_recal_data.csv
    #
    # Post-recalibration table and before/after covariate report (GATK):
    #   gatk BaseRecalibrator \
    #     -R ${ref_dir}/${fasta} \
    #     -I ${sample}.sorted.deduped.realigned.recaled.bam \
    #     --known-sites ${dbsnp_dir}/${dbsnp} \
    #     --known-sites ${dbmills_dir}/${db_mills} \
    #     -O ${sample}_recal_data.table.post
    #   gatk AnalyzeCovariates \
    #     -before ${sample}_recal_data.table \
    #     -after ${sample}_recal_data.table.post \
    #     -csv ${sample}_recal_data.csv
    # -------------------------------------------------------------------------

    command <<<
      set -o pipefail
      set -e

      # Step 1: build the recalibration table from the two known-sites files.
      # Paths are double-quoted so whitespace in a staged path cannot split an argument.
      gatk BaseRecalibrator \
        -R "${ref_dir}/${fasta}" \
        -I "${realigned_bam}" \
        --known-sites "${dbsnp_dir}/${dbsnp}" \
        --known-sites "${dbmills_dir}/${db_mills}" \
        -O "${sample}_recal_data.table"

      # Step 2: apply the table to the input BAM.
      gatk ApplyBQSR \
        -R "${ref_dir}/${fasta}" \
        -I "${realigned_bam}" \
        -bqsr "${sample}_recal_data.table" \
        -O "${sample}.sorted.deduped.realigned.recaled.bam"

      # Step 3: write the .bam.bai index declared in the output section.
      samtools index -@ "$(nproc)" \
        -o "${sample}.sorted.deduped.realigned.recaled.bam.bai" \
        "${sample}.sorted.deduped.realigned.recaled.bam"
    >>>

    runtime {
      docker: docker
      cluster: cluster_config
      systemDisk: "cloud_ssd 40"
      dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
      # Outputs belonging to the disabled steps stay commented out with them.
      # File recal_table = "${sample}_recal_data.table"
      # File recal_post = "${sample}_recal_data.table.post"
      File recaled_bam = "${sample}.sorted.deduped.realigned.recaled.bam"
      File recaled_bam_index = "${sample}.sorted.deduped.realigned.recaled.bam.bai"
      # File recal_csv = "${sample}_recal_data.csv"
      # File bqsrreport_pdf = "${sample}_bqsrreport.pdf"
    }
  }