Annotation of genetic variants detected from human genome hg19 and hg38.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

53 lines
1.6KB

  1. task annovar {
  2. File vcf
  3. String basename = basename(vcf,".vcf")
  4. String hg
  5. File annovar_database
  6. String docker
  7. String cluster_config
  8. String disk_size
  9. command <<<
  10. set -o pipefail
  11. set -e
  12. nt=$(nproc)
  13. awk -F'\t' '{if(($1~"^#")||($1!~"^#" && $7=="PASS")){print $0}}' ${vcf} > ${basename}.PASS.vcf
  14. if [ ${hg} == "hg38" ]; then
  15. /installations/annovar/table_annovar.pl ${basename}.PASS.vcf \
  16. ${annovar_database} -buildver ${hg} \
  17. -out ${basename} -remove \
  18. #-protocol refGene,cytoBand,genomicSuperDups,ljb26_all,dbnsfp35c,intervar_20180118,cosmic70,exac03,gnomad211_exome,clinvar_20210501 \
  19. #-operation g,r,r,f,f,f,f,f,f,f \
  20. -protocol refGene,ensGene,knownGene,rmsk,esp6500siv2_all,1000g2015aug,avsnp147,dbnsfp33a,clinvar_20210501,gnomad_genome,dbscsnv11,dbnsfp31a_interpro \
  21. -operation g,g,g,r,f,f,f,f,f,f,f,f \
  22. -nastring . -vcfinput -thread $nt
  23. fi
  24. if [ ${hg} == "hg19" ]; then
  25. /installations/annovar/table_annovar.pl ${basename}.PASS.vcf \
  26. ${annovar_database} -buildver ${hg} \
  27. -out ${basename} -remove \
  28. -protocol refGene,cytoBand,genomicSuperDups,ljb26_all,snp138,cosmic78,intervar_20170202,popfreq_all_20150413,clinvar_20190305 \
  29. -operation g,r,r,f,f,f,f,f,f \
  30. -nastring . -vcfinput -thread $nt
  31. fi
  32. >>>
  33. runtime {
  34. docker: docker
  35. cluster: cluster_config
  36. systemDisk: "cloud_ssd 40"
  37. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  38. }
  39. output {
  40. File pass_vcf = "${basename}.PASS.vcf"
  41. File avinput = "${basename}.avinput"
  42. File multianno_txt = "${basename}.${hg}_multianno.txt"
  43. File multianno_vcf = "${basename}.${hg}_multianno.vcf"
  44. }
  45. }