Nie możesz wybrać więcej niż 25 tematów. Tematy muszą się zaczynać od litery lub cyfry, mogą zawierać myślniki ('-') i mogą mieć do 35 znaków.

46 lines
1.4KB

  # Jaccard_Index
  #
  # Reduces a merged (g)VCF to a per-sample genotype table, splits the records
  # into single-base and non-single-base alleles, and runs the concordance
  # helper script on each subset.
  #
  # Inputs:
  #   merged_gvcf    - tab-separated VCF-like file with '##' meta-header lines.
  #   chromo         - prefix used for every file written by this task.
  #   docker         - container image passed to the runtime.
  #   cluster_config - value passed to the runtime `cluster` attribute.
  #   disk_size      - size inserted into the runtime `dataDisk` string.
  #
  # Outputs:
  #   genotype                 - ${chromo}.gt, the reduced genotype table.
  #   snv / indel              - header line + SNV rows / filtered indel rows.
  #   *_inter / *_union        - presumably written by library_concordance.py
  #                              from the given -prefix; confirm against script.
  task Jaccard_Index {
    File merged_gvcf
    String chromo
    String docker
    String cluster_config
    String disk_size

    command <<<
      # Drop meta-header lines (anchored so records that merely contain the
      # marker elsewhere are kept). On every line after the first remaining
      # one, keep only the first colon-separated subfield of columns 9..NF,
      # then keep columns 1,2,4,5 and 10 onward (CHROM, POS, REF, ALT and the
      # sample columns in the standard VCF layout).
      grep -v '^##' ${merged_gvcf} | awk '
        BEGIN { OFS = "\t" }
        NF > 2 && FNR > 1 {
          for ( i=9; i<=NF; i++ ) {
            split($i,a,":") ;$i = a[1];
          }
        }
        { print }
      ' | cut -f1,2,4,5,10- > ${chromo}.gt

      # Rows where both column 3 and column 4 are one character long go to the
      # SNV file; every other row (including the header line) goes to the
      # indel file.
      awk '{ if ((length($3) == 1) && (length($4) == 1)) { print } }' ${chromo}.gt > ${chromo}.gt.snv
      awk '{ if ((length($3) != 1) || (length($4) != 1)) { print } }' ${chromo}.gt > ${chromo}.gt.indel

      # Re-attach the first line of the genotype table as a header for the SNV rows.
      head -n1 ${chromo}.gt | cat - ${chromo}.gt.snv > ${chromo}.gt.snv.txt
      python /opt/library_concordance.py -i ${chromo}.gt.snv.txt -prefix ${chromo}.snv

      # NOTE(review): filter_indel_over_50.py is expected to write the
      # .indel.lessthan50bp.txt file consumed below - confirm against the script.
      python /opt/filter_indel_over_50.py -i ${chromo}.gt.indel -prefix ${chromo}
      head -n1 ${chromo}.gt | cat - ${chromo}.indel.lessthan50bp.txt > ${chromo}.gt.indel.txt
      python /opt/library_concordance.py -i ${chromo}.gt.indel.txt -prefix ${chromo}.indel
    >>>

    runtime {
      docker: docker
      cluster: cluster_config
      systemDisk: "cloud_ssd 40"
      dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
      File genotype = "${chromo}.gt"
      File snv = "${chromo}.gt.snv.txt"
      # The command writes the indel table to <chromo>.gt.indel.txt (mirroring
      # the SNV table); the path must match that file name.
      File indel = "${chromo}.gt.indel.txt"
      File snv_inter = "${chromo}.snv.inter.txt"
      File snv_union = "${chromo}.snv.union.txt"
      File indel_inter = "${chromo}.indel.inter.txt"
      File indel_union = "${chromo}.indel.union.txt"
    }
  }