您最多选择25个主题 主题必须以字母或数字开头,可以包含连字符 (-),并且长度不得超过35个字符

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768
  1. task split_file {
  2. File D5_trio_raw_vcf
  3. File D6_trio_raw_vcf
  4. File family_raw_vcf
  5. File high_confidence_bed
  6. String family_name
  7. String docker
  8. String cluster_config
  9. String disk_size
  10. command <<<
  11. cat ${D5_trio_raw_vcf} | grep '#CHROM' > D5.header
  12. cat ${D6_trio_raw_vcf} | grep '#CHROM' > D6.header
  13. cat ${family_raw_vcf} | grep '#CHROM' > family.header
  14. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${D5_trio_raw_vcf} -b ${high_confidence_bed} > D5.in
  15. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${D6_trio_raw_vcf} -b ${high_confidence_bed} > D6.in
  16. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${family_raw_vcf} -b ${high_confidence_bed} > family.in
  17. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${D5_trio_raw_vcf} -b ${high_confidence_bed} -v > D5.out
  18. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${D6_trio_raw_vcf} -b ${high_confidence_bed} -v > D6.out
  19. /opt/ccdg/bedtools-2.27.1/bin/bedtools intersect -a ${family_raw_vcf} -b ${high_confidence_bed} -v > family.out
  20. cat D5.header D5.in > ${family_name}.D5.in.txt
  21. cat D6.header D6.in > ${family_name}.D6.in.txt
  22. cat family.header family.in > ${family_name}.family.in.txt
  23. cat D5.header D5.out > ${family_name}.D5.out.txt
  24. cat D6.header D6.out > ${family_name}.D6.out.txt
  25. cat family.header family.out > ${family_name}.family.out.txt
  26. cat ${family_name}.family.in.txt | awk '
  27. BEGIN { OFS = "\t" }
  28. NF > 2 && FNR > 1 {
  29. for ( i=9; i<=NF; i++ ) {
  30. split($i,a,":") ;$i = a[1];
  31. }
  32. }
  33. { print }
  34. ' > ${family_name}.family.in.gt.txt
  35. cat ${family_name}.family.out.txt | awk '
  36. BEGIN { OFS = "\t" }
  37. NF > 2 && FNR > 1 {
  38. for ( i=9; i<=NF; i++ ) {
  39. split($i,a,":") ;$i = a[1];
  40. }
  41. }
  42. { print }
  43. ' > ${family_name}.family.out.gt.txt
  44. >>>
  45. runtime {
  46. docker:docker
  47. cluster: cluster_config
  48. systemDisk: "cloud_ssd 40"
  49. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  50. }
  51. output {
  52. File D5_in = "${family_name}.D5.in.txt"
  53. File D6_in = "${family_name}.D6.in.txt"
  54. File family_in = "${family_name}.family.in.gt.txt"
  55. File D5_out = "${family_name}.D5.out.txt"
  56. File D6_out = "${family_name}.D6.out.txt"
  57. File family_out = "${family_name}.family.out.gt.txt"
  58. }
  59. }