Infer and visualize copy number from high-throughput DNA sequencing data.
Вы не можете выбрать более 25 тем Темы должны начинаться с буквы или цифры, могут содержать дефисы(-) и должны содержать не более 35 символов.

53 lines
1.6KB

  1. task batch {
  2. String sample_id
  3. Array[File] tumor_bam
  4. Array[File] tumor_bai
  5. Array[File] normal_bam
  6. Array[File] normal_bai
  7. File bed
  8. File faidx
  9. File fasta
  10. File? ref_flat
  11. File access_bed
  12. File? reference
  13. String method
  14. String docker
  15. String cluster_config
  16. String disk_size
  17. String annotate_opt = if (ref_flat != "") then "--annotate ${ref_flat}" else ""
  18. String reference_opt = if (reference != "") then "--reference ${reference}" else ""
  19. String access_opt = if (method == "amplicon") then "--access ${bed}" else "--access ${access_bed}"
  20. command <<<
  21. set -o pipefail
  22. set -e
  23. mkdir -p /cromwell_root/tmp/cnvkit
  24. cp ${sep=' ' normal_bai} /cromwell_root/tmp/cnvkit
  25. cp ${sep=' ' tumor_bai} /cromwell_root/tmp/cnvkit
  26. cp ${fasta} /cromwell_root/tmp/cnvkit/hg38.fa
  27. cp ${faidx} /cromwell_root/tmp/cnvkit/hg38.fai
  28. cd /cromwell_root/tmp/cnvkit
  29. mkdir results
  30. cnvkit.py batch ${sep=' ' tumor_bam} --normal ${sep=' ' normal_bam} \
  31. --method ${method} \
  32. --targets ${bed} ${annotate_opt} \
  33. --fasta hg38.fa ${access_opt} ${reference_opt} \
  34. --output-reference ~/${sample_id}.reference.cnn \
  35. --output-dir ./results/ \
  36. --drop-low-coverage --diagram --scatter
  37. >>>
  38. runtime {
  39. docker: docker
  40. cluster: cluster_config
  41. systemDisk: "cloud_ssd 40"
  42. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  43. }
  44. output {
  45. File reference_cnn = "${sample_id}.reference.cnn"
  46. Array[File] results = glob("/cromwell_root/tmp/cnvkit/results/*")
  47. }
  48. }