Automated integrated analysis software for genomics data of the cancer patients.
Du kan inte välja fler än 25 ämnen Ämnen måste starta med en bokstav eller siffra, kan innehålla bindestreck ('-') och vara max 35 tecken långa.

mapping.wdl 1.5KB

2 år sedan
2 år sedan
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152
  1. task mapping {
  2. File ref_dir
  3. String fasta
  4. File fastq_1
  5. File fastq_2
  6. String SENTIEON_LICENSE
  7. String group
  8. String sample
  9. String platform
  10. String? duplex_umi
  11. String? read_structure
  12. String docker
  13. String cluster_config
  14. String disk_size
  15. command <<<
  16. set -o pipefail
  17. set -e
  18. export SENTIEON_LICENSE=${SENTIEON_LICENSE}
  19. nt=$(nproc)
  20. if [ ${read_structure} ]; then
  21. if [ ${duplex_umi} == "true" ]; then
  22. READ_STRUCTURE="-d ${read_structure}"
  23. fi
  24. sentieon umi extract $READ_STRUCTURE ${fastq_1} ${fastq_2} | \
  25. sentieon bwa mem -p -C -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" -t $nt -K 10000000 ${ref_dir}/${fasta} - | \
  26. sentieon umi consensus -o ${sample}.umi_consensus.fastq.gz
  27. sentieon bwa mem -p -C -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" -t $nt -K 10000000 $fasta ${sample}.umi_consensus.fastq.gz | \
  28. sentieon util sort --umi_post_process --sam2bam -i - -o ${sample}.sorted.bam
  29. else
  30. sentieon bwa mem -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" \
  31. -t $nt -K 10000000 ${ref_dir}/${fasta} ${fastq_1} ${fastq_2} | \
  32. sentieon util sort -o ${sample}.sorted.bam -t $nt --sam2bam -i -
  33. fi
  34. >>>
  35. runtime {
  36. docker: docker
  37. cluster: cluster_config
  38. systemDisk: "cloud_ssd 40"
  39. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  40. }
  41. output {
  42. File sorted_bam = "${sample}.sorted.bam"
  43. File sorted_bam_index = "${sample}.sorted.bam.bai"
  44. }
  45. }