Automated integrated analysis software for genomics data of the cancer patients.
Vous ne pouvez pas sélectionner plus de 25 sujets Les noms de sujets doivent commencer par une lettre ou un nombre, peuvent contenir des tirets ('-') et peuvent comporter jusqu'à 35 caractères.

53 lignes
1.5KB

  1. task mapping {
  2. File ref_dir
  3. String fasta
  4. File fastq_1
  5. File fastq_2
  6. String SENTIEON_LICENSE
  7. String group
  8. String sample
  9. String platform
  10. String? duplex_umi
  11. String? read_structure
  12. String docker
  13. String cluster_config
  14. String disk_size
  15. command <<<
  16. set -o pipefail
  17. set -e
  18. export SENTIEON_LICENSE=${SENTIEON_LICENSE}
  19. nt=$(nproc)
  20. if [ ${read_structure} ]; then
  21. if [ ${duplex_umi} == "true" ]; then
  22. READ_STRUCTURE="-d ${read_structure}"
  23. fi
  24. sentieon umi extract $READ_STRUCTURE ${fastq_1} ${fastq_2} | \
  25. sentieon bwa mem -p -C -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" -t $nt -K 10000000 ${ref_dir}/${fasta} - | \
  26. sentieon umi consensus -o ${sample}.umi_consensus.fastq.gz
  27. sentieon bwa mem -p -C -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" -t $nt -K 10000000 $fasta ${sample}.umi_consensus.fastq.gz | \
  28. sentieon util sort --umi_post_process --sam2bam -i - -o ${sample}.sorted.bam
  29. else
  30. sentieon bwa mem -R "@RG\tID:${group}\tSM:${sample}\tPL:${platform}" \
  31. -t $nt -K 10000000 ${ref_dir}/${fasta} ${fastq_1} ${fastq_2} | \
  32. sentieon util sort -o ${sample}.sorted.bam -t $nt --sam2bam -i -
  33. fi
  34. >>>
  35. runtime {
  36. docker: docker
  37. cluster: cluster_config
  38. systemDisk: "cloud_ssd 40"
  39. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  40. }
  41. output {
  42. File sorted_bam = "${sample}.sorted.bam"
  43. File sorted_bam_index = "${sample}.sorted.bam.bai"
  44. }
  45. }