You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

67 lines
2.0KB

  1. task arriba{
  2. String sample_id
  3. File fastq1
  4. File fastq2
  5. File STAR_INDEX_DIR
  6. File ASSEMBLY_FA
  7. File ANNOTATION_GTF
  8. String disk_size
  9. String docker
  10. String cluster
  11. command <<<
  12. set -o pipefail
  13. set -e
  14. mkdir ./output/
  15. STAR \
  16. --runThreadN 4 \
  17. --genomeDir ${STAR_INDEX_DIR} \
  18. --genomeLoad NoSharedMemory \
  19. --readFilesIn ${fastq1} ${fastq2} \
  20. --readFilesCommand zcat \
  21. --outSAMtype BAM Unsorted \
  22. --outSAMunmapped Within \
  23. --outBAMcompression 0 \
  24. --outFilterMultimapNmax 50 \
  25. --peOverlapNbasesMin 10 \
  26. --alignSplicedMateMapLminOverLmate 0.5 \
  27. --alignSJstitchMismatchNmax 5 -1 5 5 \
  28. --chimSegmentMin 10 \
  29. --chimOutType WithinBAM HardClip \
  30. --chimJunctionOverhangMin 10 \
  31. --chimScoreDropMax 30 \
  32. --chimScoreJunctionNonGTAG 0 \
  33. --chimScoreSeparation 1 \
  34. --chimSegmentReadGapMax 3 \
  35. --chimMultimapNmax 50 |tee ./output/${sample_id}.Aligned.out.bam |/arriba_v2.1.0/arriba \
  36. -x /dev/stdin \
  37. -o ./output/${sample_id}_fusions.tsv -O ./output/${sample_id}_fusions.discarded.tsv \
  38. -a ${ASSEMBLY_FA} \
  39. -g ${ANNOTATION_GTF} \
  40. -b /arriba_v2.1.0/database/blacklist_hg38_GRCh38_v2.1.0.tsv.gz \
  41. -k /arriba_v2.1.0/database/known_fusions_hg38_GRCh38_v2.1.0.tsv.gz \
  42. -t /arriba_v2.1.0/database/known_fusions_hg38_GRCh38_v2.1.0.tsv.gz \
  43. -p /arriba_v2.1.0/database/protein_domains_hg38_GRCh38_v2.1.0.gff3
  44. >>>
  45. runtime {
  46. docker: docker
  47. cluster: cluster
  48. systemDisk: "cloud_ssd 40"
  49. dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
  50. }
  51. output {
  52. Array[File] arriba_result=glob("./output/*.tsv")
  53. Array[File] arriba_bam=glob("./output/*.bam")
  54. }
  55. }