You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

67 satır
1.8KB

  # Task: arriba
  #
  # Aligns one paired-end sample with STAR and pipes the unsorted BAM stream
  # directly into Arriba for gene-fusion detection. A copy of the alignment
  # stream is saved with `tee`, so the task yields both the fusion tables and
  # the BAM file.
  #
  # Inputs:
  #   sample_id       - prefix used for every file written to ./output/
  #   fastq1, fastq2  - mate 1 / mate 2 FASTQ files; they are read through
  #                     `zcat`, so they must be gzip-compressed
  #   STAR_INDEX_DIR  - STAR genome index, passed to --genomeDir
  #   ASSEMBLY_FA     - genome assembly FASTA, passed to arriba -a
  #   ANNOTATION_GTF  - gene annotation GTF, passed to arriba -g
  #   docker          - container image; the command expects Arriba under
  #                     /arriba_v2.1.0/ inside that image
  #   cluster         - forwarded unchanged to the `cluster` runtime attribute
  #   disk_size       - size inserted into the `dataDisk` runtime attribute
  #
  # Outputs:
  #   arriba_result   - every ./output/*.tsv (fusions and discarded fusions)
  #   arriba_bam      - every ./output/*.bam (the tee'd STAR alignment)
  task arriba {
    String sample_id
    File fastq1
    File fastq2
    File STAR_INDEX_DIR
    File ASSEMBLY_FA
    File ANNOTATION_GTF
    String docker
    String cluster
    String disk_size

    command <<<
      # Abort on the first failing command, including a failure in any stage
      # of the STAR | tee | arriba pipeline.
      set -eo pipefail

      # -p: do not fail if the directory is already there (e.g. on a retry).
      mkdir -p ./output/

      # STAR writes an uncompressed, unsorted BAM to stdout (--outStd
      # BAM_Unsorted, --outBAMcompression 0); tee keeps a copy on disk while
      # arriba consumes the same stream from /dev/stdin.
      # All interpolated values are double-quoted so paths or sample ids that
      # contain whitespace are not split by the shell.
      STAR \
        --runThreadN 4 \
        --genomeDir "${STAR_INDEX_DIR}" \
        --genomeLoad NoSharedMemory \
        --readFilesIn "${fastq1}" "${fastq2}" \
        --readFilesCommand zcat \
        --outStd BAM_Unsorted \
        --outSAMtype BAM Unsorted \
        --outSAMunmapped Within \
        --outBAMcompression 0 \
        --outFilterMultimapNmax 50 \
        --peOverlapNbasesMin 10 \
        --alignSplicedMateMapLminOverLmate 0.5 \
        --alignSJstitchMismatchNmax 5 -1 5 5 \
        --chimSegmentMin 10 \
        --chimOutType WithinBAM HardClip \
        --chimJunctionOverhangMin 10 \
        --chimScoreDropMax 30 \
        --chimScoreJunctionNonGTAG 0 \
        --chimScoreSeparation 1 \
        --chimSegmentReadGapMax 3 \
        --chimMultimapNmax 50 \
      | tee "./output/${sample_id}.Aligned.out.bam" \
      | /arriba_v2.1.0/arriba \
        -x /dev/stdin \
        -o "./output/${sample_id}_fusions.tsv" \
        -O "./output/${sample_id}_fusions.discarded.tsv" \
        -a "${ASSEMBLY_FA}" \
        -g "${ANNOTATION_GTF}" \
        -b /arriba_v2.1.0/database/blacklist_hg38_GRCh38_v2.1.0.tsv.gz \
        -k /arriba_v2.1.0/database/known_fusions_hg38_GRCh38_v2.1.0.tsv.gz \
        -t /arriba_v2.1.0/database/known_fusions_hg38_GRCh38_v2.1.0.tsv.gz \
        -p /arriba_v2.1.0/database/protein_domains_hg38_GRCh38_v2.1.0.gff3
    >>>

    runtime {
      docker: docker
      # NOTE(review): cluster / systemDisk / dataDisk are backend-specific
      # attributes; their exact semantics are not visible here - confirm
      # against the execution backend's documentation.
      cluster: cluster
      systemDisk: "cloud_ssd 40"
      dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
      Array[File] arriba_result = glob("./output/*.tsv")
      Array[File] arriba_bam = glob("./output/*.bam")
    }
  }