使用fastp对fastq文件进行质控, 使用fastqscreen对污染源进行检测
Nelze vybrat více než 25 témat Téma musí začínat písmenem nebo číslem, může obsahovat pomlčky („-“) a může být dlouhé až 35 znaků.

71 lines
1.6KB

  1. task fastp {
  2. input {
  3. # I/O options
  4. File in1
  5. File in2
  6. String sample_id
  7. Boolean? phred64 = false
  8. Boolean? fix_mgi_id = false
  9. String? adapter_sequence
  10. String? adapter_sequence_r2
  11. Int? reads_to_process # specify how many reads/pairs to be processed. Default 0 means process all reads.
  12. # reporting options
  13. String json = sample_id+"fastp.json"
  14. String html = sample_id+"fastp.html"
  15. String report_title = "\'fastp report\'"
  16. # excute env
  17. String docker
  18. String cluster_config
  19. String disk_size
  20. }
  21. String out1_name = sample_id+'clean_1.fastq'
  22. String out2_name = sample_id+'clean_2.fastq'
  23. command <<<
  24. # basic command
  25. /opt/conda/bin/fastp \
  26. --in1 ${in1} \
  27. --in2 ${in2} \
  28. --out1 ${out1_name} \
  29. --out2 ${out2_name} \
  30. --json ${json} \
  31. --html ${html} \
  32. --report_title ${report_title} \
  33. # options
  34. ${ true="--phred64 " false="" phred64 } \
  35. ${ "--reads_to_process " + reads_to_process } \
  36. ${ true="--fix_mgi_id " false="" fix_mgi_id } \
  37. ${ "--adapter_sequence " + adapter_sequence } \
  38. ${ "--adapter_sequence_r2 " + adapter_sequence_r2 }
  39. >>>
  40. runtime {
  41. docker:docker
  42. cluster:cluster_config
  43. systemDisk:"cloud_ssd 40"
  44. dataDisk:"cloud_ssd " + disk_size + " /cromwell_root/"
  45. }
  46. output {
  47. File out1 = out1_name
  48. File out2 = out2_name
  49. File json_report = json
  50. File html_report = html
  51. }
  52. }