stead99 преди 5 години
ревизия
bd4ac47198
променени са 8 файла, в които са добавени 151 реда и са изтрити 0 реда
  1. Двоични данни
      data/BL10-200-2_S5.sorted.bam
  2. Двоични данни
      data/BL10-200-2_S5.sorted.bam.bai
  3. +12
    -0
      inputs
  4. +23
    -0
      readme.md
  5. +26
    -0
      tasks/arcashla.wdl
  6. +27
    -0
      tasks/hisat2.wdl
  7. +34
    -0
      tasks/samtools.wdl
  8. +29
    -0
      workflow.wdl

Двоични данни
data/BL10-200-2_S5.sorted.bam Целия файл


Двоични данни
data/BL10-200-2_S5.sorted.bam.bai Целия файл


+ 12
- 0
inputs Целия файл

@@ -0,0 +1,12 @@
{
"{{ project_name }}.read1": "{{ read1 }}",
"{{ project_name }}.read2": "{{ read2 }}",
"{{ project_name }}.idx": "oss://pgx-reference-data/reference/hisat2/grch38_snp_tran/",
"{{ project_name }}.idx_prefix": "genome_snp_tran",
"{{ project_name }}.hisat2.docker": "registry.cn-shanghai.aliyuncs.com/pgx-docker-registry/hisat2:v2.0.5-1-deb-cv1",
"{{ project_name }}.hisat2.cluster": "OnDemand bcs.a2.3xlarge img-ubuntu-vpc",
"{{ project_name }}.samtools.docker": "registry.cn-shanghai.aliyuncs.com/pgx-docker-registry/samtools:v1.3.1",
"{{ project_name }}.samtools.cluster": "OnDemand bcs.a2.large img-ubuntu-vpc"
"{{ project_name }}.arcashla.docker": registry.cn-shanghai.aliyuncs.com/pgx-docker-registry/tengfei/arcashla:latest
"{{ project_name }}.arcashla.cluster": "OnDemand bcs.a2.large img-ubuntu-vpc"
}

+ 23
- 0
readme.md Целия файл

@@ -0,0 +1,23 @@
> Author: Jun Shang
>
> Email: shangjunv@163.com
>
> Last Updates: 25/02/2020

#### Requirements

- choppy
- Ali-Cloud

```
$ source activate choppy/open-choppy-env
$ choppy install junshang/rna-seq-pair-end-viral
$ choppy apps
```

#### quick start

```
$ choppy samples junshang/rna-seq-pair-end-viral-latest > samples.csv
$ choppy batch junshang/rna-seq-pair-end-viral-latest samples.csv -p Your_project_name
```

+ 26
- 0
tasks/arcashla.wdl Целия файл

@@ -0,0 +1,26 @@
task samtools {
String base = basename(bam, ".sorted.bam")
String docker
String cluster

command <<<
mkdir hla_type
./arcasHLA extract ${sorted_bam} -o ${base}.extracted.fq.gz --paired -t 8 -v
./arcasHLA genotype ${bam}.extracted.1.fq.gz ${bam}.extracted.2.fq.gz hla_type/${base}.genotype.json
>>>

runtime {
docker: docker
cluster: cluster
systemDisk: "cloud_ssd 40"
dataDisk: "cloud_ssd 200 /cromwell_root/"
}

output {
File extracted_1p = base + "extracted.1.fq.gz"
File extracted_2p = base + "extracted.2.fq.gz"
Array[File] hla_type = ["hla_type/${base}.genotype.json", "hla_type/${base}.genes.json", "hla_type/${base}.extract.log", "hla_type/${base}.genotype.log"]
}

}


+ 27
- 0
tasks/hisat2.wdl Целия файл

@@ -0,0 +1,27 @@
task hisat2 {
File idx
File read_1P
File read_2P
String idx_prefix
String base = sub(basename(read_1P),"\\.\\S+$", "")
String docker
String cluster

command {
nt=$(nproc)
hisat2 -t -p $nt -x ${idx}/${idx_prefix} -1 ${read_1P} -2 ${read_2P} -S ${base}.sam --un-conc-gz ${base}_un.fq.gz
}
runtime {
docker: docker
cluster: cluster
systemDisk: "cloud_ssd 40"
dataDisk: "cloud_ssd 200 /cromwell_root/"
}

output {
File sam = base + ".sam"
File unmapread_1p = base + "_un.fq.1.gz"
File unmapread_2p = base + "_un.fq.2.gz"
}
}

+ 34
- 0
tasks/samtools.wdl Целия файл

@@ -0,0 +1,34 @@
task samtools {
File sam
String base = basename(sam, ".sam")
String bam = base + ".bam"
String sorted_bam = base + ".sorted.bam"
String sorted_bam_index = base + ".sorted.bam.bai"
String viral_samstats = base + ".viral.samstats"
String docker
String cluster

command <<<
set -o pipefail
set -e
/opt/conda/bin/samtools view -bS ${sam} > ${bam}
/opt/conda/bin/samtools sort -m 1000000000 ${bam} -o ${sorted_bam}
/opt/conda/bin/samtools index ${sorted_bam}
/opt/conda/bin/samtools stats ${sorted_bam} > ${viral_samstats}
>>>

runtime {
docker: docker
cluster: cluster
systemDisk: "cloud_ssd 40"
dataDisk: "cloud_ssd 200 /cromwell_root/"
}

output {
File out_bam = sorted_bam
File out_bam_index = sorted_bam_index
File out_viral_samstats = viral_samstats
}

}


+ 29
- 0
workflow.wdl Целия файл

@@ -0,0 +1,29 @@
import "./tasks/hisat2.wdl" as hisat2
import "./tasks/samtools.wdl" as samtools
import "./tasks/stringtie.wdl" as stringtie

workflow {{ project_name }} {

File read1
File read2
File idx
String idx_prefix
File gtf
call hisat2.hisat2 as hisat2 {
input: idx=idx, idx_prefix=idx_prefix, read_1P=read1, read_2P=read2
}

call samtools.samtools as samtools {
input: sam = hisat2.sam
}

call stringtie.stringtie as stringtie {
input: gtf = gtf, bam = samtools.out_bam
}
}



Loading…
Отказ
Запис