# README.md
> Author: Qingwang Chen
>
> Email: [qwch20@fudan.edu.cn](mailto:qwch20@fudan.edu.cn)
>
> Last Updated: 18/08/2021
#### Brief Introduction
A choppy app for RNA-seq data: it takes BAM files as input and produces alternative splicing (AS) information files.
#### Requirements
- choppy
- Ali-Cloud
- Linux

```
# 激活choppy环境
$ source activate choppy (open-choppy-env)
# 第一次安装
$ choppy install chenqingwang/SplAdder-merge
# 非第一次安装
$ choppy install chenqingwang/SplAdder-merge -f
# 查询已安装APP
$ choppy apps
```
#### Quick Start
```
# 准备 samples.csv 文件
$ choppy samples chenqingwang/SplAdder-merge-latest > samples.csv
# 准备无默认参数的samples.csv 文件
$ choppy samples --no-default chenqingwang/SplAdder-merge-latest > samples.csv
# 提交任务
$ choppy batch chenqingwang/SplAdder-merge-latest samples.csv -p Your_project_name -l Your_label
# 查询任务运行状况
$ choppy query -L Your_label | grep "status"
# 查询失败任务
$ choppy search -s Failed -p Your_project_name -u chenqingwang --short-format
# 结果文件地址
oss://choppy-cromwell-result/test-choppy/Your_project_name/
```
{
"reference_gtf_file":"oss://pgx-reference-data/reference/spladder/SplAdder/data/reference/Homo_sapiens.GRCh38.103.gtf",
"spladder_docker":"registry.cn-shanghai.aliyuncs.com/pgx-docker-registry/spladder:v2.4.2",
"spladder_cluster":"OnDemand bcs.a2.large img-ubuntu-vpc",
"disk_size":"200"
}
bam_file,sample_id
oss://pgx-reference-data/reference/spladder/SplAdder/data/bams/test/Quartet_RNA_ILM_NovaSeq_RiboZero_WUX_D5_1_20200901.downsampled.bam,D5_1_Test
{
"{{ project_name }}.sample_id": "{{ sample_id }}",
"{{ project_name }}.bam": {{ bam | tojson }},
"{{ project_name }}.bai": {{ bai | tojson }},
"{{ project_name }}.pickle": {{ pickle | tojson }},
"{{ project_name }}.reference_gtf_file": "{{ reference_gtf_file }}",
"{{ project_name }}.spladder_docker": "{{ spladder_docker }}",
"{{ project_name }}.spladder_cluster": "{{ spladder_cluster }}",
"{{ project_name }}.disk_size": "{{ disk_size }}"
}
# Task spladder
#
# Stages the inputs of one sample and records what was staged:
#   - alignment.txt : the localized BAM paths joined by commas on a single line
#   - pickle.txt    : one line per pickle file, giving the path of the symlink
#                     created for it under <sample_id>/spladder_out/
#   - fileList.txt  : `find . -depth` listing of the task working directory
#
# Inputs:
#   sample_id           name of the per-sample directory that is created
#   bam                 BAM files whose paths go into alignment.txt
#   bai                 declared but not referenced by the command
#                       (presumably the BAM indexes, localized next to the
#                       BAMs -- TODO confirm)
#   pickle              files to symlink into <sample_id>/spladder_out/
#   reference_gtf_file  declared but not referenced by the command
#   docker, cluster     forwarded verbatim to the runtime section
#   disk_size           size inserted into the dataDisk runtime string
#
# NOTE(review): the output named `pickle` shares its name with the `pickle`
# input. It is kept as-is so existing callers keep working; confirm the
# execution engine in use accepts the duplicate name.
task spladder {
    String sample_id
    Array[File] bam
    Array[File] bai
    Array[File] pickle
    File reference_gtf_file
    String docker
    String cluster
    String disk_size

    command <<<
        set -o pipefail
        set -e

        mkdir -p ${sample_id}/spladder_out

        # Join the BAM paths with commas. The previous command ran sed on a
        # literal file called "bam", which does not exist in the working
        # directory, so the task aborted here under `set -e`.
        echo ${sep="," bam} > alignment.txt

        # Create pickle.txt up front so the declared output exists even when
        # the pickle array is empty.
        : > pickle.txt

        for i in ${sep=" " pickle}
        do
            # Link by file name only: "$i" is the full localized path, and using
            # it as the link name would point into directories that do not
            # exist below spladder_out.
            link=${sample_id}/spladder_out/$(basename "$i")
            ln -s "$i" "$link"
            echo "$link"
            echo "$link" >> pickle.txt
        done

        find . -depth > fileList.txt
    >>>

    runtime {
        docker: docker
        cluster: cluster
        systemDisk: "cloud_ssd 40"
        dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
    }

    output {
        File fileList = "fileList.txt"
        File alignment = "alignment.txt"
        File pickle = "pickle.txt"
    }
}
import "./tasks/spladder.wdl" as spladder

# Workflow template. `{{ project_name }}` is a template placeholder that is
# substituted with the project name before the WDL is submitted.
# The workflow runs a single call to the spladder task and forwards every
# workflow input to it.
workflow {{ project_name }} {
    # Sample inputs
    String sample_id
    Array[File] bam
    Array[File] bai
    Array[File] pickle

    # Annotation file
    File reference_gtf_file

    # Execution settings, passed to the task as docker / cluster / disk_size
    String spladder_docker
    String spladder_cluster
    String disk_size

    call spladder.spladder as spladder {
        input:
            sample_id = sample_id,
            bam = bam,
            bai = bai,
            pickle = pickle,
            reference_gtf_file = reference_gtf_file,
            docker = spladder_docker,
            cluster = spladder_cluster,
            disk_size = disk_size
    }
}