# Task: benchmark
#
# Runs hap.py to compare a query VCF against the truth VCF and confident-region
# BED of one of the supported samples (LCL5, LCL6, LCL7, LCL8).
#
# Inputs:
#   vcf              - query VCF passed to hap.py as the query call set.
#   vcf_index        - index of the query VCF (declared so it is localized
#                      alongside `vcf`; not referenced directly by the command).
#   benchmarking_dir - directory holding <sample_mark>.vcf.gz and
#                      <sample_mark>.bed.gz truth files.
#   ref_dir          - directory containing the reference FASTA.
#   fasta            - file name of the reference FASTA inside `ref_dir`.
#   sample_mark      - which truth set to use; must be LCL5, LCL6, LCL7 or LCL8.
#   sample           - output prefix; defaults to the VCF basename without ".vcf".
#   docker, cluster_config, disk_size - runtime settings.
#
# Outputs: the files hap.py writes under the `sample` prefix.
#
# Failure: an unsupported `sample_mark` makes the command exit non-zero
# with the message "only for quartet samples" on stderr.
task benchmark {
	File vcf
	File vcf_index
	File benchmarking_dir
	File ref_dir
	String sample = basename(vcf,".vcf")
	String sample_mark
	String fasta
	String docker
	String cluster_config
	String disk_size

	command <<<
		set -o pipefail
		set -e
		nt=$(nproc)

		# Reject unsupported samples up front. Exiting non-zero makes the task
		# fail here instead of later with a missing-output error.
		case "${sample_mark}" in
			LCL5|LCL6|LCL7|LCL8)
				;;
			*)
				echo "only for quartet samples" >&2
				exit 1
				;;
		esac

		mkdir -p /cromwell_root/tmp
		cp -r "${ref_dir}" /cromwell_root/tmp/

		# NOTE(review): HGREF hard-codes the directory and FASTA name, while the
		# hap.py call below passes -r built from ref_dir and fasta. Confirm the
		# two are meant to point at the same reference.
		export HGREF=/cromwell_root/tmp/reference_data/GRCh38.d1.vd1.fa

		# Truth VCF and BED are selected by sample_mark; every supported sample
		# uses the same invocation otherwise.
		/opt/hap.py/bin/hap.py \
			"${benchmarking_dir}/${sample_mark}.vcf.gz" \
			"${vcf}" \
			-f "${benchmarking_dir}/${sample_mark}.bed.gz" \
			--threads $nt \
			-o "${sample}" \
			-r "${ref_dir}/${fasta}"
	>>>

	runtime {
		docker:docker
		cluster:cluster_config
		systemDisk:"cloud_ssd 40"
		dataDisk:"cloud_ssd " + disk_size + " /cromwell_root/"
	}

	output {
		File gzip_vcf = "${sample}.vcf.gz"
		File gzip_vcf_index = "${sample}.vcf.gz.tbi"
		File roc_all_csv = "${sample}.roc.all.csv.gz"
		File roc_indel = "${sample}.roc.Locations.INDEL.csv.gz"
		File roc_indel_pass = "${sample}.roc.Locations.INDEL.PASS.csv.gz"
		File roc_snp = "${sample}.roc.Locations.SNP.csv.gz"
		File roc_snp_pass = "${sample}.roc.Locations.SNP.PASS.csv.gz"
		File summary = "${sample}.summary.csv"
		File extended = "${sample}.extended.csv"
		File metrics = "${sample}.metrics.json.gz"
	}
}