# Split a merged multi-sample gVCF into one single-sample VCF per sample column.
#
# Inputs:
#   merged_gvcf     merged gVCF, read as plain text (grep/cut), so it must be
#                   uncompressed
#   project         prefix of the intermediate <project>.filtered.g.vcf file
#   docker          container image used to run the command
#   cluster_config  value passed to the "cluster" runtime attribute
#   disk_size       size inserted into the "dataDisk" runtime attribute
#
# Outputs:
#   splited_vcf     every <sample>.splited.vcf written to the working directory
#   sister_tag      file named "sister_tag" in the working directory
#   quartet_tag     file named "quartet_tag" in the working directory
#                   NOTE(review): both tag files are presumably written by
#                   /opt/how_many_samples.py -- confirm against that script.
task split_gvcf_files {
	File merged_gvcf
	String project
	String docker
	String cluster_config
	String disk_size
	
	command <<<
		# Abort on the first failing step; otherwise an earlier failure is
		# masked by the exit status of the final python call.
		set -e

		# Column names of the #CHROM line, one per line. The pattern is
		# anchored so only the real column-header line can match.
		grep '^#CHROM' "${merged_gvcf}" | sed 's/\t/\n/g' > name

		ncol=$(wc -l < name)
		if [ "$ncol" -lt 10 ]; then
			echo "split_gvcf_files: no sample columns found in the #CHROM line" >&2
			exit 1
		fi

		# Drop the 9 fixed VCF columns so that only sample names remain.
		sed -i '1,9d' name

		# Header = lines starting with '#', body = everything else. Anchoring
		# keeps records that merely contain a '#' in some field inside the body.
		grep '^#' "${merged_gvcf}" > header
		# grep exits with 1 when it selects no lines; tolerate that (empty
		# result) but still fail on real errors (status 2 and above).
		grep -v '^#' "${merged_gvcf}" > body || [ $? -eq 1 ]

		# Keep only records on chr1-chr22 and chrX. -w makes chr1 match as a
		# whole word, so it does not also select chr10, chr11, ...
		grep -w '^chr1\|^chr2\|^chr3\|^chr4\|^chr5\|^chr6\|^chr7\|^chr8\|^chr9\|^chr10\|^chr11\|^chr12\|^chr13\|^chr14\|^chr15\|^chr16\|^chr17\|^chr18\|^chr19\|^chr20\|^chr21\|^chr22\|^chrX' body > body.filtered || [ $? -eq 1 ]
		cat header body.filtered > "${project}.filtered.g.vcf"

		# One file per sample column: the 9 fixed columns plus column i.
		for i in $(seq 10 $ncol)
		do
			cut -f1-9,$i "${project}.filtered.g.vcf" > "$i.splited.vcf"
		done

		# Pair each numbered file (numeric order = column order) with the
		# sample name found in the same position of the #CHROM line.
		ls *splited.vcf | sort -n | paste - name > rename

		while read -r numbered_vcf sample_name
		do
			mv "$numbered_vcf" "$sample_name.splited.vcf"
			# Fields 6 and 7 of the underscore-delimited sample name are
			# recorded as the sample and replicate labels.
			sample=$(echo "$sample_name" | cut -f6 -d_)
			rep=$(echo "$sample_name" | cut -f7 -d_)
			echo "$sample" >> quartet_sample
			echo "$rep" >> quartet_rep
		done < rename

		python /opt/how_many_samples.py -sample quartet_sample -rep quartet_rep
	>>>

	runtime {
		docker:docker
		cluster: cluster_config
		systemDisk: "cloud_ssd 40"
		dataDisk: "cloud_ssd " + disk_size + " /cromwell_root/"
	}
	output {
		# Numbered intermediates have been renamed by now, so the glob only
		# sees the per-sample files.
		Array[File] splited_vcf = glob("*.splited.vcf")
		File sister_tag = "sister_tag"
		File quartet_tag = "quartet_tag"
	}
}