Solution
process '6A_post_process_vcf' { tag "$sampleId" publishDir "$params.results/$sampleId" input: set sampleId, file('final.vcf') from vcf_files set file('filtered.recode.vcf.gz'), file('filtered.recode.vcf.gz.tbi') from prepared_vcf_ch output: set sampleId, file('final.vcf'), file('commonSNPs.diff.sites_in_files') into vcf_and_snps_ch script: ''' grep -v '#' final.vcf | awk '$7~/PASS/' |perl -ne 'chomp($_); ($dp)=$_=~/DP\\=(\\d+)\\;/; if($dp>=8){print $_."\\n"};' > result.DP8.vcf vcftools --vcf result.DP8.vcf --gzdiff filtered.recode.vcf.gz --diff-site --out commonSNPs ''' } process '6B_prepare_vcf_for_ase' { tag "$sampleId" publishDir "$params.results/$sampleId" input: set sampleId, file('final.vcf'), file('commonSNPs.diff.sites_in_files') from vcf_and_snps_ch output: set sampleId, file('known_snps.vcf') into vcf_for_ASE file('AF.histogram.pdf') into gghist_pdfs script: ''' awk 'BEGIN{OFS="\t"} $4~/B/{print $1,$2,$3}' commonSNPs.diff.sites_in_files > test.bed vcftools --vcf final.vcf --bed test.bed --recode --keep-INFO-all --stdout > known_snps.vcf grep -v '#' known_snps.vcf | awk -F '\\t' '{print $10}' \ |awk -F ':' '{print $2}'|perl -ne 'chomp($_); \ @v=split(/\\,/,$_); if($v[0]!=0 ||$v[1] !=0)\ {print $v[1]/($v[1]+$v[0])."\\n"; }' |awk '$1!=1' \ >AF.4R gghist.R -i AF.4R -o AF.histogram.pdf ''' }