#!/usr/bin/perl -w #get_regions_coverage.pl open OUT, ">cds.covstats.txt" or die $!; print OUT join("\t",'Sample','Chromosome','Position','ExonName', 'MinDepth','MaxDepth','MedianDepth','AvgDepth', 'Fraction100X+','Fraction10X-','BP100X+','BP10X-','TotalBP'),"\n"; my %totalbp; my %numsamp; my @covfiles = @ARGV; my %cov; my %covstats; foreach $cfile (@covfiles) { my %good; my $prefix = (split(/\./,$cfile))[0]; open COV, "<$cfile" or die $!; while (my $line = <COV>) { chomp($line); next if ($line =~ m/^all/); my ($chrom,$pos,$end,$name,$depth,$bp,$total,$percent) = split(/\t/,$line); my $region = join(":",$chrom,$pos,$end); $cov{$region}{$depth} = $percent; $covstats{$region}{sumdepth} += $depth*$bp; $exons{$region} = $name; $totalbp{$region} = $total; if ($depth <= 10) { $poor{$region} += $bp; } if ($depth >= 100) { $good{$region} += $bp; } } close COV; foreach $reg (keys %totalbp) { $good{$reg} = 0 unless $good{$reg}; $poor{$reg} = 0 unless $poor{$reg}; if ($totalbp{$reg} < 1) { next; } my $avgdepth = sprintf("%.0f",$covstats{$reg}{sumdepth}/$totalbp{$reg}); my @depths = sort {$a <=> $b} keys %{$cov{$reg}}; %covhash = %{$cov{$reg}}; my @perc = @covhash{@depths}; my @cum_sum = cumsum(@perc); my $mediandep = 0; foreach my $i (0..$#cum_sum) { if ($cum_sum[$i] < 0.5) { $mediandep = $depths[$i]; } } $good_fract = sprintf("%.4f",$good{$reg}/$totalbp{$reg}); $poor_fract = sprintf("%.4f",$poor{$reg}/$totalbp{$reg}); print OUT join("\t",$prefix,split(/:/,$reg),$exons{$reg},$depths[0],$depths[-1],$mediandep,$avgdepth,$good_fract,$poor_fract,$good{$reg},$poor{$reg},$totalbp{$reg}),"\n"; } } sub cumsum { my @nums = @_; my @cumsum = (); my $mid = 0; for my $i (0..$#nums) { $mid += $nums[$i]; push(@cumsum,$mid); } return @cumsum; }