#!/usr/bin/perl -w
#get_regions_coverage.pl

use strict;
use warnings;

# Summarise per-region coverage histograms into one tab-delimited table,
# cds.covstats.txt, written to the current directory.
#
# Usage: get_regions_coverage.pl SAMPLE1.hist.txt [SAMPLE2.hist.txt ...]
#
# Every input line is split on tabs into eight fields:
#   chrom, start, end, name, depth, bp-at-depth, region-size, fraction-at-depth
# Lines starting with "all" are ignored.
# NOTE(review): this layout looks like per-region `bedtools coverage -hist`
# output -- confirm against whatever produces the input files.
#
# One output row is written per sample and region, with the minimum, maximum,
# median and average depth plus the number and fraction of bases at depth
# >= 100 and at depth <= 10.

my $outfile = 'cds.covstats.txt';
open(my $out, '>', $outfile) or die "Cannot open $outfile for writing: $!";
print {$out} join("\t",
  'Sample', 'Chromosome', 'Position', 'ExonName',
  'MinDepth', 'MaxDepth', 'MedianDepth', 'AvgDepth',
  'Fraction100X+', 'Fraction10X-', 'BP100X+', 'BP10X-', 'TotalBP'), "\n";

foreach my $cfile (@ARGV) {
  # The sample label is whatever precedes the first '.' in the path as given.
  my $prefix = (split(/\./, $cfile))[0];

  # Every accumulator is scoped to a single input file so that one sample's
  # numbers can never leak into the rows reported for the next sample.
  my %cov;       # region -> { depth => fraction of region at that depth }
  my %sumdepth;  # region -> sum of depth * bp over all histogram bins
  my %exons;     # region -> name column
  my %totalbp;   # region -> region size in bp
  my %coords;    # region -> [chrom, start, end], kept to avoid re-splitting
  my %good;      # region -> bp at depth >= 100
  my %poor;      # region -> bp at depth <= 10
  my @regions;   # regions in first-seen order, for deterministic output

  open(my $covfh, '<', $cfile) or die "Cannot open $cfile for reading: $!";
  while (my $line = <$covfh>) {
    chomp($line);
    next if ($line =~ m/^all/);
    my ($chrom, $pos, $end, $name, $depth, $bp, $total, $percent) = split(/\t/, $line);
    # Blank or truncated lines cannot contribute a histogram bin.
    next unless defined $percent;

    my $region = join(":", $chrom, $pos, $end);
    unless (exists $totalbp{$region}) {
      push(@regions, $region);
      $coords{$region} = [$chrom, $pos, $end];
    }
    $cov{$region}{$depth} = $percent;
    $sumdepth{$region} += $depth * $bp;
    $exons{$region} = $name;
    $totalbp{$region} = $total;
    $poor{$region} += $bp if ($depth <= 10);
    $good{$region} += $bp if ($depth >= 100);
  }
  close($covfh);

  foreach my $reg (@regions) {
    # Zero-length regions would divide by zero below.
    next if ($totalbp{$reg} < 1);
    $good{$reg} ||= 0;
    $poor{$reg} ||= 0;

    my $avgdepth = sprintf("%.0f", $sumdepth{$reg} / $totalbp{$reg});

    # Depths in ascending order with the matching cumulative fractions.
    my @depths = sort { $a <=> $b } keys %{ $cov{$reg} };
    my @cum_sum = cumsum(@{ $cov{$reg} }{@depths});

    # Median = smallest depth at which at least half of the region is
    # covered.  Falls back to the maximum depth if the fractions never sum
    # to 0.5 (e.g. because of rounding in the input).
    my $mediandep = $depths[-1];
    foreach my $i (0 .. $#cum_sum) {
      if ($cum_sum[$i] >= 0.5) {
        $mediandep = $depths[$i];
        last;
      }
    }

    my $good_fract = sprintf("%.4f", $good{$reg} / $totalbp{$reg});
    my $poor_fract = sprintf("%.4f", $poor{$reg} / $totalbp{$reg});
    print {$out} join("\t",
      $prefix, @{ $coords{$reg} }, $exons{$reg},
      $depths[0], $depths[-1], $mediandep, $avgdepth,
      $good_fract, $poor_fract, $good{$reg}, $poor{$reg}, $totalbp{$reg}), "\n";
  }
}

# Buffered write errors only surface when the handle is closed.
close($out) or die "Error closing $outfile: $!";

# cumsum(LIST)
#
# Returns the running totals of LIST: element i of the result is the sum of
# the first i+1 arguments.  An empty argument list yields an empty list.
# The arguments themselves are not modified.
sub cumsum {
  my $running = 0;
  # map hands back a copy of the running total after each addition.
  return map { $running += $_ } @_;
}