#!/usr/bin/perl -w 

# Largest relative position (relPos column) that is still collected and plotted.
$posmax = 300;

# Directory that holds one sub-directory of splicing-value files per sample.
$pre = '/disk_aug18_a/jan2019/processed_data100/smit_files';

# Sample sub-directories under $pre, in the order of the report columns.
@dirs = ('hs1A_50', 'hs1B_51', 'hs1C_52', 'hs1D_53');

# Column labels; $info[$i] is printed next to $dirs[$i] in the table header.
@info = ('wt', 'wtpb', 'y2h2', 'y2h2pb');

# Scan every *splicingValues.txt file under each sample directory and collect,
# per (directory, file), the positions and normalised splicing values of all
# rows whose position is <= $posmax.
#
# Reads : $pre, @dirs, $posmax (set earlier in this script).
# Fills : %ghash   - file name (used as the gene key) => number of files seen
#                    with that name across all directories
#         %poshash - {dir}{gene} => "pos,pos,...,"  (trailing comma kept; the
#                    plotting section strips it)
#         %valhash - {dir}{gene} => "val,val,...,"  (every "NA" replaced by 0)
# Writes: "shortlist" - one "dir gene lastpos" line for every file whose last
#         accepted position is below $posmax.
#
# Expected input: tab separated, first line is a header, e.g.
#relPos	readSum	splicingValueRaw	splicingValueNorm
#-100	0	NA	0
#-99	0	NA	0

open(my $shortlist_fh, '>', 'shortlist')
    or die "cannot write shortlist: $!";

foreach my $dir (@dirs) {
    # glob() replaces the former `ls ... > tlist` shell round trip, so no
    # scratch file is needed and a failing `ls` can no longer go unnoticed.
    # NOTE: glob() splits its pattern on whitespace; $pre must not contain
    # spaces.
    foreach my $path (sort glob("$pre/$dir/*splicingValues.txt")) {
        # The gene key is the last path component. For the configured $pre
        # this is the same element the old hard-coded index 6 selected, but
        # it keeps working when $pre has a different depth.
        my $gene = (split m{/}, $path)[-1];

        open(my $in_fh, '<', $path) or die "cannot read $path: $!";
        $ghash{$gene}++;

        my $header = <$in_fh>;    # first line is the column header; discard it

        my $last_pos = 0;         # last position accepted from this file
        while (my $line = <$in_fh>) {
            chomp $line;
            my @fields = split /\t/, $line;

            # Blank or truncated rows would otherwise add empty elements to
            # the lists, which breaks the R code generated from them.
            next if @fields < 4;

            my ($pos, $splnorm) = @fields[0, 3];
            $splnorm =~ s/NA/0/g;

            if ($pos <= $posmax) {
                $last_pos = $pos;
                $poshash{$dir}{$gene} .= "$pos,";
                $valhash{$dir}{$gene} .= "$splnorm,";
            }
        }
        close($in_fh);

        # Record files whose data stop before $posmax.
        if ($last_pos < $posmax) {
            print {$shortlist_fh} "$dir $gene $last_pos\n";
        }
    }
}

close($shortlist_fh) or die "cannot close shortlist: $!";

#system("rm pngs/*");

# Write lowess.html (one table row per gene, one column per sample directory)
# and, for every (directory, gene) pair that has data, generate tmp.R and run
# R to draw pngs/<dir>.<gene>.png: a scatter plot of value vs. position with a
# red LOWESS curve (f = 1/2).
#
# Reads: @dirs, @info, %ghash, %poshash, %valhash (filled earlier in this
#        script; the list strings may carry a trailing comma).

# R's png() needs the target directory to exist.
unless (-d 'pngs') {
    mkdir('pngs') or die "cannot create directory pngs: $!";
}

open(my $html_fh, '>', 'lowess.html')
    or die "cannot write lowess.html: $!";

print {$html_fh} "<pre>\n";
print {$html_fh} "<table border=1>
<tr><td>gene ";

# One header cell per sample directory (previously hard-coded to 4 columns).
foreach my $col (0 .. $#dirs) {
    my $label = defined $info[$col] ? $info[$col] : '';
    print {$html_fh} "<td>$dirs[$col] $label";
}
print {$html_fh} "\n";

foreach my $gene (sort keys %ghash) {
    print {$html_fh} "<tr><td>$gene";

    foreach my $dir (@dirs) {
        # Work on copies so the stored strings are not modified.
        my $xs = $poshash{$dir}{$gene};
        my $ys = $valhash{$dir}{$gene};

        # A gene may be absent from some directories; plotting empty vectors
        # would fail in R and leave a broken image link.
        unless (defined $xs && defined $ys && length $xs) {
            print {$html_fh} "<td>no data";
            next;
        }

        $xs =~ s/,$//;
        $ys =~ s/,$//;

        print {$html_fh} "<td><img height=240 src=\"pngs/$dir.$gene.png\">";

        open(my $r_fh, '>', 'tmp.R') or die "cannot write tmp.R: $!";
        print {$r_fh} "
df <- data.frame(x=c($xs) , y=c($ys) )

png(\"pngs/$dir.$gene.png\")
plot(df\$x, df\$y)
lines(lowess(df\$x, df\$y ,f=1/2 ), col='red')
invisible(dev.off())

";
        # Close explicitly so the script is completely on disk before R
        # reads it, instead of relying on an implicit flush before fork.
        close($r_fh) or die "cannot close tmp.R: $!";

        system("R --vanilla < tmp.R") == 0
            or warn "R failed for $dir $gene (status $?)\n";
    }
    print {$html_fh} "\n";
}

# Terminate the markup that was opened above.
print {$html_fh} "</table>\n</pre>\n";
close($html_fh) or die "cannot close lowess.html: $!";


