#script to get files in suitable format for ROCR (AUC analysis)

use strict;

use warnings;

# Convert every maxscore table found in $indir into a two-column,
# tab-separated file ("score", "case") in $outdir, one output file per input
# file, named ROCR_<model>.txt. The "case" column is 1 for rows labelled
# 'positive' and 0 for rows labelled 'negative'; all other rows are dropped.
my $indir  = "inputdir/";   # inputdir: directory with maxscore files for each TF binding model
my $outdir = "outputdir/";  # directory that receives the ROCR_<model>.txt files

my @in_files = glob $indir . '*.txt';

# Textual case label in the input -> numeric class label in the output.
my %label_for = (
	positive => '1',
	negative => '0',
);

foreach my $file (@in_files) {

	# Model name = file name without the directory prefix and the ".txt"
	# suffix. The match is evaluated in list context so the capture is read
	# directly instead of through $1, which would silently keep a stale (or
	# undefined) value if the match failed.
	my ($model) = $file =~ m{\A\Q$indir\E(.+)\.txt\z}s
		or die "cannot derive model name from '$file'";

	print $model, "\n";

	my $out_path = $outdir . "ROCR_" . $model . ".txt";
	open(my $out, ">", $out_path) or die "cannot write '$out_path': $!";
	print {$out} 'score', "\t", 'case', "\n";

	open(my $in, "<", $file) or die "cannot read '$file': $!";
	while (my $line = <$in>) {
		chomp $line;
		$line =~ s/\W+$//;   # drop trailing non-word characters (CR, blanks, quotes, ...)
		$line =~ s/"//g;     # strip double quotes around fields
		$line =~ s/'//g;     # strip single quotes around fields

		# Column order: tf  matrix  maxscore  fileindex  sourceind  case
		my ($traf, undef, $maxscore, undef, undef, $case) = split /\t/, $line;

		# Blank or short lines carry no case label and never produced output.
		next if !defined $case;
		next if $traf eq 'tf';             # header row
		next if !exists $label_for{$case}; # neither 'positive' nor 'negative'

		print {$out} $maxscore, "\t", $label_for{$case}, "\n";
	}
	close($in);

	# Buffered write errors (e.g. a full disk) only surface at close time.
	close($out) or die "cannot close '$out_path': $!";
}



