Mercurial > repos > devteam > generate_pc_lda_matrix
diff generate_matrix_for_pca_lda.pl @ 0:263a3b92368b draft default tip
Imported from capsule None
author | devteam |
---|---|
date | Mon, 28 Jul 2014 11:30:18 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/generate_matrix_for_pca_lda.pl Mon Jul 28 11:30:18 2014 -0400 @@ -0,0 +1,147 @@ +#!/usr/bin/perl -w + +use strict; +use warnings; + +my $Input_Matrix = $ARGV[0]; +my $Input_Label = $ARGV[1]; + +my %Hash_X = (); +my %Hash_Y = (); +my $My_Num_X = 0; +my $My_Num_Y = 0; + +open (OUT, "> $ARGV[2]"); + +open (LABEL, "< $Input_Label") || + die "Sorry, I couldn't open the escape.txt for clone: $!\n"; + +my $Label_Index = 0; +my $X_Label; +my $input_Label; +while (defined($input_Label = <LABEL>)){ + chomp($input_Label); + my @cArray_Label = $input_Label =~ /(\S+)\s*/g; + if ($input_Label =~ /\w/){ + if ($Label_Index == 0){ + $Hash_X{$cArray_Label[0]} = $cArray_Label[1]; + $X_Label = $cArray_Label[1]; + $Label_Index = 1; + }else{ + if ($cArray_Label[1] eq $X_Label){ + $Hash_X{$cArray_Label[0]} = $cArray_Label[1]; + }else{ + $Hash_Y{$cArray_Label[0]} = $cArray_Label[1]; + } + } + } +} +close(LABEL); + +open (MATRIX, "< $Input_Matrix") || + die "Sorry, I couldn't open the escape.txt for clone: $!\n"; + +my %Hash_Matrix = (); +my %Hash_Features = (); +my @cArray_Features = (); + +my %Hash_Sum = (); +my $Matrix_Index = 0; +my $input_Matrix; +while (defined($input_Matrix = <MATRIX>)){ + chomp($input_Matrix); + my @cArray_Matrix = $input_Matrix =~ /(\S+)\s*/g; + if ($input_Matrix =~ /\w/){ + if ($Matrix_Index == 0){ + @cArray_Features = @cArray_Matrix; + my $Temp_Num_Array = scalar(@cArray_Matrix); + my $Temp_Index = 0; + for(;$Temp_Index < $Temp_Num_Array; $Temp_Index++){ + $Hash_Features{$cArray_Matrix[$Temp_Index]} = "BOL"; + $Hash_Sum{$cArray_Matrix[$Temp_Index]} = 0; + } + $Matrix_Index = 1; + }else{ + $Hash_Matrix{$cArray_Matrix[0]} = $input_Matrix; + } + } +} +close(MATRIX); + +my $Trace_Key; + +foreach $Trace_Key (sort {$a cmp $b} keys %Hash_X){ + my @cArray_Trace_X = $Hash_Matrix{$Trace_Key} =~ /(\S+)\s*/g; + my $Num_Array_Feature_X = scalar(@cArray_Features); + my $Index_Feature_X = 0; + for(;$Index_Feature_X < $Num_Array_Feature_X; $Index_Feature_X++){ + if ($Hash_Features{$cArray_Features[$Index_Feature_X]} eq "BOL"){ + $Hash_Features{$cArray_Features[$Index_Feature_X]} = $cArray_Trace_X[$Index_Feature_X + 1]; + }else{ + $Hash_Features{$cArray_Features[$Index_Feature_X]} = $Hash_Features{$cArray_Features[$Index_Feature_X]} . "\t" . $cArray_Trace_X[$Index_Feature_X + 1]; + } + + $Hash_Sum{$cArray_Features[$Index_Feature_X]} += $cArray_Trace_X[$Index_Feature_X + 1]; + } + $My_Num_X ++; +} + +my $Append_Key; +foreach $Append_Key (keys %Hash_Features){ + $Hash_Features{$Append_Key} = $Hash_Features{$Append_Key} . "\t" . $Hash_Sum{$Append_Key}; + $Hash_Sum{$Append_Key} = 0; +} + +foreach $Trace_Key (sort {$a cmp $b} keys %Hash_Y){ + my @cArray_Trace_Y = $Hash_Matrix{$Trace_Key} =~ /(\S+)\s*/g; + my $Num_Array_Feature_Y = scalar(@cArray_Features); + my $Index_Feature_Y = 0; + for(;$Index_Feature_Y < $Num_Array_Feature_Y; $Index_Feature_Y++){ + if ($Hash_Features{$cArray_Features[$Index_Feature_Y]} eq "BOL"){ + $Hash_Features{$cArray_Features[$Index_Feature_Y]} = $cArray_Trace_Y[$Index_Feature_Y + 1]; + }else{ + $Hash_Features{$cArray_Features[$Index_Feature_Y]} = $Hash_Features{$cArray_Features[$Index_Feature_Y]} . "\t" . $cArray_Trace_Y[$Index_Feature_Y + 1]; + } + + $Hash_Sum{$cArray_Features[$Index_Feature_Y]} += $cArray_Trace_Y[$Index_Feature_Y + 1]; + } + $My_Num_Y ++; +} + +foreach $Append_Key (keys %Hash_Features){ + $Hash_Features{$Append_Key} = $Hash_Features{$Append_Key} . "\t" . $Hash_Sum{$Append_Key} . "\t" . "EOL"; +} + +my $Prt_Key; +print OUT " \t"; +foreach $Prt_Key (sort {$a cmp $b} keys %Hash_X){ + print OUT "$Prt_Key \t"; +} +print OUT "X(SUM) \t"; + +foreach $Prt_Key (sort {$a cmp $b} keys %Hash_Y){ + print OUT "$Prt_Key \t"; +} +print OUT "Y(SUM) \t"; +print OUT "\n"; + +my $Prt_Index = 0; +my $Prt_Array_Num = scalar (@cArray_Features); +for(;$Prt_Index < $Prt_Array_Num; $Prt_Index++){ + print OUT "$cArray_Features[$Prt_Index] \t$Hash_Features{$cArray_Features[$Prt_Index]}\n"; +} + +print OUT " \t"; +my $My_Label_Index = 0; +for(;$My_Label_Index < $My_Num_X; $My_Label_Index++){ + print OUT "X \t"; +} +print OUT " \t"; + +$My_Label_Index = 0; +for(;$My_Label_Index < $My_Num_Y; $My_Label_Index++){ + print OUT "Y \t"; +} +print OUT " \t\n"; + +close(OUT);