From 07c40b0977795b3d21cdfeacb47ba443fd3d99b3 Mon Sep 17 00:00:00 2001
From: mestato
Date: Tue, 7 Jul 2015 11:25:45 -0400
Subject: [PATCH] New subroutine flag_multiSSRs, to identify SSRs that are in
 contigs with other SSRs.

---
 hwg_gssr_scripts/findSSRs_post_assembly.pl | 28 +++++++++++++++++++++++++---
 1 file changed, 25 insertions(+), 3 deletions(-)

diff --git a/hwg_gssr_scripts/findSSRs_post_assembly.pl b/hwg_gssr_scripts/findSSRs_post_assembly.pl
index 27b39cc..2f39a07 100755
--- a/hwg_gssr_scripts/findSSRs_post_assembly.pl
+++ b/hwg_gssr_scripts/findSSRs_post_assembly.pl
@@ -265,6 +265,10 @@ sub main{
 	parseP3_output($p3_output);
 	print "done.\n";
 
+	print "identifying sequences with >1 SSR...";
+	flag_multiSSRs();
+	print "done.\n";
+
 	##---------------------------------------------------------------
 	## Producing output - statistics
 
@@ -636,6 +640,27 @@ sub parseP3_output{
 }
 
 ###############################################################
+# Flag each SSR according to whether its contig holds other SSRs.
+# Walks %CONTIG_SSR_STARTS (contig => array ref of SSR start values) and
+# sets $SSR_STATS{<contig>_ssr<start>}{MULTI} to the string "False" when
+# the contig lists exactly one SSR start, or "True" otherwise.
+# Takes no arguments; the result is stored in %SSR_STATS.
+sub flag_multiSSRs{
+
+	foreach my $contig (keys %CONTIG_SSR_STARTS){
+		my $starts = $CONTIG_SSR_STARTS{$contig};
+		# the flag is a per-contig property, so compute it once
+		my $multi = (@$starts == 1) ? "False" : "True";
+		foreach my $start_index (@$starts){
+			my $ssr_id = $contig."_ssr".$start_index;
+			$SSR_STATS{$ssr_id}{MULTI} = $multi;
+		}
+	}
+
+	return;
+}
+
+###############################################################
 sub initiate_workbooks{
 	my $workbook = $_[0]; # file name
 	my $formats = $_[1]; # file name
@@ -680,9 +705,6 @@ sub _print_worksheet{
 
 }
 
-# my $multi_flag = 0;
-# ## skip contigs with more than one ssr
-# if(scalar @{ $CONTIG_SSR_STARTS{$contig}} == 1){
 # print $fastaout_fh ">$contig $motif.$ssrStart-$ssrEnd\n$seq\n";
 # #print "\t$forward\n";
 # $SSR_w_PRIMER_COUNT++;