#! /usr/bin/perl -w
use strict;
use warnings;

# Demultiplex the sequences in %bact by their 10-nt leading barcode.
#
# For every sequence that starts with one of the five known barcodes the
# barcode is removed from the sequence, the sequence id gets the suffix
# "_setN_<running number>", and the per-set counter is incremented.
# Afterwards an abundance report is printed to STDOUT.

# Set name => barcode, listed in the order in which they are tested.
my @barcode_sets = (
    [ set1 => 'CAGGTGGCAT' ],
    [ set2 => 'CATTGAAGCT' ],
    [ set3 => 'CTAAGTTCAG' ],
    [ set4 => 'CTAAGAACGT' ],
    [ set5 => 'CTGGAGGACT' ],
);

# NOTE(review): %bact is neither declared nor filled anywhere in the
# visible excerpt; presumably it maps a sequence id to its sequence
# string and is populated by loading code that is not shown -- confirm.
our %bact;

# Classify and trim every sequence of the given hash.
#
# Parameters:
#   $seq_of - reference to a hash of id => sequence string (not modified).
# Returns a two-element list:
#   - reference to a new hash of renamed id => barcode-stripped sequence;
#     sequences without a known barcode keep their id and value unchanged.
#   - reference to a hash of counts with the keys set1 .. set5 and
#     'unassigned'.
sub _demultiplex {
    my ($seq_of) = @_;

    my %count = ( unassigned => 0, map { $_->[0] => 0 } @barcode_sets );
    my %trimmed_of;

    # Sorted ids make the running-number suffixes reproducible between
    # runs; plain hash order is not stable.
    ID:
    for my $id ( sort keys %{$seq_of} ) {
        my $seq = $seq_of->{$id};

        if ( defined $seq ) {
            for my $set (@barcode_sets) {
                my ( $name, $barcode ) = @{$set};

                # The barcode has to sit at the very start of the sequence.
                next if index( $seq, $barcode ) != 0;

                $count{$name}++;
                $trimmed_of{ $id . '_' . $name . '_' . $count{$name} }
                    = substr $seq, length $barcode;
                next ID;
            }
        }

        # No known barcode: keep the record as it is instead of silently
        # counting it as set 5.
        $count{unassigned}++;
        $trimmed_of{$id} = $seq;
    }

    return ( \%trimmed_of, \%count );
}

my ( $demultiplexed, $count_of ) = _demultiplex( \%bact );

# Replace the old records by the renamed, barcode-stripped ones so that
# code following this section sees the result.
%bact = %{$demultiplexed};

my ( $set1count, $set2count, $set3count, $set4count, $set5count )
    = @{$count_of}{qw(set1 set2 set3 set4 set5)};

print "---------------------------------------------------------------\n";
print "-------- ABUNDANCE OF SEQUENCES WTHIN EACH SUBGROUP ----------\n";
print "number of sequences in set 1 CAGGTGGCAT sub group = $set1count \n";
print "number of sequences in set 2 CATTGAAGCT sub group = $set2count \n";
print "number of sequences in set 3 CTAAGTTCAG sub group = $set3count \n";
print "number of sequences in set 4 CTAAGAACGT sub group = $set4count \n";
print "number of sequences in set 5 CTGGAGGACT sub group = $set5count \n";

# Reported on STDERR so that the STDOUT report keeps its original layout.
warn "$count_of->{unassigned} sequence(s) carried none of the five barcodes and were left unchanged\n"
    if $count_of->{unassigned};

# ... (the source excerpt is elided from this point on)