#!/usr/bin/perl use warnings; use strict; use diagnostics; open( INFILE, "<", 'myosin.fasta') or die $!; #open original myosin.fasta for reading open( OUTFILE, ">", 'modifiedHeaders.fasta') or die $!; #open/create new fasta for writing my %headerHash; #create hash for the header my %seq; my %header; #loop through old file while (){ chomp; my $line = $_; # use if/then to seperate headers from seq, while regex to select only species name in header if ($line =~ /^>/){ my $header = $line; if ($header =~ /(>gi.*)\[(.+)\](>gi.*)\[(.+)\]/){ my $headerHash; $headerHash{$1} = $2; # return $headerHash; } else{ my $seq = $line; # return $seq ; print OUTFILE $headerHash, "\n", $seq, "\n"; } # if ($header =~ /(>gi.*)\[(.+)\](>gi.*)\[(.+)\]/){ # my $headerHash = $2;} #print $headerHash # print OUTFILE $headerHash{$2}, "\n", $seq, "\n"; } } #print OUTFILE $headerHash, "\n", $seq, "\n";