comment on

good i have done that'

 

use strict;
use warnings;

#use List::MoreUtils qw(uniq); // i have tried this to handle the dupl
+icated emails
use Data::Dumper qw(Dumper);
my $Directory = $ARGV[0]; #Directory to scan for emails
my $Filename =$ARGV[1];  # where to write out found emails note: avoid
+ forever  loop make sure it's not the same directory

my $success   = "\n [+] $0 is Scanning For E-mails \n\n";
my $tryagain    = "\n [?] perl $0 Directory fileto.txt \n\n";
if (@ARGV != 2) { print $tryagain; exit(); } else { print $success; }
sub uniq {  #and this to handle the duplicated emails
    return keys %{{ map { $_ => 1 } @_ }};
}

#sub uniq {  #with this to handle the duplicated emails
 #   my %seen;
 #   grep !$seen{$_}++, @_;
#}

my $total_filesscanned = 0;
my $total_email = 0;
my @files = grep ( -f ,<$Directory*.txt*>); #scanning directory


open(my $fh, '>>', $Filename);
 foreach my $file (@files) {
$total_filesscanned++;  # begin to count numbers of file to be scanned
open my $open, '<', $file or die $!;
    while (<$open>) {
    
    
        chomp;
        my @findemails = split(' ');
        my @filtered = uniq(@findemails);  # meant to avoid duplicates
        #my @filtered  = join(" ", uniq(@findemails)); also took this 
+aproach
        
        
        foreach my $emails (@filtered) { 
          
            if($emails =~ /^\w+\@([\da-zA-Z\-]{1,}\.){1,}[\da-zA-Z-]{2
+,6}$/) { #grab the emails
    $total_email++;   # begin to count emails
 print $fh "$emails\n"; # write the emails to file
            
            } 
            }
        
            
        }
        
             
    close $file; # close files
      print "$file\n";
        
    }
    
    close $fh; # close the file to write
    
    #my $removed = @findemails - @filtered; # am expecting it to avoid
+ duplicate emails but it's not working
     print "Files Scanned: $total_filesscanned\n";
     print "E-mail Found: $total_email\n";
     #print "Filtered Total: $removed\n";
     print "done\n";
[download]

The beginning of knowledge is the discovery of something we do not understand.
Frank Herbert (1920 - 1986)

In reply to Re^2: Help with removing duplicates in array by beanscake
in thread Help with removing duplicates in array by beanscake

Posts are HTML formatted. Put <p> </p> tags around your paragraphs. Put <code> </code> tags around your code and data!

Titles consisting of a single word are discouraged, and in most cases are disallowed outright.

Read Where should I post X? if you're not absolutely sure you're posting in the right place.

Please read these before you post! —

Posts may use any of the Perl Monks Approved HTML tags:

a, abbr, b, big, blockquote, br, caption, center, col, colgroup, dd, del, details, div, dl, dt, em, font, h1, h2, h3, h4, h5, h6, hr, i, ins, li, ol, p, pre, readmore, small, span, spoiler, strike, strong, sub, summary, sup, table, tbody, td, tfoot, th, thead, tr, tt, u, ul, wbr

You may need to use entities for some characters, as follows. (Exception: Within code tags, you can put the characters literally.)

	For:		Use:
	&		`&`
	<		`<`
	>		`>`
	[		`[`
	]		`]`

Link using PerlMonks shortcuts! What shortcuts can I use for linking?

See Writeup Formatting Tips and other pages linked from there for more info.