#!/usr/local/bin/perl

=head1 NAME

cgrep - print lines matching a pattern

=head1 SYNOPSIS

B<cgrep> [I<options>] I<PATTERN> [I<FILES>]

=head1 DESCRIPTION

B<Cgrep> searches for I<PATTERN> in text files, and prints matching lines.
I<PATTERN> can be a perl regular expression, or a fixed string.

B<Cgrep> reads all files specified in I<FILES>, or stdin if no I<FILES>
are given.  Directories are ignored.
Every line is matched with I<PATTERN> separately.  I<PATTERN>
is interpreted as a perl regular expression by default, but as a fixed
string if the B<-F> flag is set.  In normal operation mode, B<cgrep> prints
matching lines.  Exit code is 0 if any matches are found, 1 if no matches
were found.

=head1 OPTIONS

Long options can be abbreviated to a unique prefix, and can be
negated with a B<no-> prefix.  A double hyphen stops option processing,
allowing you to use filenames starting with a minus.

=over

=item B<-A> I<NUM1>, B<--after-context=>I<NUM1>; 
    B<-B> I<NUM2>, B<--before-context=>I<NUM2>

Print context lines around matches, as with B<-C>.
These options, however, set the number of context lines
after and before matches to I<NUM1> and I<NUM2> respectively.
If only one of the options is given, context lines will
be printed only after or only before the match resp.

=item B<-C> I<NUM>, B<--context=>I<NUM>

Print I<NUM> lines of context before and after each match.

Also, print a line containing C<--> between non-adjacent chunks
of lines.
If any of B<-n>, B<-h>, B<-p>, B<-P> is enabled, the separator
before the line and the prefixes will be a colon on 
matching lines, and a hyphen in context lines.

=item B<-e> I<PATTERN>, B<--pattern=>I<PATTERN>

A different way to specify I<PATTERN>.
If this option is used, all non-option arguments are filenames.
If not used, the first non-option argument is the I<PATTERN>.

=item B<-E>, B<--perl-regexp>

Interpret I<PATTERN> as a perl regexp.  This is the default.
Perl regexps are NFA, see L<perlre(1)> for details of syntax and semantics.

=item B<-F>, B<--fixed-strings>

Interpret I<PATTERN> as fixed string, not a regexp.

=item B<-h>, B<--with-no-filename>

Do not print filename before each line printed.  
This is the default if there is only one I<FILE> given.

=item B<-H>, B<--with-filename>

Print filename before each line.  This is the default if
more than one I<FILES> are given.

=item B<-i>, B<--fold-case>

Interpret I<PATTERN> case insensitively.  Works with both 
regexp pattern and fixed strings.

=item B<-l>, B<--files-with-match>

Print the lists of files that have any matching lines.

Stop reading the file at the first match.
This suppresses normal operation mode, that is, printing
matching lines.  The options B<-ABChHnpP> do not make
sense in combination with B<-l>.

=item B<-L>, B<--files-without-match>

Prints the lists of files having no matching lines.
Similar to B<-l> otherwise.

=item B<-n>, B<--line-number>

Print line number before each line printed.

=item B<-p>, B<--show-function>

Prints current function name before each line.

=item B<-P> I<REGEXP>, B<--function-regexp=>I<REGEXP>

Defines how function names are found.  Implies B<-p>.

Lines matching I<REGEXP> are taken to be function
headers.  I<REGEXP> is a perl regexp, unaffected by
B<-F>, B<-i>, B<-v>.  The last matching capture in it
should return the function name.

The default regexp is C<^(\w+)>, suitable for C.

=item B<-s>, B<--no-messages>

Do not print warnings about files that can't be opened.

=item B<-q>, B<--silent>

Do not print anything, just give the return value.

Stops execution at very first match.

=item B<-v>, B<--invert-match>

Inverts the sense of the match, that is, searches for
lines not matching I<PATTERN>.

=back

=head1 SEE ALSO

L<egrep(1)>, L<perlre(1)>

=head1 AUTHOR

<ambrus@math.bme.hu>

=cut

use warnings;
use strict;

use Getopt::Long;
use IO::Handle;


{

# State shared by every sub in this block.
#   $cregexp          compiled search pattern (built in parseopts)
#   @filenames        input files taken from the command line
#   $complement       true when the match sense is inverted
#   $found_any        set to 1 once any line has been selected
#   $match, $endfile  code refs chosen in parseopts: $match is called for
#                     each selected or context line, $endfile at end of file
#   $print_filename, $print_lineno, $print_func
#                     which prefixes print_match writes before a line
#   $before_context, $after_context, $context
#                     context line counts, and whether context is enabled
#   $hush_messages    true to silence warnings
#   $func_cregexp     compiled pattern that recognises function headers
#   $file, $filename  handle and name of the input being scanned
#   $anyoutput, $lastoutput
#                     bookkeeping print_match uses to place "--" separators
my($cregexp, @filenames, $complement, $found_any, $match, $endfile,
    $print_filename, $print_lineno, $before_context, $after_context, 
    $context, $hush_messages, $print_func, $func_cregexp, 
    $file, $filename, $anyoutput, $lastoutput);


# Entry point: parse the command line, then scan each input in turn.
#
# With no file arguments, standard input is scanned instead.  Files that
# cannot be opened are reported (unless warnings are hushed) and skipped;
# directories are skipped silently.
#
# Returns the process exit status: 0 if any line was selected, 1 otherwise.
sub main {
    parseopts();
    $found_any = 0;
    # A single undef entry stands for "read standard input".
    @filenames or @filenames = (undef);
    for my $n (@filenames) {
        if (defined $n) {
            $filename = $n;
            open $file, "<", $n or do {
                $hush_messages or warn qq[error opening file "$n": $!];
                next;
            };
        } else {
            # Give stdin a printable name so the filename prefix and the
            # file-listing modes never print an undefined value.
            $filename = "(standard input)";
            $file = *STDIN;
        }
        if (-d $file) {
            # Do not leave the directory handle open while moving on.
            close $file;
            next;
        }
        process_file();
        close $file;
    }
    return $found_any ? 0 : 1;
}


# Scan the currently open input ($file) line by line.
#
# Each line is chomped and tested against $cregexp; a line is selected when
# the match result differs from $complement.  Selected lines are handed to
# the $match callback as ($line, $lineno, $func, 1).  When context is
# enabled, surrounding lines are handed over with a final flag of 0:
# buffered "before" lines are flushed ahead of a selected line, and up to
# $after_context lines following it are passed on directly.
#
# $func tracks the most recent function header seen (last capture of
# $func_cregexp) when function display is enabled.
#
# $endfile is called once the input is exhausted, unless a callback left
# the READ block early via nextfile().
sub process_file {
    my ($after, $func, @before) = (0, undef);
    $lastoutput = -1;
    READ: {
        while (defined(my $line = <$file>)) {
            chomp $line;
            # $. is the line number of the handle just read from.
            my $lineno = $.;
            if ($print_func and $line =~ /$func_cregexp/) {
                $func = $+;
            }
            my $hit = $line =~ /$cregexp/;
            if ($hit xor $complement) {
                $found_any = 1;
                if ($context) {
                    # Flush pending "before" lines, explicitly flagged as
                    # context (0) rather than as matches.
                    for my $ctx (@before) {
                        $match->(@$ctx, 0);
                    }
                    @before = ();
                    $after = $after_context;
                }
                $match->($line, $lineno, $func, 1);
            }
            elsif ($context) {
                if ($after > 0) {
                    $match->($line, $lineno, $func, 0);
                    $after--;
                }
                else {
                    # Keep at most $before_context lines in the buffer.
                    push @before, [$line, $lineno, $func];
                    shift @before if @before > $before_context;
                }
            }
        }
        $endfile->();
    }
}


# Abandon the rest of the current input by leaving the READ block in
# process_file, which also skips the $endfile call at the end of that block.
sub nextfile {
    # Leaving a sub through "last" normally warns; here it is intentional.
    no warnings "exiting";
    last READ;
}


# Default $match callback: print one line with its optional prefixes.
#
# Arguments: line text, line number, current function name (may be undef),
# and a flag that is true for a selected line and false for a context line.
# Prefix fields are followed by ":" on selected lines and "-" on context
# lines.  With context enabled, a "--" line is written first whenever this
# line does not directly follow the previously printed one.
sub print_match {
    my ($text, $num, $fn_name, $is_match) = @_;

    if ($context) {
        print "--\n" if $anyoutput && $lastoutput != $num - 1;
        $anyoutput  = 1;
        $lastoutput = $num;
    }

    my $sep = $is_match ? ":" : "-";
    my @fields;
    push @fields, $filename, $sep if $print_filename;
    push @fields, $fn_name,  $sep if $print_func && defined $fn_name;
    push @fields, $num,      $sep if $print_lineno;
    print @fields, $text, "\n";
}


# $match callback for listing files that contain a match: on the first
# selected line (fourth argument true) print the file name and stop
# reading this file.  Context lines are ignored.
sub print_name_exit {
    my $is_match = $_[3];
    return unless $is_match;
    print $filename, "\n";
    nextfile();
}

# $match callback for listing files without a match: a selected line
# (fourth argument true) means this file is not listed, so stop reading
# it.  Context lines are ignored.
sub found_exit {
    my $is_match = $_[3];
    return unless $is_match;
    nextfile();
}

# $match callback for silent mode: terminate the whole program with exit
# status 0 as soon as a selected line (fourth argument true) is seen.
# Context lines (flag false) are ignored and the sub simply returns.
sub found_exit_zero {
    $_[3] or return;
    # The outcome is already known, so stop reading any further input.
    exit 0;
}

# $endfile callback: write the current file name on a line of its own.
sub print_filename {
    my @out = ($filename, "\n");
    return print @out;
}

# Callback that does nothing; used where no end-of-file action is wanted.
sub noop {
    return;
}

# Parse @ARGV and initialise the shared search state.
#
# Sets the compiled pattern ($cregexp), the file list (@filenames), the
# output switches, the context sizes, and the $match / $endfile callbacks
# that implement the selected mode (normal, -l, -L or -q).
#
# The pattern comes from -e/--pattern if given, otherwise from the first
# non-option argument.  Dies on invalid options or a missing pattern.
sub parseopts {
    my ($regexp, $plain, $ignorecase);
    my $mode = "";
    ($before_context, $after_context) = (0, 0);
    $func_cregexp = qr/^(\w+)/;

    Getopt::Long::Configure("bundling", "gnu_compat", "prefix_pattern=(--|-)");
    GetOptions(
        "fixed-strings|F!" => sub { $plain = $_[1] },
        "extended-regexp|perl-regexp|E!" => sub { $plain = !$_[1] },
        "pattern|e=s" => sub { $regexp = $_[1] },
        "invert-match|complement-match|v!" => sub { $complement = $_[1] },
        "filename|with-filename|H!" => sub { $print_filename = $_[1] },
        "with-no-filename|h!" => sub { $print_filename = !$_[1] },
        # "igore-case" is a historical misspelling kept as an alias.
        "ignore-case|igore-case|fold-case|y|i!" => sub { $ignorecase = $_[1] },
        "line-number|n!" => sub { $print_lineno = $_[1] },
        "context|C=n" => sub { $after_context = $before_context = $_[1] },
        "after-context|A=n" => sub { $after_context = $_[1] },
        "before-context|B=n" => sub { $before_context = $_[1] },
        "files-with-match|list|l!" => sub { $mode = $_[1] ? "l" : "" },
        # Accept the documented plural spelling as well as the old one.
        "files-without-match|file-without-match|missing|L!" =>
            sub { $mode = $_[1] ? "L" : "" },
        "quiet|silent|q" => sub { $mode = $_[1] ? "q" : "" },
        "no-messages|hush-messages|s" => sub { $hush_messages = $_[1] },
        "show-function|function|p!" => sub { $print_func = $_[1] },
        "function-regexp|P=s" =>
            sub { $func_cregexp = qr/$_[1]/; $print_func = 1 },
    ) or die 'invalid option; usage: cgrep [options] regexp [filenames]';

    defined($regexp) or $regexp = shift @ARGV;
    defined($regexp)
        or die 'required argument missing; usage: cgrep [options] regexp [filenames]';

    # Warn about egrep-style word anchors: a backslash followed by < or >.
    if (!$plain && $regexp =~ /\\[<>]/) {
        $hush_messages
            or warn 'warning: \< and \> are not special in perl regexen';
    }
    $plain and $regexp = quotemeta $regexp;
    my $mods = $ignorecase ? "i" : "";
    $cregexp = qr/(?$mods:$regexp)/;

    @filenames = @ARGV;
    # Default: prefix file names only when several files are searched.
    defined($print_filename) or $print_filename = @filenames > 1;
    $context = 1 if $before_context > 0 || $after_context > 0;

    # Per-mode callbacks: [ called per line, called at end of file ].
    my %callbacks_for = (
        ""  => [ \&print_match,     \&noop ],
        "l" => [ \&print_name_exit, \&noop ],
        "L" => [ \&found_exit,      \&print_filename ],
        "q" => [ \&found_exit_zero, \&noop ],
    );
    my $callbacks = $callbacks_for{$mode}
        or die "internal error: invalid mode: $mode";
    ($match, $endfile) = @$callbacks;
}


# Run the program.  main() returns a false value when any line was selected
# (exit status 0) and 1 otherwise.
exit main();

}

__END__
[download]
In reply to cgrep: Egrep clone with function name display by ambrus
Are you posting in the right place? Check out Where do I post X? to know for sure.
Posts may use any of the Perl Monks Approved HTML tags. Currently these include the following:
<code> <a> <b> <big> <blockquote> <br /> <dd> <dl> <dt> <em> <font> <h1> <h2> <h3> <h4> <h5> <h6> <hr /> <i> <li> <nbsp> <ol> <p> <small> <strike> <strong> <sub> <sup> <table> <td> <th> <tr> <tt> <u> <ul>
Snippets of code should be wrapped in <code> tags not <pre> tags. In fact, <pre> tags should generally be avoided. If they must be used, extreme care should be taken to ensure that their contents do not have long lines (<70 chars), in order to prevent horizontal scrolling (and possible janitor intervention).
Want more info? How to link or How to display code and escape characters are good places to start.

P is for Practical
	PerlMonks