in reply to Re^7: POD style regex for inline HTML elements
in thread POD style regex for inline HTML elements
Will you please tell me what I am missing after I took all of the comments out? I'm still getting an infinite loop when these are nested with the error Use of uninitialized value in numeric gt (>) at files/lib/Base/HTML/Inline.pm line 32, <DATA> line 19.
Well, first thing is a call that calls the code .. word problems are hard :) when what is nested?
#!/usr/bin/perl -- use strict; use warnings; use Test::More qw' no_plan '; use Data::Dump qw/ dd pp /; { my $in = 'SPAN<text I<italic text>|class="span_class"> some more t +ext B<bold text>.'; my $out = Base::HTML::Inline::inline($in); my $wanted = '<span class="span_class">text <i>italic text</i></sp +an> some more text <b>bold text</b>.'; is( $out, $wanted , 'shabba'); } { my $in = 'SPAN<text I<italic B<and bold> text>|class="span_class"> + some more text B<bold text>.'; my $out = Base::HTML::Inline::inline($in); my $wanted = '<span class="span_class">text <i>italic <b>and bold< +/b> text</i></span> some more text <b>bold text</b>.'; is( $out, $wanted , 'shabba'); } { my $in = undef;; my $out = Base::HTML::Inline::inline( undef ); my $wanted = ''; is( $out, $wanted , 'a warning with infinite loop?'); } exit( 0 ); BEGIN { $INC{'Base/HTML/Inline.pm'} = __FILE__; package Base::HTML::Inline; use strict; use warnings; use Exporter qw(import); our @EXPORT_OK = qw(inline); # Written by an Anonymous Monk on PerlMonks (http://www.perlmonks.org/ +?node_id=1028699) #~ use Test::More qw' no_plan '; #~ use Regexp::Common qw/ balanced /; #~ use Data::Dump qw/ dd pp /; use vars qw/ $re_balanced_angles /; sub TRACE; sub DEBUG; *TRACE = *DEBUG = sub { print STDERR @_,"\n" }; our $re_balanced_angles = qr{\<(?:(?>[^\<\>]+)|(??{ $re_balanced_angle +s }))*\>}x; our $allowed = join '|', qw[ A ABBR ACRONYM B BIG CITE CODE DFN EM I KBD Q SAMP SMALL SPAN STRONG SUB SUP TT VAR ]; sub inline { local $_ = $_[0]; my $dent = $_[1] || 0; pos = 0; my $ret = ""; inlineLOOP: while( length > pos ){ m{\G(\s+)}gcsx and do { $ret .= $1; next inlineLOOP; }; m{\G( $allowed )( $re_balanced_angles )}gcsx and do { TRACE "# $dent allowed<> { $1 ( $2 ) }"; $ret .= inline_allowed( "$1" , "$2" , $dent ); next inlineLOOP; }; m{\G([^<]+\s)}gcmx and do { TRACE "# $dent text { $1 }"; $ret .= inline_text( "$1" ); next inlineLOOP; };;; m{\G([\<\>])}gcmx and do { TRACE "## $dent error-stray<> { $1 } at pos(@{[pos]})"; last inlineLOOP; };;; m{\G(\S)}gcmx and do { TRACE "# $dent inch-forward { $1 }"; $ret .= inline_text( "$1" ); next inlineLOOP; };;; } $ret; } sub inline_allowed { my( $tag , $stuff, $dent ) = @_; $stuff = $1 if $stuff =~ m{^<(.*)>$}gs; my $ret = ""; $ret .= "<\L$tag\E" if $tag; $stuff =~ s{\|([^<>]+)$}{$ret .= " $1"; "";}gsex if defined $stuff + ; ## inline_allowed_atts($tag,$1); $ret .= ">" if $tag; if( defined $stuff and length $stuff and $stuff =~ m{[<>]}g ){ $ret .= inline( $stuff , $dent+1) ; ## recurse } else { $ret .= $stuff; } $ret .= "</\L$tag\E>" if $tag; $ret; } sub inline_text { join'',@_ } 1; } ## end BEGIN __END__ # 0 allowed<> { SPAN ( <text I<italic text>|class="span_class"> ) } # 1 text { text } # 1 allowed<> { I ( <italic text> ) } # 0 text { some more text } # 0 allowed<> { B ( <bold text> ) } # 0 inch-forward { . } ok 1 - shabba # 0 allowed<> { SPAN ( <text I<italic B<and bold> text>|class="span_cl +ass"> ) } # 1 text { text } # 1 allowed<> { I ( <italic B<and bold> text> ) } # 2 text { italic } # 2 allowed<> { B ( <and bold> ) } # 2 inch-forward { t } # 2 inch-forward { e } # 2 inch-forward { x } # 2 inch-forward { t } # 0 text { some more text } # 0 allowed<> { B ( <bold text> ) } # 0 inch-forward { . } ok 2 - shabba Use of uninitialized value $_ in scalar assignment at - line 61. Use of uninitialized value in numeric gt (>) at - line 64. ok 3 - a warning with infinite loop? 1..3
|
|---|