m{
# any of the 12 months:
(?: January |
February |
March |
April |
May |
June |
July |
August |
September |
October |
November |
December
)
\s # a space between month and day
[123]?\d # Is the first day 1, \s1, or 01?
, # a comma between day and year
\s? # an optional space between comma and year
[12]\d{3} # a four digit year
}xms
####
m{
# any of the 12 months:
(?: January |
February |
March |
April |
May |
June |
July |
August |
September |
October |
November |
December
)
(?:<.+?>|\s)* # zero or more tag like things or spaces
[123]?\d # Is the first day 1, \s1, or 01?
, # a comma between day and year
(?:<.+?>|\s)* # zero or more tag like things or spaces
[12]\d{3} # a four digit year
}xms
####
if ( $html =~ m{ ( blah blah as above blah blah ) }xms ) {
my $date = $1;
# remove the tags, if there are any
$date =~ s/<.+?>//g;
}