##
## Fetch the infocenter table-of-contents page and keep a copy of the
## response body on disk as content.html.
my $browser  = LWP::UserAgent->new;
my $response = $browser->get( "http://publib.boulder.ibm.com/infocenter/brjrules/v7r0m3/basic/tocView.jsp?toc=/com.ibm.websphere.ilog.jrules.doc/toc.xml" );

## Stop on a failed request instead of saving and processing an error page.
die "GET failed: ", $response->status_line, "\n"
    unless $response->is_success;

## Use the public accessor rather than reaching into the object's private
## {_content} slot. content() hands back the body as received (not
## charset-decoded), which is what the old hash lookup produced.
my $content = $response->content;

## Lexical handle + three-argument open; open, print and close are all
## checked so a write failure is reported instead of silently ignored.
open( my $out, '>', 'content.html' )
    or die "Cannot open content.html for writing: $!\n";
print {$out} $content
    or die "Cannot write to content.html: $!\n";
close($out)
    or die "Cannot close content.html: $!\n";
####
## Ask Perl to interpret the bytes held in $content as UTF-8 and turn them
## into characters, in place. The return value is not inspected.
utf8::decode($content);

## One character that should be made visible: any control character below
## U+0020 except tab, line feed and carriage return, or anything from
## U+0080 upwards. Plain printable ASCII (and DEL, 0x7F) is left alone.
my $unprintable_char = qr{ ([\x00-\x08\x0B\x0C\x0E-\x1F\x80-\x{1FFFFF}]) }x;

## Replace each such character with a literal "[U+XXXX]" tag carrying its
## code point in upper-case hex, zero-padded to at least four digits.
$content =~ s{$unprintable_char}{ sprintf('[U+%04X]', ord($1)) }ge;
####
What[U+2019]s new