# Parse the XML file "xml_invalid_char.input" with XML::Simple and dump the
# resulting data structure to STDOUT for inspection.
use strict;
use warnings;

use XML::Simple;
# Data::Dumper must be loaded explicitly: XML::Simple does not export Dumper,
# and without it `print Dumper $ref` is parsed as a print to an unopened
# filehandle named "Dumper", so nothing is ever written.
use Data::Dumper;

# XMLin reads the named file and returns the parsed document.
my $ref = XMLin("xml_invalid_char.input");

# Parentheses make it unambiguous that Dumper is a function call, not a handle.
print Dumper($ref);

# NOTE(review): the text below was trailing the original one-liner; presumably
# it is a sample of the offending input content -- confirm before removing.
#### ?s«ndjfr?1 S334µµ!