# Replace characters outside the Basic Latin block with the substitutions
# listed in %subs (keyed by numeric codepoint).
#
# Reads:    $string, %subs
# Writes:   $editted_copy  - copy of $string with known characters replaced
#           $string        - consumed destructively: every character outside
#                            Basic Latin has been removed once the loop ends

# Work on a copy, because the scan below eats $string as it goes.
$editted_copy = $string;

# Look for codepoints not in Basic Latin.  Each pass strips the first such
# character from $string, so the loop stops as soon as none are left.
while ( $string =~ s/(\P{InBasic_Latin})// ) {
    my $U_char      = $1;
    my $U_codepoint = ord($U_char);

    # ... and try to replace them.  Only a defined value counts as a usable
    # substitution; a missing key and an undef value are treated alike.
    my $replacement = $subs{$U_codepoint};

    if ( defined $replacement ) {

        # One occurrence is replaced per pass; repeated characters are
        # handled by later passes.  \Q...\E keeps the character literal
        # inside the pattern.
        $editted_copy =~ s/\Q$U_char\E/$replacement/;
    }
    else {

        # No substitution is known for this codepoint, so the character is
        # left as-is in $editted_copy.  Add the missing codepoint by hand to
        # the %subs hash and re-run until no codepoint causes problems.
    }
}
In reply to Re^4: One bird, two Unicode names
by RCH
in thread One bird, two Unicode names
by RCH
| For: | Use: |
| & | &amp; |
| < | &lt; |
| > | &gt; |
| [ | &#91; |
| ] | &#93; |