- or download this
$ hexdump -C in.txt | head -1
00000000 e6 88 96 e5 95 8f 20 57 41 4b 55 4d 4f 4e 20 31 |...... WAKUMON 1|
...
e6 88 96 : U+6216: CJK UNIFIED IDEOGRAPH-6216
$ unicode_char_name_fm_code_point.pl e5 95 8f
e5 95 8f : U+554f: CJK UNIFIED IDEOGRAPH-554F
- or download this
$ hexdump -C out.txt | head -1
00000000 c3 a4 c2 b8 2c 20 35 35 35 2e 37 30 38 35 35 36 |...., 555.708556|
...
c3 a4 : U+e4: LATIN SMALL LETTER A WITH DIAERESIS
$ unicode_char_name_fm_code_point.pl c2 b8
c2 b8 : U+b8: CEDILLA
- or download this
$ hexdump -C out2.txt | head -2
00000000 e4 b8 2c 20 35 35 35 2e 37 30 38 35 35 36 37 30 |.., 555.70855670|
...
e7 ac 31 : U+7b31: CJK UNIFIED IDEOGRAPH-7B31 ERROR! (turn on dbg prt stmt)
$ unicode_char_name_fm_code_point.pl ef bc 32
ef bc 32 : U+ff32: FULLWIDTH LATIN CAPITAL LETTER R ERROR! (turn on dbg prt stmt)