$ hexdump -C in.txt | head -1
00000000 e6 88 96 e5 95 8f 20 57 41 4b 55 4d 4f 4e 20 31 |...... WAKUMON 1|
$ unicode_char_name_fm_code_point.pl e6 88 96
e6 88 96 : U+6216: CJK UNIFIED IDEOGRAPH-6216
$ unicode_char_name_fm_code_point.pl e5 95 8f
e5 95 8f : U+554f: CJK UNIFIED IDEOGRAPH-554F
####
$ hexdump -C out.txt | head -1
00000000 c3 a4 c2 b8 2c 20 35 35 35 2e 37 30 38 35 35 36 |...., 555.708556|
$ unicode_char_name_fm_code_point.pl c3 a4
c3 a4 : U+e4: LATIN SMALL LETTER A WITH DIAERESIS
$ unicode_char_name_fm_code_point.pl c2 b8
c2 b8 : U+b8: CEDILLA
####
$ hexdump -C out2.txt | head -2
00000000 e4 b8 2c 20 35 35 35 2e 37 30 38 35 35 36 37 30 |.., 555.70855670|
00000010 39 33 36 0a e7 ac 31 34 ef bc 32 30 30 38 ef bc |936...14..2008..|
$ unicode_char_name_fm_code_point.pl e4 b8 2c
e4 b8 2c : U+4e2c: CJK UNIFIED IDEOGRAPH-4E2C ERROR! (turn on dbg prt stmt)
$ unicode_char_name_fm_code_point.pl e7 ac 31
e7 ac 31 : U+7b31: CJK UNIFIED IDEOGRAPH-7B31 ERROR! (turn on dbg prt stmt)
$ unicode_char_name_fm_code_point.pl ef bc 32
ef bc 32 : U+ff32: FULLWIDTH LATIN CAPITAL LETTER R ERROR! (turn on dbg prt stmt)