# Concatenate all your records into a single data stream and pipe it
# through this perl command line:
#
#   perl -ne 'tr/\x00-\x7f//d; $ch{$_}++ for (split//); END{printf("%x %d\n",ord,$ch{$_}) for (sort keys %ch)}'
#
# It prints a histogram of the non-ASCII byte values in the input: one line
# per distinct value, giving the value in hex followed by its count.