# Sanitise $freeformtext in place: delete every character that is neither
# printable (POSIX [:print:]) nor one of the explicitly allowed codes below.
#
# The pattern reads "a non-printable character that is NOT on the allow-list";
# each such character is replaced with nothing, everywhere in the string.
$freeformtext =~ s{
    (?!                 # Not followed by an allow-listed character:
        \n              #   end-of-line character
      | \x85            #   MS Word ellipsis
      | \x91            #   MS Word single opening quote
      | \x92            #   MS Word single closing quote
      | \x93            #   MS Word double opening quote
      | \x94            #   MS Word double closing quote
      | \x96            #   MS Word en dash
      | \x97            #   MS Word em dash
      | \x99            #   MS Word trademark symbol
      | \xA7            #   MS Word section symbol
      | \xA9            #   MS Word copyright symbol
      | \xAE            #   MS Word registered symbol
    )
    [^[:print:]]        # ...then consume one non-printable character
}{}gx;