#!/usr/bin/perl -nw
#
# Written by Laurent Moss
#
# Line filter: reads text from STDIN (or the files named on the command
# line), replaces a few Microsoft Word punctuation bytes with plain ASCII,
# re-encodes each line from ISO-8859-1 to UTF-8, and prints it to STDOUT.
#
# The -n switch on the #! line wraps everything below in an implicit
# "while (<>) { ... }" loop, so each statement runs once per input line
# with the current line in $_.

use strict;
use warnings;
use Encode;

# Replace Microsoft Word punctuation. These bytes are printable characters
# in Windows-1252 but fall in the C1 control range of ISO-8859-1, so they
# must be rewritten BEFORE the encoding conversion below.
#
# 0x91/0x92: curly single quotes -> backslash + apostrophe (presumably so
# the quote stays escaped inside SQL dump string literals; confirm against
# the data being converted).
# NOTE(review): in the collapsed original it is ambiguous whether this
# substitution was active or commented out; it is treated as active here.
s/[\x91\x92]/\\'/g;
# 0x96/0x97: en dash / em dash -> ASCII hyphen.
s/[\x96\x97]/-/g;
# 0x9C: lowercase oe ligature -> "oe".
s/\x9C/oe/g;
# 0x8C: uppercase OE ligature -> "OE".
s/\x8C/OE/g;

# Change encoding: convert the line in place from ISO-8859-1 to UTF-8.
# Any other byte in 0x80-0x9F that was not handled above is carried over
# as the corresponding C1 control character.
Encode::from_to($_, 'iso-8859-1', 'utf8');

print;

Note: I used this script when upgrading old MySQL 3 Tiki installations to more recent database versions.

MS Word special characters, such as curly quotes, could be replaced by a question mark (?).
