# Repair XHTML files in which every *byte* of a UTF-8 sequence was written out
# as its own decimal character reference (e.g. "&#195;&#169;" instead of
# "&#233;" for U+00E9).
#
# Flags:
#   -i.unmangled.by.$$  edit the files in place, keeping a backup of each one
#                       with the suffix ".unmangled.by.<shell PID>"
#   -MEncode            load Encode for decode_utf8()
#   -C0                 explicitly turn off Perl's Unicode I/O features, so the
#                       lines are read and written as raw bytes
#   -p                  run the code on every input line and print the result
#
# Steps performed on each line:
#   1. Turn decimal references in the range 128..255 back into single bytes.
#      References outside that range are left untouched: values below 128 may
#      be escaped markup such as "&#38;" or "&#60;" that must stay escaped, and
#      values above 255 cannot be a byte (chr() would create a wide character,
#      which decode_utf8() refuses to decode).
#   2. Decode the line as UTF-8. The second argument (CHECK = 1) makes
#      decode_utf8() die on malformed input rather than substitute characters.
#   3. Write every non-ASCII character back as ONE decimal reference.
#
# Hexadecimal references ("&#xC3;") are not matched and pass through unchanged.
$ perl -i.unmangled.by.$$ -MEncode -C0 -pe 's/(&#(\d+);)/$2 >= 128 && $2 <= 255 ? chr($2) : $1/ge; $_ = decode_utf8($_, 1); s/(\P{ASCII})/"&#".ord($1).";"/ge' all*your*broken*files.xhtml