Paste in some Unicode text that appears to be broken, and this tool will use the ftfy Python library to try to fix it.
# Step-by-step reproduction of how ftfy repairs a piece of text that was
# mis-decoded twice (mojibake on top of mojibake).  Each statement must be
# on its own line: the inline comment on the first import would otherwise
# swallow the rest of the script.
import ftfy.bad_codecs  # enables sloppy- codecs
from ftfy.fixes import restore_byte_a0

# The broken sample.  Every character here must be encodable as Latin-1, and
# the resulting bytes must form valid UTF-8, or the first decode below raises
# UnicodeDecodeError.  In particular the pairs 'Ã¢' (bytes C3 A2) and 'Â´'
# (bytes C2 B4) must be kept intact -- dropping the lead character leaves a
# stray byte that is not valid UTF-8.
s = 'It was namedÃ\x82 Ã¢â\x82¬Å¾scarsÃ\x82Â´ stonesÃ¢â\x82¬Å\x9b after the rock-climbers who got hurt while climbing on it.'

# Layer 1: the text was UTF-8 that had been decoded as Latin-1.
s = s.encode('latin-1')
s = s.decode('utf-8')

# Layer 2: the text was UTF-8 that had been decoded as Windows-1250.  The
# "sloppy" variant of the codec (registered by importing ftfy.bad_codecs)
# is used so that bytes the strict codec leaves unassigned still round-trip.
s = s.encode('sloppy-windows-1250')

# Per the ftfy documentation, byte A0 (non-breaking space) is sometimes
# replaced by a plain ASCII space along the way; restore_byte_a0 puts it back
# where doing so lets the surrounding bytes decode as UTF-8.
s = restore_byte_a0(s)
s = s.decode('utf-8')

print(s)
Web app source code on GitHub