# -*- coding: Windows-1251 -*- _goodchars=dict() def console(msg): ''' Author: Denis Barmenkov Date: 02-jul-2007 Write string to stdout. On UnicodeEncodeError exception all the unsafe chars from string replaced by its python representation ''' global _goodchars try: print msg except UnicodeEncodeError: # get error, res='' for i in list(msg): # try to put unknown characters thru print statement: if i not in _goodchars: try: print i # try print character, some extra trash on screen # for each unknown printable character _goodchars[i]=i # safe character, save it as is except UnicodeEncodeError: # format character as python string constant code=ord(i) if code < 256: t='\\x%02x' % code # 8-bit value elif code < 65536: t='\\u%04x' % code # 16-bit value unicode else: t='\\U%08x' % code # other values as 32-bit unicode _goodchars[i]=t # or '.' for readability ;-) res+=_goodchars[i] # append to result print res if __name__=='__main__': import codecs import sys reload(sys) # prepare my encodings sys.setdefaultencoding('cp1251') # set default encoding for source sys.stdout=codecs.getwriter('cp866')(sys.stdout) # set DOS cyrillic codepage test_string='\xab' try: print 'Using print statement:', test_string except UnicodeEncodeError: print 'UnicodeEncodeError exception while using print!' print 'Using console():', console(test_string)