[code.view]

[top] / python / PyMOTW / re / re_flags_unicode.py

     #!/usr/bin/env python
     # encoding: utf-8
     #
     # Copyright (c) 2010 Doug Hellmann.  All rights reserved.
     #
     """Unicode character definitions
     """
     #end_pymotw_header
     
     import re
     import codecs
     import sys
     
     # Set standard output encoding to UTF-8.
     sys.stdout = codecs.getwriter('UTF-8')(sys.stdout)
     
     text = u'Français złoty Österreich'
     pattern = ur'\w+'
     ascii_pattern = re.compile(pattern)
     unicode_pattern = re.compile(pattern, re.UNICODE)
     
     print 'Text    :', text
     print 'Pattern :', pattern
     print 'ASCII   :', u', '.join(ascii_pattern.findall(text))
     print 'Unicode :', u', '.join(unicode_pattern.findall(text))
     

[top] / python / PyMOTW / re / re_flags_unicode.py

contact | logmethods.com