#!/usr/bin/env python # encoding: utf-8 # # Copyright (c) 2010 Doug Hellmann. All rights reserved. # """Unicode character definitions """ #end_pymotw_header import re import codecs import sys # Set standard output encoding to UTF-8. sys.stdout = codecs.getwriter('UTF-8')(sys.stdout) text = u'Français złoty Österreich' pattern = ur'\w+' ascii_pattern = re.compile(pattern) unicode_pattern = re.compile(pattern, re.UNICODE) print 'Text :', text print 'Pattern :', pattern print 'ASCII :', u', '.join(ascii_pattern.findall(text)) print 'Unicode :', u', '.join(unicode_pattern.findall(text))