[code.view]

[top] / python / PyMOTW / codecs / codecs_bom_detection.py

     #!/usr/bin/env python
     # encoding: utf-8
     #
     # Copyright (c) 2010 Doug Hellmann.  All rights reserved.
     #
     """Detecting the BOM.
     """
     #end_pymotw_header
     
     import codecs
     from codecs_to_hex import to_hex
     
     # Look at the raw data
     with open('non-native-encoded.txt', mode='rb') as f:
         raw_bytes = f.read()
     
     print 'Raw    :', to_hex(raw_bytes, 2)
     
     # Re-open the file and let codecs detect the BOM
     with codecs.open('non-native-encoded.txt', mode='rt', encoding='utf-16') as f:
         decoded_text = f.read()
     
     print 'Decoded:', repr(decoded_text)
     

[top] / python / PyMOTW / codecs / codecs_bom_detection.py

contact | logmethods.com