| 1 | """ Python 'utf-16' Codec
|
|---|
| 2 |
|
|---|
| 3 |
|
|---|
| 4 | Written by Marc-Andre Lemburg ([email protected]).
|
|---|
| 5 |
|
|---|
| 6 | (c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
|
|---|
| 7 |
|
|---|
| 8 | """
|
|---|
| 9 | import codecs, sys
|
|---|
| 10 |
|
|---|
| 11 | ### Codec APIs
|
|---|
| 12 |
|
|---|
| 13 | encode = codecs.utf_16_encode
|
|---|
| 14 |
|
|---|
| 15 | def decode(input, errors='strict'):
|
|---|
| 16 | return codecs.utf_16_decode(input, errors, True)
|
|---|
| 17 |
|
|---|
| 18 | class IncrementalEncoder(codecs.IncrementalEncoder):
|
|---|
| 19 | def __init__(self, errors='strict'):
|
|---|
| 20 | codecs.IncrementalEncoder.__init__(self, errors)
|
|---|
| 21 | self.encoder = None
|
|---|
| 22 |
|
|---|
| 23 | def encode(self, input, final=False):
|
|---|
| 24 | if self.encoder is None:
|
|---|
| 25 | result = codecs.utf_16_encode(input, self.errors)[0]
|
|---|
| 26 | if sys.byteorder == 'little':
|
|---|
| 27 | self.encoder = codecs.utf_16_le_encode
|
|---|
| 28 | else:
|
|---|
| 29 | self.encoder = codecs.utf_16_be_encode
|
|---|
| 30 | return result
|
|---|
| 31 | return self.encoder(input, self.errors)[0]
|
|---|
| 32 |
|
|---|
| 33 | def reset(self):
|
|---|
| 34 | codecs.IncrementalEncoder.reset(self)
|
|---|
| 35 | self.encoder = None
|
|---|
| 36 |
|
|---|
| 37 | class IncrementalDecoder(codecs.BufferedIncrementalDecoder):
|
|---|
| 38 | def __init__(self, errors='strict'):
|
|---|
| 39 | codecs.BufferedIncrementalDecoder.__init__(self, errors)
|
|---|
| 40 | self.decoder = None
|
|---|
| 41 |
|
|---|
| 42 | def _buffer_decode(self, input, errors, final):
|
|---|
| 43 | if self.decoder is None:
|
|---|
| 44 | (output, consumed, byteorder) = \
|
|---|
| 45 | codecs.utf_16_ex_decode(input, errors, 0, final)
|
|---|
| 46 | if byteorder == -1:
|
|---|
| 47 | self.decoder = codecs.utf_16_le_decode
|
|---|
| 48 | elif byteorder == 1:
|
|---|
| 49 | self.decoder = codecs.utf_16_be_decode
|
|---|
| 50 | elif consumed >= 2:
|
|---|
| 51 | raise UnicodeError("UTF-16 stream does not start with BOM")
|
|---|
| 52 | return (output, consumed)
|
|---|
| 53 | return self.decoder(input, self.errors, final)
|
|---|
| 54 |
|
|---|
| 55 | def reset(self):
|
|---|
| 56 | codecs.BufferedIncrementalDecoder.reset(self)
|
|---|
| 57 | self.decoder = None
|
|---|
| 58 |
|
|---|
| 59 | class StreamWriter(codecs.StreamWriter):
|
|---|
| 60 | def __init__(self, stream, errors='strict'):
|
|---|
| 61 | self.bom_written = False
|
|---|
| 62 | codecs.StreamWriter.__init__(self, stream, errors)
|
|---|
| 63 |
|
|---|
| 64 | def encode(self, input, errors='strict'):
|
|---|
| 65 | self.bom_written = True
|
|---|
| 66 | result = codecs.utf_16_encode(input, errors)
|
|---|
| 67 | if sys.byteorder == 'little':
|
|---|
| 68 | self.encode = codecs.utf_16_le_encode
|
|---|
| 69 | else:
|
|---|
| 70 | self.encode = codecs.utf_16_be_encode
|
|---|
| 71 | return result
|
|---|
| 72 |
|
|---|
| 73 | class StreamReader(codecs.StreamReader):
|
|---|
| 74 |
|
|---|
| 75 | def reset(self):
|
|---|
| 76 | codecs.StreamReader.reset(self)
|
|---|
| 77 | try:
|
|---|
| 78 | del self.decode
|
|---|
| 79 | except AttributeError:
|
|---|
| 80 | pass
|
|---|
| 81 |
|
|---|
| 82 | def decode(self, input, errors='strict'):
|
|---|
| 83 | (object, consumed, byteorder) = \
|
|---|
| 84 | codecs.utf_16_ex_decode(input, errors, 0, False)
|
|---|
| 85 | if byteorder == -1:
|
|---|
| 86 | self.decode = codecs.utf_16_le_decode
|
|---|
| 87 | elif byteorder == 1:
|
|---|
| 88 | self.decode = codecs.utf_16_be_decode
|
|---|
| 89 | elif consumed>=2:
|
|---|
| 90 | raise UnicodeError,"UTF-16 stream does not start with BOM"
|
|---|
| 91 | return (object, consumed)
|
|---|
| 92 |
|
|---|
| 93 | ### encodings module API
|
|---|
| 94 |
|
|---|
| 95 | def getregentry():
|
|---|
| 96 | return codecs.CodecInfo(
|
|---|
| 97 | name='utf-16',
|
|---|
| 98 | encode=encode,
|
|---|
| 99 | decode=decode,
|
|---|
| 100 | incrementalencoder=IncrementalEncoder,
|
|---|
| 101 | incrementaldecoder=IncrementalDecoder,
|
|---|
| 102 | streamreader=StreamReader,
|
|---|
| 103 | streamwriter=StreamWriter,
|
|---|
| 104 | )
|
|---|