]>
Commit | Line | Data |
---|---|---|
3257aa99 DM |
1 | """ Python 'utf-16' Codec\r |
2 | \r | |
3 | \r | |
4 | Written by Marc-Andre Lemburg (mal@lemburg.com).\r | |
5 | \r | |
6 | (c) Copyright CNRI, All Rights Reserved. NO WARRANTY.\r | |
7 | \r | |
8 | """\r | |
9 | import codecs, sys\r | |
10 | \r | |
11 | ### Codec APIs\r | |
12 | \r | |
13 | encode = codecs.utf_16_encode\r | |
14 | \r | |
15 | def decode(input, errors='strict'):\r | |
16 | return codecs.utf_16_decode(input, errors, True)\r | |
17 | \r | |
18 | class IncrementalEncoder(codecs.IncrementalEncoder):\r | |
19 | def __init__(self, errors='strict'):\r | |
20 | codecs.IncrementalEncoder.__init__(self, errors)\r | |
21 | self.encoder = None\r | |
22 | \r | |
23 | def encode(self, input, final=False):\r | |
24 | if self.encoder is None:\r | |
25 | result = codecs.utf_16_encode(input, self.errors)[0]\r | |
26 | if sys.byteorder == 'little':\r | |
27 | self.encoder = codecs.utf_16_le_encode\r | |
28 | else:\r | |
29 | self.encoder = codecs.utf_16_be_encode\r | |
30 | return result\r | |
31 | return self.encoder(input, self.errors)[0]\r | |
32 | \r | |
33 | def reset(self):\r | |
34 | codecs.IncrementalEncoder.reset(self)\r | |
35 | self.encoder = None\r | |
36 | \r | |
37 | def getstate(self):\r | |
38 | # state info we return to the caller:\r | |
39 | # 0: stream is in natural order for this platform\r | |
40 | # 2: endianness hasn't been determined yet\r | |
41 | # (we're never writing in unnatural order)\r | |
42 | return (2 if self.encoder is None else 0)\r | |
43 | \r | |
44 | def setstate(self, state):\r | |
45 | if state:\r | |
46 | self.encoder = None\r | |
47 | else:\r | |
48 | if sys.byteorder == 'little':\r | |
49 | self.encoder = codecs.utf_16_le_encode\r | |
50 | else:\r | |
51 | self.encoder = codecs.utf_16_be_encode\r | |
52 | \r | |
53 | class IncrementalDecoder(codecs.BufferedIncrementalDecoder):\r | |
54 | def __init__(self, errors='strict'):\r | |
55 | codecs.BufferedIncrementalDecoder.__init__(self, errors)\r | |
56 | self.decoder = None\r | |
57 | \r | |
58 | def _buffer_decode(self, input, errors, final):\r | |
59 | if self.decoder is None:\r | |
60 | (output, consumed, byteorder) = \\r | |
61 | codecs.utf_16_ex_decode(input, errors, 0, final)\r | |
62 | if byteorder == -1:\r | |
63 | self.decoder = codecs.utf_16_le_decode\r | |
64 | elif byteorder == 1:\r | |
65 | self.decoder = codecs.utf_16_be_decode\r | |
66 | elif consumed >= 2:\r | |
67 | raise UnicodeError("UTF-16 stream does not start with BOM")\r | |
68 | return (output, consumed)\r | |
69 | return self.decoder(input, self.errors, final)\r | |
70 | \r | |
71 | def reset(self):\r | |
72 | codecs.BufferedIncrementalDecoder.reset(self)\r | |
73 | self.decoder = None\r | |
74 | \r | |
75 | class StreamWriter(codecs.StreamWriter):\r | |
76 | def __init__(self, stream, errors='strict'):\r | |
77 | codecs.StreamWriter.__init__(self, stream, errors)\r | |
78 | self.encoder = None\r | |
79 | \r | |
80 | def reset(self):\r | |
81 | codecs.StreamWriter.reset(self)\r | |
82 | self.encoder = None\r | |
83 | \r | |
84 | def encode(self, input, errors='strict'):\r | |
85 | if self.encoder is None:\r | |
86 | result = codecs.utf_16_encode(input, errors)\r | |
87 | if sys.byteorder == 'little':\r | |
88 | self.encoder = codecs.utf_16_le_encode\r | |
89 | else:\r | |
90 | self.encoder = codecs.utf_16_be_encode\r | |
91 | return result\r | |
92 | else:\r | |
93 | return self.encoder(input, errors)\r | |
94 | \r | |
95 | class StreamReader(codecs.StreamReader):\r | |
96 | \r | |
97 | def reset(self):\r | |
98 | codecs.StreamReader.reset(self)\r | |
99 | try:\r | |
100 | del self.decode\r | |
101 | except AttributeError:\r | |
102 | pass\r | |
103 | \r | |
104 | def decode(self, input, errors='strict'):\r | |
105 | (object, consumed, byteorder) = \\r | |
106 | codecs.utf_16_ex_decode(input, errors, 0, False)\r | |
107 | if byteorder == -1:\r | |
108 | self.decode = codecs.utf_16_le_decode\r | |
109 | elif byteorder == 1:\r | |
110 | self.decode = codecs.utf_16_be_decode\r | |
111 | elif consumed>=2:\r | |
112 | raise UnicodeError,"UTF-16 stream does not start with BOM"\r | |
113 | return (object, consumed)\r | |
114 | \r | |
115 | ### encodings module API\r | |
116 | \r | |
117 | def getregentry():\r | |
118 | return codecs.CodecInfo(\r | |
119 | name='utf-16',\r | |
120 | encode=encode,\r | |
121 | decode=decode,\r | |
122 | incrementalencoder=IncrementalEncoder,\r | |
123 | incrementaldecoder=IncrementalDecoder,\r | |
124 | streamreader=StreamReader,\r | |
125 | streamwriter=StreamWriter,\r | |
126 | )\r |