]>
Commit | Line | Data |
---|---|---|
3257aa99 DM |
1 | """\r |
2 | Python 'utf-32' Codec\r | |
3 | """\r | |
4 | import codecs, sys\r | |
5 | \r | |
6 | ### Codec APIs\r | |
7 | \r | |
8 | encode = codecs.utf_32_encode\r | |
9 | \r | |
10 | def decode(input, errors='strict'):\r | |
11 | return codecs.utf_32_decode(input, errors, True)\r | |
12 | \r | |
13 | class IncrementalEncoder(codecs.IncrementalEncoder):\r | |
14 | def __init__(self, errors='strict'):\r | |
15 | codecs.IncrementalEncoder.__init__(self, errors)\r | |
16 | self.encoder = None\r | |
17 | \r | |
18 | def encode(self, input, final=False):\r | |
19 | if self.encoder is None:\r | |
20 | result = codecs.utf_32_encode(input, self.errors)[0]\r | |
21 | if sys.byteorder == 'little':\r | |
22 | self.encoder = codecs.utf_32_le_encode\r | |
23 | else:\r | |
24 | self.encoder = codecs.utf_32_be_encode\r | |
25 | return result\r | |
26 | return self.encoder(input, self.errors)[0]\r | |
27 | \r | |
28 | def reset(self):\r | |
29 | codecs.IncrementalEncoder.reset(self)\r | |
30 | self.encoder = None\r | |
31 | \r | |
32 | def getstate(self):\r | |
33 | # state info we return to the caller:\r | |
34 | # 0: stream is in natural order for this platform\r | |
35 | # 2: endianness hasn't been determined yet\r | |
36 | # (we're never writing in unnatural order)\r | |
37 | return (2 if self.encoder is None else 0)\r | |
38 | \r | |
39 | def setstate(self, state):\r | |
40 | if state:\r | |
41 | self.encoder = None\r | |
42 | else:\r | |
43 | if sys.byteorder == 'little':\r | |
44 | self.encoder = codecs.utf_32_le_encode\r | |
45 | else:\r | |
46 | self.encoder = codecs.utf_32_be_encode\r | |
47 | \r | |
48 | class IncrementalDecoder(codecs.BufferedIncrementalDecoder):\r | |
49 | def __init__(self, errors='strict'):\r | |
50 | codecs.BufferedIncrementalDecoder.__init__(self, errors)\r | |
51 | self.decoder = None\r | |
52 | \r | |
53 | def _buffer_decode(self, input, errors, final):\r | |
54 | if self.decoder is None:\r | |
55 | (output, consumed, byteorder) = \\r | |
56 | codecs.utf_32_ex_decode(input, errors, 0, final)\r | |
57 | if byteorder == -1:\r | |
58 | self.decoder = codecs.utf_32_le_decode\r | |
59 | elif byteorder == 1:\r | |
60 | self.decoder = codecs.utf_32_be_decode\r | |
61 | elif consumed >= 4:\r | |
62 | raise UnicodeError("UTF-32 stream does not start with BOM")\r | |
63 | return (output, consumed)\r | |
64 | return self.decoder(input, self.errors, final)\r | |
65 | \r | |
66 | def reset(self):\r | |
67 | codecs.BufferedIncrementalDecoder.reset(self)\r | |
68 | self.decoder = None\r | |
69 | \r | |
70 | def getstate(self):\r | |
71 | # additonal state info from the base class must be None here,\r | |
72 | # as it isn't passed along to the caller\r | |
73 | state = codecs.BufferedIncrementalDecoder.getstate(self)[0]\r | |
74 | # additional state info we pass to the caller:\r | |
75 | # 0: stream is in natural order for this platform\r | |
76 | # 1: stream is in unnatural order\r | |
77 | # 2: endianness hasn't been determined yet\r | |
78 | if self.decoder is None:\r | |
79 | return (state, 2)\r | |
80 | addstate = int((sys.byteorder == "big") !=\r | |
81 | (self.decoder is codecs.utf_32_be_decode))\r | |
82 | return (state, addstate)\r | |
83 | \r | |
84 | def setstate(self, state):\r | |
85 | # state[1] will be ignored by BufferedIncrementalDecoder.setstate()\r | |
86 | codecs.BufferedIncrementalDecoder.setstate(self, state)\r | |
87 | state = state[1]\r | |
88 | if state == 0:\r | |
89 | self.decoder = (codecs.utf_32_be_decode\r | |
90 | if sys.byteorder == "big"\r | |
91 | else codecs.utf_32_le_decode)\r | |
92 | elif state == 1:\r | |
93 | self.decoder = (codecs.utf_32_le_decode\r | |
94 | if sys.byteorder == "big"\r | |
95 | else codecs.utf_32_be_decode)\r | |
96 | else:\r | |
97 | self.decoder = None\r | |
98 | \r | |
99 | class StreamWriter(codecs.StreamWriter):\r | |
100 | def __init__(self, stream, errors='strict'):\r | |
101 | self.encoder = None\r | |
102 | codecs.StreamWriter.__init__(self, stream, errors)\r | |
103 | \r | |
104 | def reset(self):\r | |
105 | codecs.StreamWriter.reset(self)\r | |
106 | self.encoder = None\r | |
107 | \r | |
108 | def encode(self, input, errors='strict'):\r | |
109 | if self.encoder is None:\r | |
110 | result = codecs.utf_32_encode(input, errors)\r | |
111 | if sys.byteorder == 'little':\r | |
112 | self.encoder = codecs.utf_32_le_encode\r | |
113 | else:\r | |
114 | self.encoder = codecs.utf_32_be_encode\r | |
115 | return result\r | |
116 | else:\r | |
117 | return self.encoder(input, errors)\r | |
118 | \r | |
119 | class StreamReader(codecs.StreamReader):\r | |
120 | \r | |
121 | def reset(self):\r | |
122 | codecs.StreamReader.reset(self)\r | |
123 | try:\r | |
124 | del self.decode\r | |
125 | except AttributeError:\r | |
126 | pass\r | |
127 | \r | |
128 | def decode(self, input, errors='strict'):\r | |
129 | (object, consumed, byteorder) = \\r | |
130 | codecs.utf_32_ex_decode(input, errors, 0, False)\r | |
131 | if byteorder == -1:\r | |
132 | self.decode = codecs.utf_32_le_decode\r | |
133 | elif byteorder == 1:\r | |
134 | self.decode = codecs.utf_32_be_decode\r | |
135 | elif consumed>=4:\r | |
136 | raise UnicodeError,"UTF-32 stream does not start with BOM"\r | |
137 | return (object, consumed)\r | |
138 | \r | |
139 | ### encodings module API\r | |
140 | \r | |
141 | def getregentry():\r | |
142 | return codecs.CodecInfo(\r | |
143 | name='utf-32',\r | |
144 | encode=encode,\r | |
145 | decode=decode,\r | |
146 | incrementalencoder=IncrementalEncoder,\r | |
147 | incrementaldecoder=IncrementalDecoder,\r | |
148 | streamreader=StreamReader,\r | |
149 | streamwriter=StreamWriter,\r | |
150 | )\r |