76 (1, re.compile(r'''<\?xml.*\bencoding\s*=\s*['"]([-\w_.]+)['"]\?>''')), |
76 (1, re.compile(r'''<\?xml.*\bencoding\s*=\s*['"]([-\w_.]+)['"]\?>''')), |
77 ] |
77 ] |
78 |
78 |
79 supportedCodecs = [ |
79 supportedCodecs = [ |
80 'utf-8', |
80 'utf-8', |
|
81 |
81 'iso8859-1', 'iso8859-15', 'iso8859-2', 'iso8859-3', |
82 'iso8859-1', 'iso8859-15', 'iso8859-2', 'iso8859-3', |
82 'iso8859-4', 'iso8859-5', 'iso8859-6', 'iso8859-7', |
83 'iso8859-4', 'iso8859-5', 'iso8859-6', 'iso8859-7', |
83 'iso8859-8', 'iso8859-9', 'iso8859-10', 'iso8859-11', |
84 'iso8859-8', 'iso8859-9', 'iso8859-10', 'iso8859-11', |
84 'iso8859-13', 'iso8859-14', 'iso8859-16', 'latin-1', |
85 'iso8859-13', 'iso8859-14', 'iso8859-15', 'iso8859-16', |
85 'koi8-r', 'koi8-u', |
86 'latin-1', |
86 'utf-16', 'utf-32', |
87 |
87 'cp037', 'cp424', 'cp437', 'cp500', 'cp737', 'cp775', |
88 'koi8-r', 'koi8-t', 'koi8-u', |
88 'cp850', 'cp852', 'cp855', 'cp856', 'cp857', 'cp860', |
89 |
89 'cp861', 'cp862', 'cp863', 'cp864', 'cp865', 'cp866', |
90 'utf-7', |
90 'cp869', 'cp874', 'cp875', 'cp932', 'cp949', 'cp950', |
91 'utf-16', 'utf-16-be', 'utf-16-le', |
91 'cp1006', 'cp1026', 'cp1140', 'cp1250', 'cp1251', |
92 'utf-32', 'utf-32-be', 'utf-32-le', |
92 'cp1252', 'cp1253', 'cp1254', 'cp1255', 'cp1256', |
93 |
93 'cp1257', 'cp1258', |
94 'cp037', 'cp273', 'cp424', 'cp437', 'cp500', 'cp720', |
94 'gb2312', 'gb18030', |
95 'cp737', 'cp775', 'cp850', 'cp852', 'cp855', 'cp856', |
95 'ascii' |
96 'cp857', 'cp858', 'cp860', 'cp861', 'cp862', 'cp863', |
|
97 'cp864', 'cp865', 'cp866', 'cp869', 'cp874', 'cp875', |
|
98 'cp932', 'cp949', 'cp950', 'cp1006', 'cp1026', 'cp1125', |
|
99 'cp1140', |
|
100 |
|
101 'windows-1250', 'windows-1251', 'windows-1252', 'windows-1253', |
|
102 'windows-1254', 'windows-1255', 'windows-1256', 'windows-1257', |
|
103 'windows-1258', |
|
104 |
|
105 'gb2312', 'hz', 'gb18030', 'gbk', |
|
106 |
|
107 'iso2022-jp', 'iso2022-jp-1', 'iso2022-jp-2', 'iso2022-jp-2004', |
|
108 'iso2022-jp-3', 'iso2022-jp-ext', 'iso2022-kr', |
|
109 |
|
110 'mac-cyrillic', 'mac-greek', 'mac-iceland', 'mac-latin2', |
|
111 'mac-roman', 'mac-turkish', |
|
112 |
|
113 'ascii', |
|
114 'big5-tw', 'big5-hkscs', |
96 ] |
115 ] |
97 |
116 |
98 |
117 |
99 class CodingError(Exception): |
118 class CodingError(Exception): |
100 """ |
119 """ |