ThirdParty/CharDet/chardet/universaldetector.py

changeset 5310
f2b774d78b4a
parent 3537
7662053c3906
child 5714
90c57b50600f
diff -r 79b6a38edfc7 -r f2b774d78b4a ThirdParty/CharDet/chardet/universaldetector.py
--- a/ThirdParty/CharDet/chardet/universaldetector.py	Thu Nov 10 18:54:02 2016 +0100
+++ b/ThirdParty/CharDet/chardet/universaldetector.py	Thu Nov 10 18:57:50 2016 +0100
@@ -71,9 +71,9 @@
 
         if not self._mGotData:
             # If the data starts with BOM, we know it is UTF
-            if aBuf[:3] == codecs.BOM:
+            if aBuf[:3] == codecs.BOM_UTF8:
                 # EF BB BF  UTF-8 with BOM
-                self.result = {'encoding': "UTF-8", 'confidence': 1.0}
+                self.result = {'encoding': "UTF-8-SIG", 'confidence': 1.0}
             elif aBuf[:4] == codecs.BOM_UTF32_LE:
                 # FF FE 00 00  UTF-32, little-endian BOM
                 self.result = {'encoding': "UTF-32LE", 'confidence': 1.0}

eric ide

mercurial