From: Victor Stinner Date: Wed, 28 Jul 2010 01:39:45 +0000 (+0000) Subject: Issue #6213: Implement getstate() and setstate() methods of utf-8-sig and X-Git-Tag: v2.7.1rc1~546 X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=73363e817a45992d4299fe6634de2bee5e4a2768;p=python Issue #6213: Implement getstate() and setstate() methods of utf-8-sig and utf-16 incremental encoders. --- diff --git a/Lib/encodings/utf_16.py b/Lib/encodings/utf_16.py index b145a5d6f0..f3fadff615 100644 --- a/Lib/encodings/utf_16.py +++ b/Lib/encodings/utf_16.py @@ -34,6 +34,22 @@ class IncrementalEncoder(codecs.IncrementalEncoder): codecs.IncrementalEncoder.reset(self) self.encoder = None + def getstate(self): + # state info we return to the caller: + # 0: stream is in natural order for this platform + # 2: endianness hasn't been determined yet + # (we're never writing in unnatural order) + return (2 if self.encoder is None else 0) + + def setstate(self, state): + if state: + self.encoder = None + else: + if sys.byteorder == 'little': + self.encoder = codecs.utf_16_le_encode + else: + self.encoder = codecs.utf_16_be_encode + class IncrementalDecoder(codecs.BufferedIncrementalDecoder): def __init__(self, errors='strict'): codecs.BufferedIncrementalDecoder.__init__(self, errors) diff --git a/Lib/encodings/utf_8_sig.py b/Lib/encodings/utf_8_sig.py index 697ba95b4d..8784694f02 100644 --- a/Lib/encodings/utf_8_sig.py +++ b/Lib/encodings/utf_8_sig.py @@ -25,18 +25,24 @@ def decode(input, errors='strict'): class IncrementalEncoder(codecs.IncrementalEncoder): def __init__(self, errors='strict'): codecs.IncrementalEncoder.__init__(self, errors) - self.first = True + self.first = 1 def encode(self, input, final=False): if self.first: - self.first = False + self.first = 0 return codecs.BOM_UTF8 + codecs.utf_8_encode(input, self.errors)[0] else: return codecs.utf_8_encode(input, self.errors)[0] def reset(self): codecs.IncrementalEncoder.reset(self) - self.first = True + self.first = 1 + + def getstate(self): + return self.first + + def setstate(self, state): + self.first = state class IncrementalDecoder(codecs.BufferedIncrementalDecoder): def __init__(self, errors='strict'): diff --git a/Lib/test/test_io.py b/Lib/test/test_io.py index 2874d79d95..b6bf6863c1 100644 --- a/Lib/test/test_io.py +++ b/Lib/test/test_io.py @@ -2087,7 +2087,6 @@ class TextIOWrapperTest(unittest.TestCase): self.assertEqual(buffer.seekable(), txt.seekable()) - @unittest.skip("Issue #6213 with incremental encoders") def test_append_bom(self): # The BOM is not written again when appending to a non-empty file filename = support.TESTFN @@ -2103,7 +2102,6 @@ class TextIOWrapperTest(unittest.TestCase): with self.open(filename, 'rb') as f: self.assertEquals(f.read(), 'aaaxxx'.encode(charset)) - @unittest.skip("Issue #6213 with incremental encoders") def test_seek_bom(self): # Same test, but when seeking manually filename = support.TESTFN diff --git a/Misc/NEWS b/Misc/NEWS index 58abb15151..02472c8079 100644 --- a/Misc/NEWS +++ b/Misc/NEWS @@ -18,6 +18,9 @@ Core and Builtins Library ------- +- Issue #6213: Implement getstate() and setstate() methods of utf-8-sig and + utf-16 incremental encoders. + - Issue #7113: Speed up loading in ConfigParser. Patch by Łukasz Langa. - Issue #3704: cookielib was not properly handling URLs with a / in the