Backport checkin (and the appropriate fix to the test):

author Walter Dörwald <walter@livinglogic.de>

Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)

committer Walter Dörwald <walter@livinglogic.de>

Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)
author Walter Dörwald <walter@livinglogic.de>
Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)
committer Walter Dörwald <walter@livinglogic.de>
Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)
diff --git a/Lib/codecs.py b/Lib/codecs.py

index 3db9248bf40ab8842cbeb0cdc12f67859d2144fa..3b7c8bf419d0e034a3473e6405eef9d29ed62112 100644 (file)
--- a/Lib/codecs.py
+++ b/Lib/codecs.py
@@ -230,7 +230,6 @@ class StreamReader(Codec):
          self.errors = errors
          self.bytebuffer = ""
          self.charbuffer = u""
-        self.atcr = False
  
      def decode(self, input, errors='strict'):
          raise NotImplementedError
@@ -306,18 +305,12 @@ class StreamReader(Codec):
          # If size is given, we call read() only once
          while True:
              data = self.read(readsize)
-            if self.atcr and data.startswith(u"\n"):
-                data = data[1:]
              if data:
-                self.atcr = data.endswith(u"\r")
-                # If we're at a "\r" (and are allowed to read more), read one
-                # extra character (which might be a "\n") to get a proper
-                # line ending. (If the stream is temporarily exhausted we return
-                # the wrong line ending, but at least we won't generate a bogus
-                # second line.)
-                if self.atcr and size is None:
+                # If we're at a "\r" read one extra character (which might
+                # be a "\n") to get a proper line ending. If the stream is
+                # temporarily exhausted we return the wrong line ending.
+                if data.endswith(u"\r"):
                      data += self.read(size=1, chars=1)
-                    self.atcr = data.endswith(u"\r")
  
              line += data
              lines = line.splitlines(True)
@@ -367,7 +360,6 @@ class StreamReader(Codec):
          """
          self.bytebuffer = ""
          self.charbuffer = u""
-        self.atcr = False
  
      def seek(self, offset, whence=0):
          """ Set the input stream's current position.
diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py

index 7a19b323cdcc628bcc056559184e93b97452b352..93c5ff180507abdb9f5acfa83ec75206e718aea8 100644 (file)
--- a/Lib/test/test_codecs.py
+++ b/Lib/test/test_codecs.py
@@ -176,6 +176,7 @@ class ReadTest(unittest.TestCase):
          writer.write(u"foo\r")
          self.assertEqual(reader.readline(keepends=False), u"foo")
          writer.write(u"\nbar\r")
+        self.assertEqual(reader.readline(keepends=False), u"")
          self.assertEqual(reader.readline(keepends=False), u"bar")
          writer.write(u"baz")
          self.assertEqual(reader.readline(keepends=False), u"baz")
@@ -185,6 +186,7 @@ class ReadTest(unittest.TestCase):
          writer.write(u"foo\r")
          self.assertEqual(reader.readline(keepends=True), u"foo\r")
          writer.write(u"\nbar\r")
+        self.assertEqual(reader.readline(keepends=True), u"\n")
          self.assertEqual(reader.readline(keepends=True), u"bar\r")
          writer.write(u"baz")
          self.assertEqual(reader.readline(keepends=True), u"baz")
diff --git a/Misc/NEWS b/Misc/NEWS

index 6e483052c869e71b45db78ba5a9f9ef26be6bef8..af55fb7c95d32836e88e30c2ff675a3e10dbc7b9 100644 (file)
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -32,6 +32,12 @@ Library
  - distutils.commands.register now encodes the data as UTF-8 before posting
    them to PyPI.
  
+- Partial fixes for SF bugs #1163244 and #1175396: If a chunk read by
+  ``codecs.StreamReader.readline()`` has a trailing "\r", read one more
+  character even if the user has passed a size parameter to get a proper
+  line ending. Remove the special handling of a "\r\n" that has been split
+  between two lines.
+
  
  What's New in Python 2.4.1 final?
  =================================
author	Walter Dörwald <walter@livinglogic.de>
	Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)
committer	Walter Dörwald <walter@livinglogic.de>
	Thu, 21 Apr 2005 21:53:43 +0000 (21:53 +0000)
Lib/codecs.py		patch | blob | blame | history
Lib/test/test_codecs.py		patch | blob | blame | history
Misc/NEWS		patch | blob | blame | history