Blame SOURCES/00236-use-Py_ssize_t-for-file-offset-and-length-computations-in-iteration.patch

ae2451
From 6bebd55022c82829c0b15d24d2ca99edd22562df Mon Sep 17 00:00:00 2001
ae2451
From: Charalampos Stratakis <cstratak@redhat.com>
ae2451
Date: Wed, 4 May 2016 10:39:40 +0200
ae2451
Subject: [PATCH] use Py_ssize_t for file offset and length computations in
ae2451
 iteration
ae2451
ae2451
---
ae2451
 Lib/test/test_file2k.py | 16 +++++++++++++++-
ae2451
 Objects/fileobject.c    | 15 +++++++--------
ae2451
 2 files changed, 22 insertions(+), 9 deletions(-)
ae2451
ae2451
diff --git a/Lib/test/test_file2k.py b/Lib/test/test_file2k.py
ae2451
index 5a3c354..8f94cee 100644
ae2451
--- a/Lib/test/test_file2k.py
ae2451
+++ b/Lib/test/test_file2k.py
ae2451
@@ -14,7 +14,7 @@ except ImportError:
ae2451
     threading = None
ae2451
ae2451
 from test import test_support
ae2451
-from test.test_support import TESTFN, run_unittest
ae2451
+from test.test_support import TESTFN, run_unittest, requires
ae2451
 from UserList import UserList
ae2451
ae2451
 class AutoFileTests(unittest.TestCase):
ae2451
@@ -416,6 +416,20 @@ class OtherFileTests(unittest.TestCase):
ae2451
         finally:
ae2451
             os.unlink(TESTFN)
ae2451
ae2451
+    @test_support.precisionbigmemtest(2**31, 2.5, dry_run=False)
ae2451
+    def test_very_long_line(self, size):
ae2451
+        # Issue #22526: one line of `size` NUL bytes must be iterated back whole.
ae2451
+        requires('largefile')
ae2451
+        with open(TESTFN, "wb") as fp:
ae2451
+            fp.seek(size - 1)
ae2451
+            fp.write("\0")
ae2451
+        with open(TESTFN, "rb") as fp:
ae2451
+            for l in fp:
ae2451
+                pass
ae2451
+        self.assertEqual(len(l), size)
ae2451
+        self.assertEqual(l.count("\0"), size)
ae2451
+        l = None
ae2451
+
ae2451
 class FileSubclassTests(unittest.TestCase):
ae2451
ae2451
     def testExit(self):
ae2451
diff --git a/Objects/fileobject.c b/Objects/fileobject.c
ae2451
index 76cdf74..fabe207 100644
ae2451
--- a/Objects/fileobject.c
ae2451
+++ b/Objects/fileobject.c
ae2451
@@ -2230,7 +2230,7 @@ drop_readahead(PyFileObject *f)
ae2451
    (unless at EOF) and no more than bufsize.  Returns negative value on
ae2451
    error, will set MemoryError if bufsize bytes cannot be allocated. */
ae2451
 static int
ae2451
-readahead(PyFileObject *f, int bufsize)
ae2451
+readahead(PyFileObject *f, Py_ssize_t bufsize)
ae2451
 {
ae2451
     Py_ssize_t chunksize;
ae2451
ae2451
@@ -2268,7 +2268,7 @@ readahead(PyFileObject *f, int bufsize)
ae2451
    logarithmic buffer growth to about 50 even when reading a 1gb line. */
ae2451
ae2451
 static PyStringObject *
ae2451
-readahead_get_line_skip(PyFileObject *f, int skip, int bufsize)
ae2451
+readahead_get_line_skip(PyFileObject *f, Py_ssize_t skip, Py_ssize_t bufsize)
ae2451
 {
ae2451
     PyStringObject* s;
ae2451
     char *bufptr;
ae2451
@@ -2288,10 +2288,10 @@ readahead_get_line_skip(PyFileObject *f, int skip, int bufsize)
ae2451
         bufptr++;                               /* Count the '\n' */
ae2451
         len = bufptr - f->f_bufptr;
ae2451
         s = (PyStringObject *)
ae2451
-            PyString_FromStringAndSize(NULL, skip+len);
ae2451
+            PyString_FromStringAndSize(NULL, skip + len);
ae2451
         if (s == NULL)
ae2451
             return NULL;
ae2451
-        memcpy(PyString_AS_STRING(s)+skip, f->f_bufptr, len);
ae2451
+        memcpy(PyString_AS_STRING(s) + skip, f->f_bufptr, len);
ae2451
         f->f_bufptr = bufptr;
ae2451
         if (bufptr == f->f_bufend)
ae2451
             drop_readahead(f);
ae2451
@@ -2299,14 +2299,13 @@ readahead_get_line_skip(PyFileObject *f, int skip, int bufsize)
ae2451
         bufptr = f->f_bufptr;
ae2451
         buf = f->f_buf;
ae2451
         f->f_buf = NULL;                /* Force new readahead buffer */
ae2451
-        assert(skip+len < INT_MAX);
ae2451
-        s = readahead_get_line_skip(
ae2451
-            f, (int)(skip+len), bufsize + (bufsize>>2) );
ae2451
+        assert(len <= PY_SSIZE_T_MAX - skip);
ae2451
+        s = readahead_get_line_skip(f, skip + len, bufsize + (bufsize>>2));
ae2451
         if (s == NULL) {
ae2451
             PyMem_Free(buf);
ae2451
             return NULL;
ae2451
         }
ae2451
-        memcpy(PyString_AS_STRING(s)+skip, bufptr, len);
ae2451
+        memcpy(PyString_AS_STRING(s) + skip, bufptr, len);
ae2451
         PyMem_Free(buf);
ae2451
     }
ae2451
     return s;
ae2451
--
ae2451
2.5.5
ae2451