Merge pull request #821 from wiredfool/pypy-performance

PyPy performance improvements
2026-02-04 22:39:33 +03:00 · 2014-07-29 13:12:54 +03:00 · 2014-07-29 13:12:54 +03:00 · 58c56e9aa4
commit 58c56e9aa4
parent bfb482dc66 1a245a577b
6 changed files with 126 additions and 136 deletions
--- a/Tests/helper.py
+++ b/Tests/helper.py
@ -124,7 +124,8 @@ class PillowTestCase(unittest.TestCase):
            self.assertTrue(found)
        return result

-    def skipKnownBadTest(self, msg=None, platform=None, travis=None):
+    def skipKnownBadTest(self, msg=None, platform=None,
+                         travis=None, interpreter=None):
        # Skip if platform/travis matches, and
        # PILLOW_RUN_KNOWN_BAD is not true in the environment.
        if bool(os.environ.get('PILLOW_RUN_KNOWN_BAD', False)):
@ -136,6 +137,8 @@ class PillowTestCase(unittest.TestCase):
            skip = sys.platform.startswith(platform)
        if travis is not None:
            skip = skip and (travis == bool(os.environ.get('TRAVIS', False)))
+        if interpreter is not None:
+            skip = skip and (interpreter == 'pypy' and hasattr(sys, 'pypy_version_info'))
        if skip:
            self.skipTest(msg or "Known Bad Test")

--- a/Tests/test_image_point.py
+++ b/Tests/test_image_point.py
@ -5,12 +5,6 @@ import sys

 class TestImagePoint(PillowTestCase):

-    def setUp(self):
-        if hasattr(sys, 'pypy_version_info'):
-            # This takes _forever_ on PyPy. Open Bug,
-            # see https://github.com/python-pillow/Pillow/issues/484
-            self.skipTest("Too slow on PyPy")
-
    def test_sanity(self):
        im = lena()

@ -29,11 +23,24 @@ class TestImagePoint(PillowTestCase):
    def test_16bit_lut(self):
        """ Tests for 16 bit -> 8 bit lut for converting I->L images
            see https://github.com/python-pillow/Pillow/issues/440
-        """
+            """
+        # This takes _forever_ on PyPy. Open Bug,
+        # see https://github.com/python-pillow/Pillow/issues/484
+        #self.skipKnownBadTest(msg="Too Slow on pypy", interpreter='pypy')

        im = lena("I")
        im.point(list(range(256))*256, 'L')

+    def test_f_lut(self):
+        """ Tests for floating point lut of 8bit gray image """
+        im = lena('L')
+        lut = [0.5 * float(x) for x in range(256)]
+
+        out = im.point(lut, 'F')
+
+        int_lut = [x//2 for x in range(256)]
+        self.assert_image_equal(out.convert('L'), im.point(int_lut, 'L'))
+        

 if __name__ == '__main__':
    unittest.main()
--- a/Tests/test_image_putdata.py
+++ b/Tests/test_image_putdata.py
@ -42,6 +42,30 @@ class TestImagePutData(PillowTestCase):
            self.assertEqual(put(sys.maxsize), (255, 255, 255, 127))


+    def test_pypy_performance(self):
+        im = Image.new('L', (256,256))
+        im.putdata(list(range(256))*256)
+
+    def test_mode_i(self):
+        src = lena('L')
+        data = list(src.getdata())
+        im = Image.new('I', src.size, 0)
+        im.putdata(data, 2, 256)
+
+        target = [2* elt + 256 for elt in data]
+        self.assertEqual(list(im.getdata()), target)
+
+    def test_mode_F(self):
+        src = lena('L')
+        data = list(src.getdata())
+        im = Image.new('F', src.size, 0)
+        im.putdata(data, 2.0, 256.0)
+
+        target = [2.0* float(elt) + 256.0 for elt in data]
+        self.assertEqual(list(im.getdata()), target)
+
+    
+
 if __name__ == '__main__':
    unittest.main()

--- a/Tests/test_mode_i16.py
+++ b/Tests/test_mode_i16.py
@ -5,18 +5,22 @@ from PIL import Image

 class TestModeI16(PillowTestCase):

+    original = lena().resize((32,32)).convert('I')
+
    def verify(self, im1):
-        im2 = lena("I")
+        im2 = self.original.copy()
        self.assertEqual(im1.size, im2.size)
        pix1 = im1.load()
        pix2 = im2.load()
        for y in range(im1.size[1]):
            for x in range(im1.size[0]):
                xy = x, y
+                p1 = pix1[xy]
+                p2 = pix2[xy]
                self.assertEqual(
-                    pix1[xy], pix2[xy],
+                    p1, p2,
                    ("got %r from mode %s at %s, expected %r" %
-                        (pix1[xy], im1.mode, xy, pix2[xy])))
+                        (p1, im1.mode, xy, p2)))

    def test_basic(self):
        # PIL 1.1 has limited support for 16-bit image data.  Check that
@ -24,7 +28,7 @@ class TestModeI16(PillowTestCase):

        def basic(mode):

-            imIn = lena("I").convert(mode)
+            imIn = self.original.convert(mode)
            self.verify(imIn)

            w, h = imIn.size
@ -92,7 +96,7 @@ class TestModeI16(PillowTestCase):

    def test_convert(self):

-        im = lena("I")
+        im = self.original.copy()

        self.verify(im.convert("I;16"))
        self.verify(im.convert("I;16").convert("L"))
--- a/_imaging.c
+++ b/_imaging.c
@ -365,9 +365,12 @@ getbands(const char* mode)
 static void*
 getlist(PyObject* arg, int* length, const char* wrong_length, int type)
 {
-    int i, n;
+    int i, n, itemp;
+    double dtemp;
    void* list;
-
+    PyObject* seq;
+    PyObject* op;
+    
    if (!PySequence_Check(arg)) {
        PyErr_SetString(PyExc_TypeError, must_be_sequence);
        return NULL;
@ -383,71 +386,35 @@ getlist(PyObject* arg, int* length, const char* wrong_length, int type)
    if (!list)
        return PyErr_NoMemory();

-    switch (type) {
-    case TYPE_UINT8:
-        if (PyList_Check(arg)) {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PyList_GET_ITEM(arg, i);
-                int temp = PyInt_AsLong(op);
-                ((UINT8*)list)[i] = CLIP(temp);
-            }
-        } else {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(arg, i);
-                int temp = PyInt_AsLong(op);
-                Py_XDECREF(op);
-                ((UINT8*)list)[i] = CLIP(temp);
-            }
+    seq = PySequence_Fast(arg, must_be_sequence);
+    if (!seq) {
+        free(list);
+        PyErr_SetString(PyExc_TypeError, must_be_sequence);
+        return NULL;
+    }
+    
+    for (i = 0; i < n; i++) {
+        op = PySequence_Fast_GET_ITEM(seq, i);
+        // DRY, branch prediction is going to work _really_ well 
+        // on this switch. And 3 fewer loops to copy/paste. 
+        switch (type) {
+        case TYPE_UINT8:
+            itemp = PyInt_AsLong(op);
+            ((UINT8*)list)[i] = CLIP(itemp);
+            break;
+        case TYPE_INT32:
+            itemp = PyInt_AsLong(op);
+            ((INT32*)list)[i] = itemp;
+            break;
+        case TYPE_FLOAT32:
+            dtemp = PyFloat_AsDouble(op);
+            ((FLOAT32*)list)[i] = (FLOAT32) dtemp;
+            break;
+        case TYPE_DOUBLE:
+            dtemp = PyFloat_AsDouble(op);
+            ((double*)list)[i] = (double) dtemp;
+            break;
        }
-        break;
-    case TYPE_INT32:
-        if (PyList_Check(arg)) {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PyList_GET_ITEM(arg, i);
-                int temp = PyInt_AsLong(op);
-                ((INT32*)list)[i] = temp;
-            }
-        } else {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(arg, i);
-                int temp = PyInt_AsLong(op);
-                Py_XDECREF(op);
-                ((INT32*)list)[i] = temp;
-            }
-        }
-        break;
-    case TYPE_FLOAT32:
-        if (PyList_Check(arg)) {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PyList_GET_ITEM(arg, i);
-                double temp = PyFloat_AsDouble(op);
-                ((FLOAT32*)list)[i] = (FLOAT32) temp;
-            }
-        } else {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(arg, i);
-                double temp = PyFloat_AsDouble(op);
-                Py_XDECREF(op);
-                ((FLOAT32*)list)[i] = (FLOAT32) temp;
-            }
-        }
-        break;
-    case TYPE_DOUBLE:
-        if (PyList_Check(arg)) {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PyList_GET_ITEM(arg, i);
-                double temp = PyFloat_AsDouble(op);
-                ((double*)list)[i] = temp;
-            }
-        } else {
-            for (i = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(arg, i);
-                double temp = PyFloat_AsDouble(op);
-                Py_XDECREF(op);
-                ((double*)list)[i] = temp;
-            }
-        }
-        break;
    }

    if (length)
@ -1253,6 +1220,8 @@ _putdata(ImagingObject* self, PyObject* args)
    Py_ssize_t n, i, x, y;

    PyObject* data;
+    PyObject* seq;
+    PyObject* op;
    double scale = 1.0;
    double offset = 0.0;

@ -1292,69 +1261,61 @@ _putdata(ImagingObject* self, PyObject* args)
                        x = 0, y++;
                }
        } else {
-            if (scale == 1.0 && offset == 0.0) {
-                /* Clipped data */
-                if (PyList_Check(data)) {
-                    for (i = x = y = 0; i < n; i++) {
-                        PyObject *op = PyList_GET_ITEM(data, i);
-                        image->image8[y][x] = (UINT8) CLIP(PyInt_AsLong(op));
-                        if (++x >= (int) image->xsize)
-                            x = 0, y++;
-                    }
-                } else {
-                    for (i = x = y = 0; i < n; i++) {
-                        PyObject *op = PySequence_GetItem(data, i);
-                        image->image8[y][x] = (UINT8) CLIP(PyInt_AsLong(op));
-                        Py_XDECREF(op);
-                        if (++x >= (int) image->xsize)
-                            x = 0, y++;
-                    }
-                }
+           seq = PySequence_Fast(data, must_be_sequence);
+           if (!seq) {
+               PyErr_SetString(PyExc_TypeError, must_be_sequence);
+               return NULL;
+           }
+           if (scale == 1.0 && offset == 0.0) {
+               /* Clipped data */
+               for (i = x = y = 0; i < n; i++) {
+                   op = PySequence_Fast_GET_ITEM(data, i);
+                   image->image8[y][x] = (UINT8) CLIP(PyInt_AsLong(op));
+                   if (++x >= (int) image->xsize){
+                       x = 0, y++;
+                   }
+               }
+
            } else {
-                if (PyList_Check(data)) {
-                    /* Scaled and clipped data */
-                    for (i = x = y = 0; i < n; i++) {
-                        PyObject *op = PyList_GET_ITEM(data, i);
-                        image->image8[y][x] = CLIP(
-                            (int) (PyFloat_AsDouble(op) * scale + offset));
-                        if (++x >= (int) image->xsize)
-                            x = 0, y++;
-                    }
-                } else {
-                    for (i = x = y = 0; i < n; i++) {
-                        PyObject *op = PySequence_GetItem(data, i);
-                        image->image8[y][x] = CLIP(
-                            (int) (PyFloat_AsDouble(op) * scale + offset));
-                        Py_XDECREF(op);
-                        if (++x >= (int) image->xsize)
-                            x = 0, y++;
-                    }
-                }
-            }
-            PyErr_Clear(); /* Avoid weird exceptions */
+               /* Scaled and clipped data */
+               for (i = x = y = 0; i < n; i++) {
+                   PyObject *op = PySequence_Fast_GET_ITEM(data, i);
+                   image->image8[y][x] = CLIP(
+                       (int) (PyFloat_AsDouble(op) * scale + offset));
+                   if (++x >= (int) image->xsize){
+                       x = 0, y++;
+                   }
+               }
+           }
+           PyErr_Clear(); /* Avoid weird exceptions */
        }
    } else {
        /* 32-bit images */
+        seq = PySequence_Fast(data, must_be_sequence);
+        if (!seq) {
+            PyErr_SetString(PyExc_TypeError, must_be_sequence);
+            return NULL;
+        }
        switch (image->type) {
        case IMAGING_TYPE_INT32:
            for (i = x = y = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(data, i);
+                op = PySequence_Fast_GET_ITEM(data, i);
                IMAGING_PIXEL_INT32(image, x, y) =
                    (INT32) (PyFloat_AsDouble(op) * scale + offset);
-                Py_XDECREF(op);
-                if (++x >= (int) image->xsize)
+                if (++x >= (int) image->xsize){
                    x = 0, y++;
+                }
            }
            PyErr_Clear(); /* Avoid weird exceptions */
            break;
        case IMAGING_TYPE_FLOAT32:
            for (i = x = y = 0; i < n; i++) {
-                PyObject *op = PySequence_GetItem(data, i);
+                op = PySequence_Fast_GET_ITEM(data, i);
                IMAGING_PIXEL_FLOAT32(image, x, y) =
                    (FLOAT32) (PyFloat_AsDouble(op) * scale + offset);
-                Py_XDECREF(op);
-                if (++x >= (int) image->xsize)
+                if (++x >= (int) image->xsize){
                    x = 0, y++;
+                }
            }
            PyErr_Clear(); /* Avoid weird exceptions */
            break;
@ -1365,16 +1326,15 @@ _putdata(ImagingObject* self, PyObject* args)
                    INT32 inkint;
                } u;

-                PyObject *op = PySequence_GetItem(data, i);
+                op = PySequence_Fast_GET_ITEM(data, i);
                if (!op || !getink(op, image, u.ink)) {
-                    Py_DECREF(op);
                    return NULL;
                }
                /* FIXME: what about scale and offset? */
                image->image32[y][x] = u.inkint;
-                Py_XDECREF(op);
-                if (++x >= (int) image->xsize)
+                if (++x >= (int) image->xsize){
                    x = 0, y++;
+                }
            }
            PyErr_Clear(); /* Avoid weird exceptions */
            break;
--- a/profile-installed.py
+++ b/profile-installed.py
@ -21,14 +21,6 @@ if len(sys.argv) == 1:
 # Make sure that nose doesn't muck with our paths.
 if ('--no-path-adjustment' not in sys.argv) and ('-P' not in sys.argv):
    sys.argv.insert(1, '--no-path-adjustment')
-
-if 'NOSE_PROCESSES' not in os.environ:
-    for arg in sys.argv:
-        if '--processes' in arg:
-            break
-    else: #  for
-        sys.argv.insert(1, '--processes=-1') # -1 == number of cores
-        sys.argv.insert(1, '--process-timeout=30') 
    
 if __name__ == '__main__':
    profile.run("nose.main()", sort=2)