Commit c56898a (parent: 099fc68)

Opt for always correct readall implementation

1 file changed: src/isal/isal_zlibmodule.c (+30 -55)
--- a/src/isal/isal_zlibmodule.c
+++ b/src/isal/isal_zlibmodule.c
@@ -1658,73 +1658,48 @@ GzipReader_seek(GzipReader *self, PyObject *args, PyObject *kwargs)
 }
 
 static PyObject *
-GzipReader_readall(GzipReader *self, PyObject *Py_UNUSED(ignore))
+GzipReader_readall(GzipReader *self, PyObject *Py_UNUSED(ignore))
 {
-    /* Pretty standard pattern: create a lot of bytes objects, stuff them in
-       a list, and join them.
-       Optimizations:
-       - Do not create a list but use static array and keep track of the
-         number of bytes objects.
-       - Start reading DEF_BUF_SIZE (16k) and increase by 2x.
-       - The static array contains 48 slots. The 48th chunk will have size
-         2 ** 47 * 16k. That is 2 million TB. That should be quite future proof.
-       - Since we can keep track of the size while creating the chunks, there
-         is no need to go over all the bytes objects again to calculate the
-         total size. (This is what _PyBytes_Join does internally).
-       - If there is only one item, return that one.
-    */
-    Py_ssize_t chunk_size = DEF_BUF_SIZE;
-    static PyObject *chunk_list[48];
-    size_t number_of_chunks = 0;
-    size_t total_size = 0;
-    PyObject *ret = NULL;
+    /* Try to consume the entire buffer without too much overallocation */
+    Py_ssize_t chunk_size = self->buffer_size * 4;
+    PyObject *chunk_list = PyList_New(0);
+    if (chunk_list == NULL) {
+        return NULL;
+    }
     while (1) {
         PyObject *chunk = PyBytes_FromStringAndSize(NULL, chunk_size);
         if (chunk == NULL) {
-            goto readall_finish;
+            Py_DECREF(chunk_list);
+            return NULL;
         }
         ssize_t written_size = GzipReader_read_into_buffer(
             self, (uint8_t *)PyBytes_AS_STRING(chunk), chunk_size);
         if (written_size < 0) {
             Py_DECREF(chunk);
-            goto readall_finish;
+            Py_DECREF(chunk_list);
+            return NULL;
         }
-        total_size += written_size;
-
-        if (written_size < chunk_size) {
-            // Reached the end, resize the smaller chunk
-            if (_PyBytes_Resize(&chunk, written_size) < 0) {
-                goto readall_finish;
-            }
-            chunk_list[number_of_chunks] = chunk;
-            number_of_chunks += 1;
+        if (written_size == 0) {
             break;
         }
-        chunk_list[number_of_chunks] = chunk;
-        number_of_chunks += 1;
-        chunk_size *= 2;
-    }
-    if (number_of_chunks == 1) {
-        // No need for an intermediate result. Return immediately.
-        return chunk_list[0];
-    }
-    ret = PyBytes_FromStringAndSize(NULL, total_size);
-    if (ret == NULL) {
-        goto readall_finish;
-    }
-    char *ret_ptr = PyBytes_AS_STRING(ret);
-    chunk_size = DEF_BUF_SIZE;
-    for (size_t i=0; i < number_of_chunks; i++) {
-        PyObject *chunk = chunk_list[i];
-        Py_ssize_t chunk_size = PyBytes_GET_SIZE(chunk);
-        memcpy(ret_ptr, PyBytes_AS_STRING(chunk), chunk_size);
-        ret_ptr += chunk_size;
-    }
-readall_finish:
-    for (size_t i=0; i < number_of_chunks; i++) {
-        Py_DECREF(chunk_list[i]);
-    }
-    return ret;
+        if (_PyBytes_Resize(&chunk, written_size) < 0) {
+            Py_DECREF(chunk_list);
+            return NULL;
+        }
+        if (PyList_Append(chunk_list, chunk) < 0) {
+            Py_DECREF(chunk);
+            Py_DECREF(chunk_list);
+            return NULL;
+        }
+    }
+    PyObject *empty_bytes = PyBytes_FromStringAndSize(NULL, 0);
+    if (empty_bytes == NULL) {
+        Py_DECREF(chunk_list);
+        return NULL;
+    }
+    PyObject *ret = _PyBytes_Join(empty_bytes, chunk_list);
+    Py_DECREF(empty_bytes);
+    return ret;
 }
 
 static PyObject *
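
Note: the replacement settles on the stock CPython idiom that the deleted comment alluded to: read fixed-size chunks into uninitialized bytes objects, collect them in a list, and join once at the end, the C equivalent of b"".join(chunks), where _PyBytes_Join sums the sizes in one pass and copies each chunk exactly once. Below is a minimal self-contained sketch of that idiom, not the commit's code: readall_sketch and read_some are hypothetical names, with read_some standing in for GzipReader_read_into_buffer, and the reference counting is spelled out in full since neither PyList_Append nor _PyBytes_Join steals a reference.

#include <Python.h>
#include <stdint.h>
#include <stdio.h>

/* Hypothetical producer standing in for GzipReader_read_into_buffer():
   fills buf with up to size bytes and returns the count, 0 at EOF.
   Reading stdin here just keeps the sketch self-contained. */
static Py_ssize_t
read_some(uint8_t *buf, Py_ssize_t size)
{
    return (Py_ssize_t)fread(buf, 1, (size_t)size, stdin);
}

static PyObject *
readall_sketch(Py_ssize_t chunk_size)
{
    PyObject *chunk_list = PyList_New(0);
    if (chunk_list == NULL) {
        return NULL;
    }
    while (1) {
        /* Allocate an uninitialized bytes object and let the producer
           write directly into it, avoiding an intermediate copy. */
        PyObject *chunk = PyBytes_FromStringAndSize(NULL, chunk_size);
        if (chunk == NULL) {
            goto error;
        }
        Py_ssize_t n = read_some(
            (uint8_t *)PyBytes_AS_STRING(chunk), chunk_size);
        if (n < 0) {
            Py_DECREF(chunk);
            goto error;
        }
        if (n == 0) {
            Py_DECREF(chunk);  /* EOF: drop the unused chunk */
            break;
        }
        /* Shrink a partially filled chunk to the bytes actually read.
           On failure _PyBytes_Resize frees the chunk and sets it NULL. */
        if (_PyBytes_Resize(&chunk, n) < 0) {
            goto error;
        }
        /* PyList_Append adds its own reference, so ours must be dropped
           whether or not the append succeeds. */
        if (PyList_Append(chunk_list, chunk) < 0) {
            Py_DECREF(chunk);
            goto error;
        }
        Py_DECREF(chunk);
    }
    /* Equivalent of b"".join(chunk_list): one pass to total the sizes,
       one memcpy per chunk into the final bytes object. */
    PyObject *empty_bytes = PyBytes_FromStringAndSize(NULL, 0);
    if (empty_bytes == NULL) {
        goto error;
    }
    PyObject *ret = _PyBytes_Join(empty_bytes, chunk_list);
    Py_DECREF(empty_bytes);
    Py_DECREF(chunk_list);
    return ret;
error:
    Py_DECREF(chunk_list);
    return NULL;
}

Compared with the deleted version, the trade is deliberate: the doubling scheme avoided list overhead but capped output at 48 chunks (the 48th being 2^47 * 16 KiB, about 2 million TB) and duplicated the size bookkeeping that _PyBytes_Join already performs, so the list-and-join form has fewer hand-written paths to get wrong, which matches the "always correct" framing of the commit message.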
