utils: Add process_list_in_batches().

2025-11-06 15:03:34 +00:00 · 2018-10-15 12:24:13 +00:00
parent 75ae94e459
commit 2d4b09f59d
2 changed files with 18 additions and 8 deletions
--- a/zerver/lib/import_realm.py
+++ b/zerver/lib/import_realm.py
@@ -23,7 +23,7 @@ from zerver.lib.message import save_message_rendered_content
 from zerver.lib.bugdown import version as bugdown_version
 from zerver.lib.upload import random_name, sanitize_name, \
    S3UploadBackend, LocalUploadBackend, guess_type
-from zerver.lib.utils import generate_api_key
+from zerver.lib.utils import generate_api_key, process_list_in_batches
 from zerver.models import UserProfile, Realm, Client, Huddle, Stream, \
    UserMessage, Subscription, Message, RealmEmoji, \
    RealmDomain, Recipient, get_user_profile_by_id, \
@@ -435,15 +435,13 @@ def bulk_import_user_message_data(data: TableData, dump_file_id: int) -> None:
        ]
        bulk_insert_ums(ums)
    offset = 0
    chunk_size = 10000
-    while True:
+    process_list_in_batches(
-        items = lst[offset:offset+chunk_size]
+        lst=lst,
-        if not items:
+        chunk_size=chunk_size,
-            break
+        process_batch=process_batch,
-        process_batch(items)
+    )
        offset += chunk_size
    logging.info("Successfully imported %s from %s[%s]." % (model, table, dump_file_id))
--- a/zerver/lib/utils.py
+++ b/zerver/lib/utils.py
@@ -177,6 +177,18 @@ def query_chunker(queries: List[Any],
        yield [row for row_id, i, row in tup_chunk]
 def process_list_in_batches(lst: List[Any],
                            chunk_size: int,
                            process_batch: Callable[[List[Any]], None]) -> None:
    offset = 0
    while True:
        items = lst[offset:offset+chunk_size]
        if not items:
            break
        process_batch(items)
        offset += chunk_size
 def split_by(array: List[Any], group_size: int, filler: Any) -> List[List[Any]]:
    """
    Group elements into list of size `group_size` and fill empty cells with