fix(server): Removes the parallelism in file conversion (during download) (#275)

2025-09-17 23:34:52 +00:00 · 2023-05-04 15:22:54 +02:00 · 2023-05-04 15:22:54 +02:00 · f08343d44d
commit f08343d44d
parent b4fe248b17
1 changed files with 6 additions and 13 deletions
--- a/server/text_generation_server/utils/convert.py
+++ b/server/text_generation_server/utils/convert.py
@ -1,5 +1,6 @@
 import concurrent
 import time
 import datetime
 import torch
 from concurrent.futures import ThreadPoolExecutor
@ -78,17 +79,9 @@ def convert_file(pt_file: Path, st_file: Path):
 def convert_files(pt_files: List[Path], st_files: List[Path]):
    assert len(pt_files) == len(st_files)
-    executor = ThreadPoolExecutor(max_workers=5)
+    N = len(pt_files)
    futures = [
        executor.submit(convert_file, pt_file=pt_file, st_file=st_file)
        for pt_file, st_file in zip(pt_files, st_files)
    ]
    # We do this instead of using tqdm because we want to parse the logs with the launcher
-    start_time = time.time()
+    start = datetime.datetime.now()
-    for i, future in enumerate(concurrent.futures.as_completed(futures)):
+    for i, (pt_file, sf_file) in enumerate(zip(pt_files, st_files)):
-        elapsed = timedelta(seconds=int(time.time() - start_time))
+        elapsed = datetime.datetime.now() - start
-        remaining = len(futures) - (i + 1)
+        logger.info(f"Convert: [{i + 1}/{N}] -- Took: {elapsed}")
        eta = (elapsed / (i + 1)) * remaining if remaining > 0 else 0
        logger.info(f"Convert: [{i + 1}/{len(futures)}] -- ETA: {eta}")