Merge pull request #271 from s-jse/patch-1

Allocate all the memory at once when coalescing residuals
stanford-futuredata · Oct 30, 2023 · e616cc7 · e616cc7
2 parents cd8582f + 77d62f2
commit e616cc7
Showing 1 changed file with 5 additions and 2 deletions.
diff --git a/colbert/utils/coalesce.py b/colbert/utils/coalesce.py
@@ -57,12 +57,15 @@ def main(args):
     ## Coalesce residuals ##
     print("Coalescing residuals files...")
 
-    temp = torch.empty(0, dtype=torch.uint8)
+    # Allocate all the memory needed in the beginning. Starting from torch.empty() and concatenating repeatedly results in excessive memory use and is much much slower.
+    temp = torch.zeros(((metadata['num_embeddings'], int(metadata['config']['dim'] * metadata['config']['nbits'] // 8))), dtype=torch.uint8)
+    cur_offset = 0
     # read into one large tensor
     for i in tqdm(range(num_chunks)):
         filepath = os.path.join(in_file, f'{i}.residuals.pt')
         chunk = torch.load(filepath)
-        temp = torch.cat((temp, chunk))
+        temp[cur_offset : cur_offset + len(chunk):] = chunk
+        cur_offset += len(chunk)
 
     print("Saving residuals to output directory (this may take a few minutes)...")