Torch tensors can't handle uint16, so convert the tokens to int32. This is a bit silly, since we convert to .long right after, but ok.

karpathy · karpathy · commit 587506d09604 · 2024-05-21T19:22:09.000Z
diff --git a/train_gpt2.py b/train_gpt2.py
@@ -514,6 +514,8 @@ def print0(*args, **kwargs):
         ntok = header[2] # number of tokens (claimed)
         # the rest of it are tokens, stored as uint16
         tokens = np.frombuffer(f.read(), dtype=np.uint16)
+        # convert tokens to int32 because torch can't handle uint16 (sadly)
+        tokens = tokens.astype(np.int32)
         assert len(tokens) == ntok, "number of tokens read does not match header?"
 
     # np -> tensor, long, on device