From e8ee957b4d243c356841dad3b476e657006a73c6 Mon Sep 17 00:00:00 2001 From: Adam Belfki Date: Tue, 3 Sep 2024 16:55:49 -0400 Subject: [PATCH] fix: tokenizer padding side is set to left by default --- src/nnsight/models/LanguageModel.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/nnsight/models/LanguageModel.py b/src/nnsight/models/LanguageModel.py index 164630fe..c703a31a 100755 --- a/src/nnsight/models/LanguageModel.py +++ b/src/nnsight/models/LanguageModel.py @@ -175,6 +175,9 @@ def _load( if tokenizer_kwargs is None: tokenizer_kwargs = {} + if "padding_side" not in tokenizer_kwargs: + tokenizer_kwargs["padding_side"] = "left" + self.tokenizer = AutoTokenizer.from_pretrained( repo_id, config=config, **tokenizer_kwargs )