[Feature] Add support for optional BOS token handling in input preprocessing

0xrushi · 0xrushi · commit a47979b7f729 · 2025-10-25T21:15:38.000-04:00
Signed-off-by: 0xrushi <6279035+0xrushi@users.noreply.github.com>
diff --git a/vllm/inputs/preprocess.py b/vllm/inputs/preprocess.py
@@ -221,6 +221,14 @@ def _tokenize_prompt(
         tokenizer = self.get_tokenizer()
         tokenization_kwargs = self._get_tokenization_kw(tokenization_kwargs)
 
+
+        bos_token_text = getattr(tokenizer, "bos_token", None)
+        if bos_token_text and isinstance(bos_token_text, str):
+            if prompt.lstrip().startswith(bos_token_text):
+                # override if not explicitly set by caller.
+                if "add_special_tokens" not in tokenization_kwargs:
+                    tokenization_kwargs["add_special_tokens"] = False
+
         encoder_config = self.model_config.encoder_config
 
         if encoder_config and encoder_config.get("do_lower_case", False):