Fixed: Cannot handle batch sizes > 1 if no padding token is defined

Fixes the "Cannot handle batch sizes > 1 if no padding token is defined" error for reranker models that do not define a pad_token_id in their config, by falling back to the eos_token_id as the pad_token_id when it is present.
YetheSamartaka 2025-10-07 14:47:35 +02:00
parent 4d7fddaf7e
commit f69426fd77
1 changed file with 16 additions and 0 deletions


@@ -189,6 +189,22 @@ def get_rf(
log.error(f"CrossEncoder: {e}") log.error(f"CrossEncoder: {e}")
raise Exception(ERROR_MESSAGES.DEFAULT("CrossEncoder error")) raise Exception(ERROR_MESSAGES.DEFAULT("CrossEncoder error"))
# Safely adjust pad_token_id if missing as some models do not have this in config
try:
model_cfg = getattr(rf, "model", None)
if model_cfg and hasattr(model_cfg, "config"):
cfg = model_cfg.config
if getattr(cfg, "pad_token_id", None) is None:
# Fallback to eos_token_id when available
eos = getattr(cfg, "eos_token_id", None)
if eos is not None:
cfg.pad_token_id = eos
log.debug(f"Missing pad_token_id detected; set to eos_token_id={eos}")
else:
log.warning("Neither pad_token_id nor eos_token_id present in model config")
except Exception as e2:
log.warning(f"Failed to adjust pad_token_id on CrossEncoder: {e2}")
return rf
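
For illustration, a minimal standalone sketch of the same fallback logic, assuming a Hugging Face transformers-style config object; the helper name and the toy config below are hypothetical, not part of the repository:

from transformers import PretrainedConfig

def ensure_pad_token_id(cfg):
    # Mirror the diff above: fall back to eos_token_id when no pad_token_id is defined
    if getattr(cfg, "pad_token_id", None) is None:
        eos = getattr(cfg, "eos_token_id", None)
        if eos is not None:
            cfg.pad_token_id = eos
    return cfg

cfg = PretrainedConfig(eos_token_id=2)  # toy config with no pad_token_id set
ensure_pad_token_id(cfg)
print(cfg.pad_token_id)  # -> 2

With a pad_token_id in place, the underlying tokenizer/model can pad inputs, which is what allows the CrossEncoder to score batches larger than 1.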