From 2858d6c634b7ba3348abecdfd2cc403e50991929 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Leon=20Engl=C3=A4nder?=
Date: Fri, 1 Mar 2024 02:58:19 +0100
Subject: [PATCH] Fix Base Model Name of LlamaForQuestionAnswering (#29258)

* LlamaForQuestionAnswering self.transformer->self.model

* fix "Copied from" string

* Llama QA model: set base_model_prefix = "transformer"
---
 src/transformers/models/llama/modeling_llama.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/transformers/models/llama/modeling_llama.py b/src/transformers/models/llama/modeling_llama.py
index 4ea8a208a..43de19d32 100644
--- a/src/transformers/models/llama/modeling_llama.py
+++ b/src/transformers/models/llama/modeling_llama.py
@@ -1454,6 +1454,8 @@ SQuAD (a linear layer on top of the hidden-states output to compute `span start
     LLAMA_START_DOCSTRING,
 )
 class LlamaForQuestionAnswering(LlamaPreTrainedModel):
+    base_model_prefix = "transformer"
+
     # Copied from transformers.models.bloom.modeling_bloom.BloomForQuestionAnswering.__init__ with Bloom->Llama
     def __init__(self, config):
         super().__init__(config)