mirror of
https://github.com/saymrwulf/transformers.git
synced 2026-05-14 20:58:08 +00:00
parent
91f14f1fc4
commit
87089176d9
2 changed files with 4 additions and 2 deletions
|
|
@@ -727,7 +727,7 @@ class PhiForCausalLM(PhiPreTrainedModel, GenerationMixin):
|
|||
super().__init__(config)
|
||||
self.model = PhiModel(config)
|
||||
self.vocab_size = config.vocab_size
|
||||
self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False)
|
||||
self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=True)
|
||||
|
||||
# Initialize weights and apply final processing
|
||||
self.post_init()
|
||||
|
|
|
|||
|
|
@@ -284,7 +284,9 @@ class PhiModel(LlamaModel):
|
|||
|
||||
|
||||
class PhiForCausalLM(LlamaForCausalLM):
|
||||
pass
|
||||
def __init__(self, config):
|
||||
super().__init__(config)
|
||||
self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=True)
|
||||
|
||||
|
||||
class PhiForSequenceClassification(LlamaForSequenceClassification):
|
||||
|
|
|
|||
Loading…
Reference in a new issue