mirror of
https://github.com/huggingface/transformers.git
synced 2025-08-02 19:21:31 +06:00
parent
91f14f1fc4
commit
87089176d9
@@ -727,7 +727,7 @@ class PhiForCausalLM(PhiPreTrainedModel, GenerationMixin):
|
||||
super().__init__(config)
|
||||
self.model = PhiModel(config)
|
||||
self.vocab_size = config.vocab_size
|
||||
- self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False)
|
||||
+ self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=True)
|
||||
|
||||
# Initialize weights and apply final processing
|
||||
self.post_init()
|
||||
|
@@ -284,7 +284,9 @@ class PhiModel(LlamaModel):
|
||||
|
||||
|
||||
class PhiForCausalLM(LlamaForCausalLM):
|
||||
- pass
|
||||
+ def __init__(self, config):
|
||||
+ super().__init__(config)
|
||||
+ self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=True)
|
||||
|
||||
|
||||
class PhiForSequenceClassification(LlamaForSequenceClassification):
|
||||
|
Loading…
Reference in New Issue
Block a user