|
from transformers import GPT2Config |
|
|
|
|
|
class BackpackGPT2Config(GPT2Config):
    """GPT-2 configuration extended with Backpack sense hyperparameters.

    Two extra fields, ``num_senses`` and ``sense_intermediate_scale``, are
    stored on the instance. All remaining settings are handled by
    ``GPT2Config``; this class only supplies its own default values for
    ``vocab_size``, ``n_positions`` and ``scale_attn_by_inverse_layer_idx``.
    """

    model_type = "backpack-gpt2"

    def __init__(
        self,
        num_senses: int = 16,
        sense_intermediate_scale: int = 4,
        vocab_size: int = 50264,
        n_positions: int = 512,
        scale_attn_by_inverse_layer_idx: bool = True,
        **kwargs,
    ) -> None:
        """Build the configuration.

        Args:
            num_senses: Stored as ``self.num_senses``.
            sense_intermediate_scale: Stored as
                ``self.sense_intermediate_scale``.
            vocab_size: Forwarded to ``GPT2Config``.
            n_positions: Forwarded to ``GPT2Config``.
            scale_attn_by_inverse_layer_idx: Forwarded to ``GPT2Config``.
            **kwargs: Any further keyword arguments, passed through to
                ``GPT2Config`` unchanged.
        """
        # Backpack-specific fields are assigned first, then the parent
        # constructor runs with the GPT-2 level settings.
        self.num_senses = num_senses
        self.sense_intermediate_scale = sense_intermediate_scale

        super().__init__(
            vocab_size=vocab_size,
            n_positions=n_positions,
            scale_attn_by_inverse_layer_idx=scale_attn_by_inverse_layer_idx,
            **kwargs,
        )
|
|