# Hugging Face file-viewer residue: fbaldassarri · "Initial Upload" · commit 718520e (verified) · 410 Bytes
from transformers.models.gpt_neox.configuration_gpt_neox import GPTNeoXConfig
class ItaliaConfig(GPTNeoXConfig):
    """Configuration for the ``"italia"`` model type, built on ``GPTNeoXConfig``.

    The only differences from the parent visible in this class are the
    ``model_type`` identifier, the ``keys_to_ignore_at_inference`` list, and
    the ``hidden_act`` default of ``"gelu_new"``. Every other argument is
    forwarded unchanged to ``GPTNeoXConfig.__init__``.
    """

    # Identifier string for this configuration class.
    model_type = "italia"
    # NOTE(review): presumably the output keys skipped at inference time;
    # confirm against the PretrainedConfig documentation.
    keys_to_ignore_at_inference = ["past_key_values"]

    def __init__(
        self,
        hidden_act="gelu_new",
        *args,
        **kwargs,
    ) -> None:
        """Initialise the config, defaulting ``hidden_act`` to ``"gelu_new"``.

        Args:
            hidden_act: Activation name handed to the parent as a keyword
                argument. Note that it is the first positional parameter
                here.
            *args: Remaining positional arguments, forwarded to the parent
                constructor's leading positional parameters.
            **kwargs: Keyword arguments forwarded unchanged to the parent.
        """
        # Python binds unpacked positionals before any keyword argument,
        # whatever the written order, so ``*args`` goes first to make the
        # call read the way it executes.
        # NOTE(review): if enough positionals are supplied to reach the
        # parent's own ``hidden_act`` slot, the call presumably raises
        # "multiple values for argument" -- verify against the parent
        # signature.
        super().__init__(
            *args,
            hidden_act=hidden_act,
            **kwargs,
        )