from transformers.models.gpt_neox.configuration_gpt_neox import GPTNeoXConfig class ItaliaConfig(GPTNeoXConfig): model_type = "italia" keys_to_ignore_at_inference = ["past_key_values"] def __init__( self, hidden_act="gelu_new", *args, **kwargs, ): super().__init__( hidden_act=hidden_act, *args, **kwargs, )