Getting import error

from transformers import BertPreTrainedModel, RobertaModel
import torch


class RobertaForMD(BertPreTrainedModel): # Metaphor Detection, modified from BertForTokenClassification
    def __init__(self, config):
        super().__init__(config)
        self.num_labels = config.num_labels

        self.bert = RobertaModel(config)
        self.dropout = torch.nn.Dropout(config.hidden_dropout_prob)
        self.classifier = torch.nn.Linear(config.hidden_size, self.config.num_labels)
        # self.loss = torch.nn.BCEWithLogitsLoss(pos_weight=torch.tensor([3], dtype=torch.float32))
        self.loss = torch.nn.BCEWithLogitsLoss()

        self.init_weights()

    def forward(
        self,
        input_ids=None,
        attention_mask=None,
        token_type_ids=None,
        position_ids=None,
        head_mask=None,
        inputs_embeds=None,
        labels=None,
        word_posi=None
    ):
        outputs = self.bert(
            input_ids,
            attention_mask=attention_mask,
            token_type_ids=token_type_ids,
            position_ids=position_ids,
            head_mask=head_mask,
            inputs_embeds=inputs_embeds,
        )

        last_hidden_state = outputs[0]
        last_hidden_state = self.dropout(last_hidden_state)
        batch_size = input_ids.shape[0]

        word_state = torch.empty((0, last_hidden_state.shape[2]), dtype=torch.float32).cuda()
        for i in range(batch_size):
            word_state = torch.cat((word_state, last_hidden_state[i][word_posi[i]].unsqueeze(0)))

        logits = self.classifier(word_state)

        outputs = (logits,) + outputs[2:]  # add hidden states and attention if they are here

        if labels is not None:
            loss = self.loss(logits.view(-1), labels.to(torch.float32))
            outputs = (loss,) + outputs

        return outputs  # (loss), logits, (hidden_states), (attentions)

I am calling this using
model = RobertaForMD.from_pretrained(model_name, num_labels=1)

Error

File “main.py”, line 276, in main
model = RobertaForMD.from_pretrained(model_name, num_labels=1)
File “/nas/home/tuhinc/miniconda3/lib/python3.7/site-packages/transformers/modeling_utils.py”, line 438, in from_pretrained
**kwargs,
File “/nas/home/tuhinc/miniconda3/lib/python3.7/site-packages/transformers/configuration_utils.py”, line 199, in from_pretrained
config_dict, kwargs = cls.get_config_dict(pretrained_model_name_or_path, **kwargs)
File “/nas/home/tuhinc/miniconda3/lib/python3.7/site-packages/transformers/configuration_utils.py”, line 269, in get_config_dict
raise EnvironmentError(msg)
OSError: Can’t load ‘roberta-large’. Make sure that:

  • ‘roberta-large’ is a correct model identifier listed on ‘https://huggingface.co/models’

  • or ‘roberta-large’ is the correct path to a directory containing a ‘config.json’ file

Not sure how you mean , any code or link which does that ?

Oh, sorry I mistook for AutoModel. Can you just try doing this instead ?
AutoModel.from_pretrained('roberta-large', config). This should work.

This worked for me

model = RobertaForMD.from_pretrained("roberta-large")