zhihan1996 committed
Commit faf3caf
1 Parent(s): 55b04c5

Update bert_layers.py

Files changed (1)
bert_layers.py +3 -8
bert_layers.py CHANGED
@@ -18,7 +18,6 @@ from torch.nn.modules.utils import consume_prefix_in_state_dict_if_present
 from transformers.activations import ACT2FN
 from transformers.modeling_outputs import (MaskedLMOutput,
                                            SequenceClassifierOutput)
-from transformers.models.bert.modeling_bert import BertPreTrainedModel
 from transformers.modeling_utils import PreTrainedModel
 
 from .bert_padding import (index_first_axis,
@@ -522,7 +521,7 @@ class BertPredictionHeadTransform(nn.Module):
         return hidden_states
 
 
-class BertModel(BertPreTrainedModel):
+class BertModel(PreTrainedModel):
     """Overall BERT model.
 
     Args:
@@ -682,7 +681,7 @@ class BertOnlyNSPHead(nn.Module):
 
 
 
-class BertForMaskedLM(BertPreTrainedModel):
+class BertForMaskedLM(PreTrainedModel):
 
     def __init__(self, config):
         super().__init__(config)
@@ -810,12 +809,8 @@ class BertForMaskedLM(BertPreTrainedModel):
         return {'input_ids': input_ids, 'attention_mask': attention_mask}
 
 
-class BertForNextSentencePrediction(BertPreTrainedModel):
-    #TBD: Push in future commit
-    pass
 
-
-class BertForSequenceClassification(BertPreTrainedModel):
+class BertForSequenceClassification(PreTrainedModel):
     """Bert Model transformer with a sequence classification/regression head.
 
     This head is just a linear layer on top of the pooled output. Used for,
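
The substance of the commit: the three model classes now inherit from transformers' generic PreTrainedModel (already imported) instead of the BERT-specific BertPreTrainedModel, whose import is removed along with the BertForNextSentencePrediction stub. Below is a minimal sketch of the resulting pattern; MyBertConfig, the base_model_prefix value, and the single linear "encoder" are illustrative assumptions, not code from bert_layers.py.

```python
# Minimal sketch of the pattern this commit moves to: subclassing the generic
# PreTrainedModel directly instead of the BERT-specific BertPreTrainedModel.
# MyBertConfig and the linear "encoder" are illustrative stand-ins, not code
# from bert_layers.py.
import torch.nn as nn
from transformers import PretrainedConfig
from transformers.modeling_utils import PreTrainedModel


class MyBertConfig(PretrainedConfig):
    model_type = "bert"

    def __init__(self, hidden_size=768, **kwargs):
        super().__init__(**kwargs)
        self.hidden_size = hidden_size


class BertModel(PreTrainedModel):
    # Without BertPreTrainedModel, the subclass must point from_pretrained()
    # at its config class itself.
    config_class = MyBertConfig
    base_model_prefix = "bert"

    def __init__(self, config):
        super().__init__(config)
        self.encoder = nn.Linear(config.hidden_size, config.hidden_size)
        self.post_init()  # runs transformers' weight-init / backward-compat hooks

    def _init_weights(self, module):
        # BertPreTrainedModel previously supplied BERT's
        # normal(0, initializer_range) init; a direct PreTrainedModel
        # subclass defines its own.
        if isinstance(module, nn.Linear):
            module.weight.data.normal_(mean=0.0, std=0.02)
            if module.bias is not None:
                module.bias.data.zero_()

    def forward(self, hidden_states):
        return self.encoder(hidden_states)


model = BertModel(MyBertConfig())  # from_pretrained(...) works the same way
```

The trade-off of the swap is that a direct PreTrainedModel subclass must supply its own config_class and weight initialization, since the BERT-specific base class no longer provides them.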