Masioki's picture
End of training
df9391c verified
raw
history blame contribute delete
No virus
604 Bytes
{
"architectures": [
"CrossAttentionSentenceClassifier"
],
"cross_layers": 3,
"dropout": 0.3,
"embedding_strategy": "self-att",
"fp16": false,
"heads": 8,
"hidden_size": 768,
"k_backbone": "transformer-prosody-encoder192",
"k_freezed": false,
"k_kwargs": {
"dropout": 0.3,
"heads": 8,
"input_size": 2,
"num_layers": 2
},
"labels": 18,
"model_type": "cross-attention-sentence-classifier",
"multilabel": true,
"q_backbone": "Phi-3-mini-4k-instruct",
"q_freezed": true,
"q_kwargs": {},
"torch_dtype": "float32",
"transformers_version": "4.41.2"
}