BounharAbdelaziz committed on
Commit
548143d
1 Parent(s): bf90461

BounharAbdelaziz/Transliteration-Moroccan-Darija

Browse files
Files changed (5) hide show
  1. README.md +7 -5
  2. config.json +7 -7
  3. model.safetensors +2 -2
  4. tokenizer.json +0 -0
  5. training_args.bin +1 -1
README.md CHANGED
@@ -30,14 +30,16 @@ More information needed
30
  ### Training hyperparameters
31
 
32
  The following hyperparameters were used during training:
33
- - learning_rate: 0.05
34
- - train_batch_size: 512
35
- - eval_batch_size: 512
36
  - seed: 42
 
 
37
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
38
  - lr_scheduler_type: linear
39
- - lr_scheduler_warmup_ratio: 0.01
40
- - num_epochs: 30
41
 
42
  ### Framework versions
43
 
 
30
  ### Training hyperparameters
31
 
32
  The following hyperparameters were used during training:
33
+ - learning_rate: 3e-05
34
+ - train_batch_size: 128
35
+ - eval_batch_size: 128
36
  - seed: 42
37
+ - gradient_accumulation_steps: 2
38
+ - total_train_batch_size: 256
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - lr_scheduler_warmup_ratio: 0.02
42
+ - num_epochs: 120
43
 
44
  ### Framework versions
45
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./checkpoint-1500/",
3
  "architectures": [
4
  "EncoderDecoderModel"
5
  ],
@@ -26,7 +26,7 @@
26
  "forced_eos_token_id": null,
27
  "hidden_act": "gelu",
28
  "hidden_dropout_prob": 0.1,
29
- "hidden_size": 64,
30
  "id2label": {
31
  "0": "LABEL_0",
32
  "1": "LABEL_1"
@@ -46,10 +46,10 @@
46
  "min_length": 0,
47
  "model_type": "bert",
48
  "no_repeat_ngram_size": 0,
49
- "num_attention_heads": 2,
50
  "num_beam_groups": 1,
51
  "num_beams": 1,
52
- "num_hidden_layers": 2,
53
  "num_return_sequences": 1,
54
  "output_attentions": false,
55
  "output_hidden_states": false,
@@ -105,7 +105,7 @@
105
  "forced_eos_token_id": null,
106
  "hidden_act": "gelu",
107
  "hidden_dropout_prob": 0.1,
108
- "hidden_size": 64,
109
  "id2label": {
110
  "0": "LABEL_0",
111
  "1": "LABEL_1"
@@ -125,10 +125,10 @@
125
  "min_length": 0,
126
  "model_type": "bert",
127
  "no_repeat_ngram_size": 0,
128
- "num_attention_heads": 2,
129
  "num_beam_groups": 1,
130
  "num_beams": 1,
131
- "num_hidden_layers": 2,
132
  "num_return_sequences": 1,
133
  "output_attentions": false,
134
  "output_hidden_states": false,
 
1
  {
2
+ "_name_or_path": "./checkpoint-5000/",
3
  "architectures": [
4
  "EncoderDecoderModel"
5
  ],
 
26
  "forced_eos_token_id": null,
27
  "hidden_act": "gelu",
28
  "hidden_dropout_prob": 0.1,
29
+ "hidden_size": 256,
30
  "id2label": {
31
  "0": "LABEL_0",
32
  "1": "LABEL_1"
 
46
  "min_length": 0,
47
  "model_type": "bert",
48
  "no_repeat_ngram_size": 0,
49
+ "num_attention_heads": 8,
50
  "num_beam_groups": 1,
51
  "num_beams": 1,
52
+ "num_hidden_layers": 4,
53
  "num_return_sequences": 1,
54
  "output_attentions": false,
55
  "output_hidden_states": false,
 
105
  "forced_eos_token_id": null,
106
  "hidden_act": "gelu",
107
  "hidden_dropout_prob": 0.1,
108
+ "hidden_size": 256,
109
  "id2label": {
110
  "0": "LABEL_0",
111
  "1": "LABEL_1"
 
125
  "min_length": 0,
126
  "model_type": "bert",
127
  "no_repeat_ngram_size": 0,
128
+ "num_attention_heads": 8,
129
  "num_beam_groups": 1,
130
  "num_beams": 1,
131
+ "num_hidden_layers": 4,
132
  "num_return_sequences": 1,
133
  "output_attentions": false,
134
  "output_hidden_states": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:816a30480e3c6c9dbbbb8beda170def7573bba47ecbd7ea18790f9829eadfcae
3
- size 22805496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06752f7d26b1fd95377b38f6cc6c2be1ca93b2d04222f65053155b794e6ff532
3
+ size 127350216
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:000459e2b1cc8e87d2d315734c195c15b6a59ac770c9921ddf85433e87be1519
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6927d6e7c46d3c0f554f1706565c3cbaedeb09f7598e1c70acfb2f6186fba18
3
  size 5048