Rodrigo1771 committed on
Commit
e51ed61
1 Parent(s): c5559cc

Training in progress, epoch 1

Browse files
README.md ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: apache-2.0
4
+ base_model: michiyasunaga/BioLinkBERT-base
5
+ tags:
6
+ - token-classification
7
+ - generated_from_trainer
8
+ datasets:
9
+ - Rodrigo1771/drugtemist-en-fasttext-8-ner
10
+ metrics:
11
+ - precision
12
+ - recall
13
+ - f1
14
+ - accuracy
15
+ model-index:
16
+ - name: output
17
+ results:
18
+ - task:
19
+ name: Token Classification
20
+ type: token-classification
21
+ dataset:
22
+ name: Rodrigo1771/drugtemist-en-fasttext-8-ner
23
+ type: Rodrigo1771/drugtemist-en-fasttext-8-ner
24
+ config: DrugTEMIST English NER
25
+ split: validation
26
+ args: DrugTEMIST English NER
27
+ metrics:
28
+ - name: Precision
29
+ type: precision
30
+ value: 0.9271889400921659
31
+ - name: Recall
32
+ type: recall
33
+ value: 0.9375582479030755
34
+ - name: F1
35
+ type: f1
36
+ value: 0.9323447636700648
37
+ - name: Accuracy
38
+ type: accuracy
39
+ value: 0.9987162671280663
40
+ ---
41
+
42
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
43
+ should probably proofread and complete it, then remove this comment. -->
44
+
45
+ # output
46
+
47
+ This model is a fine-tuned version of [michiyasunaga/BioLinkBERT-base](https://huggingface.co/michiyasunaga/BioLinkBERT-base) on the Rodrigo1771/drugtemist-en-fasttext-8-ner dataset.
48
+ It achieves the following results on the evaluation set:
49
+ - Loss: 0.0080
50
+ - Precision: 0.9272
51
+ - Recall: 0.9376
52
+ - F1: 0.9323
53
+ - Accuracy: 0.9987
54
+
55
+ ## Model description
56
+
57
+ More information needed
58
+
59
+ ## Intended uses & limitations
60
+
61
+ More information needed
62
+
63
+ ## Training and evaluation data
64
+
65
+ More information needed
66
+
67
+ ## Training procedure
68
+
69
+ ### Training hyperparameters
70
+
71
+ The following hyperparameters were used during training:
72
+ - learning_rate: 5e-05
73
+ - train_batch_size: 32
74
+ - eval_batch_size: 8
75
+ - seed: 42
76
+ - gradient_accumulation_steps: 2
77
+ - total_train_batch_size: 64
78
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
79
+ - lr_scheduler_type: linear
80
+ - num_epochs: 10.0
81
+
82
+ ### Training results
83
+
84
+ | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
85
+ |:-------------:|:------:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
86
+ | No log | 0.9990 | 481 | 0.0042 | 0.9173 | 0.9413 | 0.9292 | 0.9987 |
87
+ | 0.0156 | 2.0 | 963 | 0.0049 | 0.9134 | 0.9245 | 0.9189 | 0.9986 |
88
+ | 0.0039 | 2.9990 | 1444 | 0.0053 | 0.8914 | 0.9487 | 0.9192 | 0.9986 |
89
+ | 0.0024 | 4.0 | 1926 | 0.0061 | 0.8820 | 0.9543 | 0.9167 | 0.9985 |
90
+ | 0.0017 | 4.9990 | 2407 | 0.0074 | 0.9199 | 0.9310 | 0.9254 | 0.9986 |
91
+ | 0.0011 | 6.0 | 2889 | 0.0079 | 0.9170 | 0.9366 | 0.9267 | 0.9986 |
92
+ | 0.0007 | 6.9990 | 3370 | 0.0067 | 0.9092 | 0.9422 | 0.9254 | 0.9987 |
93
+ | 0.0005 | 8.0 | 3852 | 0.0073 | 0.9249 | 0.9301 | 0.9275 | 0.9987 |
94
+ | 0.0004 | 8.9990 | 4333 | 0.0080 | 0.9272 | 0.9376 | 0.9323 | 0.9987 |
95
+ | 0.0002 | 9.9896 | 4810 | 0.0079 | 0.9247 | 0.9385 | 0.9315 | 0.9987 |
96
+
97
+
98
+ ### Framework versions
99
+
100
+ - Transformers 4.44.2
101
+ - PyTorch 2.4.0+cu121
102
+ - Datasets 2.21.0
103
+ - Tokenizers 0.19.1
all_results.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.989615784008308,
3
+ "eval_accuracy": 0.9987162671280663,
4
+ "eval_f1": 0.9323447636700648,
5
+ "eval_loss": 0.008018395863473415,
6
+ "eval_precision": 0.9271889400921659,
7
+ "eval_recall": 0.9375582479030755,
8
+ "eval_runtime": 15.1949,
9
+ "eval_samples": 6946,
10
+ "eval_samples_per_second": 457.127,
11
+ "eval_steps_per_second": 57.19,
12
+ "predict_accuracy": 0.9987276251102988,
13
+ "predict_f1": 0.9228159457167091,
14
+ "predict_loss": 0.007742513902485371,
15
+ "predict_precision": 0.8991735537190083,
16
+ "predict_recall": 0.9477351916376306,
17
+ "predict_runtime": 28.7894,
18
+ "predict_samples_per_second": 511.125,
19
+ "predict_steps_per_second": 63.912,
20
+ "total_flos": 1.3132946802550608e+16,
21
+ "train_loss": 0.0027612092573652642,
22
+ "train_runtime": 2084.9871,
23
+ "train_samples": 30812,
24
+ "train_samples_per_second": 147.78,
25
+ "train_steps_per_second": 2.307
26
+ }
config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "michiyasunaga/BioLinkBERT-base",
3
+ "architectures": [
4
+ "BertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "finetuning_task": "ner",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "O",
15
+ "1": "B-FARMACO",
16
+ "2": "I-FARMACO"
17
+ },
18
+ "initializer_range": 0.02,
19
+ "intermediate_size": 3072,
20
+ "label2id": {
21
+ "B-FARMACO": 1,
22
+ "I-FARMACO": 2,
23
+ "O": 0
24
+ },
25
+ "layer_norm_eps": 1e-12,
26
+ "max_position_embeddings": 512,
27
+ "model_type": "bert",
28
+ "num_attention_heads": 12,
29
+ "num_hidden_layers": 12,
30
+ "pad_token_id": 0,
31
+ "position_embedding_type": "absolute",
32
+ "torch_dtype": "float32",
33
+ "transformers_version": "4.44.2",
34
+ "type_vocab_size": 2,
35
+ "use_cache": true,
36
+ "vocab_size": 28895
37
+ }
eval_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.989615784008308,
3
+ "eval_accuracy": 0.9987162671280663,
4
+ "eval_f1": 0.9323447636700648,
5
+ "eval_loss": 0.008018395863473415,
6
+ "eval_precision": 0.9271889400921659,
7
+ "eval_recall": 0.9375582479030755,
8
+ "eval_runtime": 15.1949,
9
+ "eval_samples": 6946,
10
+ "eval_samples_per_second": 457.127,
11
+ "eval_steps_per_second": 57.19
12
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43857b892e7658830c5b99b9e8e7e7b22774f70e3afe6b5e125c652d71a35e18
3
+ size 430601004
predict_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "predict_accuracy": 0.9987276251102988,
3
+ "predict_f1": 0.9228159457167091,
4
+ "predict_loss": 0.007742513902485371,
5
+ "predict_precision": 0.8991735537190083,
6
+ "predict_recall": 0.9477351916376306,
7
+ "predict_runtime": 28.7894,
8
+ "predict_samples_per_second": 511.125,
9
+ "predict_steps_per_second": 63.912
10
+ }
predictions.txt ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tb/events.out.tfevents.1725881335.0a1c9bec2a53.3232.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:593e737686a00ae0f64a94f2ef02389ad7dff30c0ba6a6f2b1c65ac31e873867
3
+ size 11302
tb/events.out.tfevents.1725882696.0a1c9bec2a53.3232.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ecdc6d00855fb66deb25a7b5be160aa0ebb2ebe07a43beb7d88fb0430fb141
3
+ size 560
tb/events.out.tfevents.1725882852.0a1c9bec2a53.9893.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:543df15001da008ba822f9c1ebf4f77259f803cbf1c5758f2da70bdbf003d86f
3
+ size 11091
tb/events.out.tfevents.1725883955.0a1c9bec2a53.9893.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b842d84c89f0d88706e31e98b113fae6b45879220115930147db648f848a8c24
3
+ size 560
tb/events.out.tfevents.1725884095.0a1c9bec2a53.15221.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5eb73def06ef281d6c5abe9cbb6a47c633f2d7191b334dbe5cbead1c284e80
3
+ size 10880
tb/events.out.tfevents.1725885059.0a1c9bec2a53.15221.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c793a2eec8072a81c25e2f78d3ef7bcf74abbe37e32354df7dcda008aa71eda
3
+ size 560
tb/events.out.tfevents.1725885168.0a1c9bec2a53.19825.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0f9a2adaf22b0a47090405af62255c59f8c395faf6fe62ec62fa970d9063713
3
+ size 10880
tb/events.out.tfevents.1725886061.0a1c9bec2a53.19825.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa09451db71ecc3a737f5726105cdc310a150c4cd36e427e1f2dad13956046fd
3
+ size 560
tb/events.out.tfevents.1725886210.0a1c9bec2a53.24273.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a173893ab6ea4bae83ba8f7d43d877ca16a06c53d30cb7f414ae20737d881888
3
+ size 12305
tb/events.out.tfevents.1725888457.0a1c9bec2a53.24273.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bb5583c37fdbd9ea659142a09fba0fae95a78d6f0eaac64a0292bc00e64215d
3
+ size 560
tb/events.out.tfevents.1725888716.0a1c9bec2a53.34821.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90e8e7961730149c6c235f6c85cd7c14fbfd2b133f0d765a77e4ff36d922e037
3
+ size 12094
tb/events.out.tfevents.1725890856.0a1c9bec2a53.34821.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48c8b756097d535fb92e12d532058c15666eb7d5fe08ece1421f853f8616afe
3
+ size 560
tb/events.out.tfevents.1725891307.0a1c9bec2a53.45801.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb08a4d1f7207eb6df7a033a5d21f394a4f6b8b609afce2a53edf00aae1336d
3
+ size 5593
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "4": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 1000000000000000019884624838656,
50
+ "never_split": null,
51
+ "pad_token": "[PAD]",
52
+ "sep_token": "[SEP]",
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
+ "unk_token": "[UNK]"
57
+ }
train.log ADDED
@@ -0,0 +1,329 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0
  0%| | 0/4480 [00:00<?, ?it/s]
1
  0%| | 1/4480 [00:01<1:27:13, 1.17s/it]
2
  0%| | 2/4480 [00:01<58:18, 1.28it/s]
3
  0%| | 3/4480 [00:01<42:36, 1.75it/s]
4
  0%| | 4/4480 [00:02<40:37, 1.84it/s]
5
  0%| | 5/4480 [00:02<38:44, 1.93it/s]
6
  0%| | 6/4480 [00:03<38:28, 1.94it/s]
7
  0%| | 7/4480 [00:04<40:28, 1.84it/s]
8
  0%| | 8/4480 [00:04<33:34, 2.22it/s]
9
  0%| | 9/4480 [00:05<43:45, 1.70it/s]
10
  0%| | 10/4480 [00:05<37:41, 1.98it/s]
11
  0%| | 11/4480 [00:05<33:46, 2.21it/s]
12
  0%| | 12/4480 [00:06<29:48, 2.50it/s]
13
  0%| | 13/4480 [00:06<27:25, 2.71it/s]
14
  0%| | 14/4480 [00:06<26:26, 2.81it/s]
15
  0%| | 15/4480 [00:07<27:19, 2.72it/s]
16
  0%| | 16/4480 [00:07<26:01, 2.86it/s]
17
  0%| | 17/4480 [00:07<25:55, 2.87it/s]
18
  0%| | 18/4480 [00:08<25:52, 2.87it/s]
19
  0%| | 19/4480 [00:08<26:25, 2.81it/s]
20
  0%| | 20/4480 [00:09<29:47, 2.50it/s]
21
  0%| | 21/4480 [00:09<27:56, 2.66it/s]
22
  0%| | 22/4480 [00:09<26:06, 2.85it/s]
23
  1%| | 23/4480 [00:10<29:12, 2.54it/s]
24
  1%| | 24/4480 [00:10<29:18, 2.53it/s]
25
  1%| | 25/4480 [00:10<28:01, 2.65it/s]
26
  1%| | 26/4480 [00:11<27:24, 2.71it/s]
27
  1%| | 27/4480 [00:11<26:48, 2.77it/s]
28
  1%| | 28/4480 [00:11<24:44, 3.00it/s]
29
  1%| | 29/4480 [00:12<23:45, 3.12it/s]
30
  1%| | 30/4480 [00:12<24:01, 3.09it/s]
31
  1%| | 31/4480 [00:12<25:11, 2.94it/s]
32
  1%| | 32/4480 [00:13<31:17, 2.37it/s]
33
  1%| | 33/4480 [00:13<29:50, 2.48it/s]
34
  1%| | 34/4480 [00:14<28:19, 2.62it/s]
35
  1%| | 35/4480 [00:14<27:06, 2.73it/s]
36
  1%| | 36/4480 [00:14<25:14, 2.93it/s]
37
  1%| | 37/4480 [00:15<25:46, 2.87it/s]
38
  1%| | 38/4480 [00:15<25:39, 2.89it/s]
39
  1%| | 39/4480 [00:15<25:19, 2.92it/s]
40
  1%| | 40/4480 [00:16<23:37, 3.13it/s]
41
  1%| | 41/4480 [00:16<26:05, 2.84it/s]
42
  1%| | 42/4480 [00:16<27:16, 2.71it/s]
43
  1%| | 43/4480 [00:17<27:36, 2.68it/s]
44
  1%| | 44/4480 [00:17<25:25, 2.91it/s]
45
  1%| | 45/4480 [00:17<26:45, 2.76it/s]
46
  1%| | 46/4480 [00:18<27:15, 2.71it/s]
47
  1%| | 47/4480 [00:18<24:30, 3.01it/s]
48
  1%| | 48/4480 [00:18<23:58, 3.08it/s]
49
  1%| | 49/4480 [00:19<27:39, 2.67it/s]
50
  1%| | 50/4480 [00:19<27:03, 2.73it/s]
51
  1%| | 51/4480 [00:20<26:51, 2.75it/s]
52
  1%| | 52/4480 [00:20<26:28, 2.79it/s]
53
  1%| | 53/4480 [00:20<25:58, 2.84it/s]
54
  1%| | 54/4480 [00:21<25:34, 2.88it/s]
55
  1%| | 55/4480 [00:21<26:41, 2.76it/s]
56
  1%|▏ | 56/4480 [00:21<25:43, 2.87it/s]
57
  1%|▏ | 57/4480 [00:22<25:10, 2.93it/s]
58
  1%|▏ | 58/4480 [00:22<24:48, 2.97it/s]
59
  1%|▏ | 59/4480 [00:22<27:00, 2.73it/s]
60
  1%|▏ | 60/4480 [00:23<25:08, 2.93it/s]
61
  1%|▏ | 61/4480 [00:23<23:47, 3.10it/s]
62
  1%|▏ | 62/4480 [00:23<24:58, 2.95it/s]
63
  1%|▏ | 63/4480 [00:24<25:04, 2.94it/s]
64
  1%|▏ | 64/4480 [00:24<25:28, 2.89it/s]
65
  1%|▏ | 65/4480 [00:24<26:23, 2.79it/s]
66
  1%|▏ | 66/4480 [00:25<27:05, 2.72it/s]
67
  1%|▏ | 67/4480 [00:25<24:30, 3.00it/s]
68
  2%|▏ | 68/4480 [00:26<27:07, 2.71it/s]
69
  2%|▏ | 69/4480 [00:26<24:36, 2.99it/s]
70
  2%|▏ | 70/4480 [00:26<23:24, 3.14it/s]
71
  2%|▏ | 71/4480 [00:26<23:37, 3.11it/s]
72
  2%|▏ | 72/4480 [00:27<25:38, 2.87it/s]
73
  2%|▏ | 73/4480 [00:27<25:22, 2.89it/s]
74
  2%|▏ | 74/4480 [00:28<29:49, 2.46it/s]
75
  2%|▏ | 75/4480 [00:28<27:22, 2.68it/s]
76
  2%|▏ | 76/4480 [00:28<28:53, 2.54it/s]
77
  2%|▏ | 77/4480 [00:29<26:12, 2.80it/s]
78
  2%|▏ | 78/4480 [00:29<25:33, 2.87it/s]
79
  2%|▏ | 79/4480 [00:29<24:38, 2.98it/s]
80
  2%|▏ | 80/4480 [00:30<23:06, 3.17it/s]
81
  2%|▏ | 81/4480 [00:30<21:32, 3.40it/s]
82
  2%|▏ | 82/4480 [00:30<23:59, 3.06it/s]
83
  2%|▏ | 83/4480 [00:31<25:23, 2.89it/s]
84
  2%|▏ | 84/4480 [00:31<23:38, 3.10it/s]
85
  2%|▏ | 85/4480 [00:31<26:33, 2.76it/s]
86
  2%|▏ | 86/4480 [00:32<25:19, 2.89it/s]
87
  2%|▏ | 87/4480 [00:32<26:24, 2.77it/s]
88
  2%|▏ | 88/4480 [00:32<26:14, 2.79it/s]
89
  2%|▏ | 89/4480 [00:33<27:43, 2.64it/s]
90
  2%|▏ | 90/4480 [00:33<27:35, 2.65it/s]
91
  2%|▏ | 91/4480 [00:34<26:44, 2.73it/s]
92
  2%|▏ | 92/4480 [00:34<25:58, 2.82it/s]
93
  2%|▏ | 93/4480 [00:34<29:40, 2.46it/s]
94
  2%|▏ | 94/4480 [00:35<31:01, 2.36it/s]
95
  2%|▏ | 95/4480 [00:35<28:40, 2.55it/s]
96
  2%|▏ | 96/4480 [00:36<29:02, 2.52it/s]
97
  2%|▏ | 97/4480 [00:36<27:33, 2.65it/s]
98
  2%|▏ | 98/4480 [00:36<25:41, 2.84it/s]
99
  2%|▏ | 99/4480 [00:37<25:00, 2.92it/s]
100
  2%|▏ | 100/4480 [00:37<24:27, 2.98it/s]
101
  2%|▏ | 101/4480 [00:37<23:31, 3.10it/s]
102
  2%|▏ | 102/4480 [00:38<25:30, 2.86it/s]
103
  2%|▏ | 103/4480 [00:38<26:52, 2.72it/s]
104
  2%|▏ | 104/4480 [00:38<27:32, 2.65it/s]
105
  2%|▏ | 105/4480 [00:39<27:49, 2.62it/s]
106
  2%|▏ | 106/4480 [00:39<28:57, 2.52it/s]
107
  2%|▏ | 107/4480 [00:40<29:45, 2.45it/s]
108
  2%|▏ | 108/4480 [00:40<29:21, 2.48it/s]
109
  2%|▏ | 109/4480 [00:41<30:06, 2.42it/s]
110
  2%|▏ | 110/4480 [00:41<28:50, 2.52it/s]
111
  2%|▏ | 111/4480 [00:41<26:51, 2.71it/s]
112
  2%|▎ | 112/4480 [00:42<26:40, 2.73it/s]
113
  3%|▎ | 113/4480 [00:42<25:18, 2.88it/s]
114
  3%|▎ | 114/4480 [00:42<24:22, 2.98it/s]
115
  3%|▎ | 115/4480 [00:42<24:30, 2.97it/s]
116
  3%|▎ | 116/4480 [00:43<23:50, 3.05it/s]
117
  3%|▎ | 117/4480 [00:43<24:04, 3.02it/s]
118
  3%|▎ | 118/4480 [00:43<25:05, 2.90it/s]
119
  3%|▎ | 119/4480 [00:44<26:54, 2.70it/s]
120
  3%|▎ | 120/4480 [00:44<26:18, 2.76it/s]
121
  3%|▎ | 121/4480 [00:45<25:48, 2.81it/s]
122
  3%|▎ | 122/4480 [00:45<24:31, 2.96it/s]
123
  3%|▎ | 123/4480 [00:45<24:25, 2.97it/s]
124
  3%|▎ | 124/4480 [00:46<26:24, 2.75it/s]
125
  3%|▎ | 125/4480 [00:46<24:42, 2.94it/s]
126
  3%|▎ | 126/4480 [00:46<24:37, 2.95it/s]
127
  3%|▎ | 127/4480 [00:47<23:19, 3.11it/s]
128
  3%|▎ | 128/4480 [00:47<24:13, 2.99it/s]
129
  3%|▎ | 129/4480 [00:47<25:24, 2.85it/s]
130
  3%|▎ | 130/4480 [00:48<26:42, 2.71it/s]
131
  3%|▎ | 131/4480 [00:48<25:07, 2.88it/s]
132
  3%|▎ | 132/4480 [00:48<22:49, 3.18it/s]
133
  3%|▎ | 133/4480 [00:49<23:09, 3.13it/s]
134
  3%|▎ | 134/4480 [00:49<22:16, 3.25it/s]
135
  3%|▎ | 135/4480 [00:49<24:13, 2.99it/s]
136
  3%|▎ | 136/4480 [00:50<29:11, 2.48it/s]
137
  3%|▎ | 137/4480 [00:50<27:13, 2.66it/s]
138
  3%|▎ | 138/4480 [00:50<25:49, 2.80it/s]
139
  3%|▎ | 139/4480 [00:51<23:35, 3.07it/s]
140
  3%|▎ | 140/4480 [00:51<26:01, 2.78it/s]
141
  3%|▎ | 141/4480 [00:51<24:42, 2.93it/s]
142
  3%|▎ | 142/4480 [00:52<25:08, 2.88it/s]
143
  3%|▎ | 143/4480 [00:52<24:12, 2.99it/s]
144
  3%|▎ | 144/4480 [00:53<25:47, 2.80it/s]
145
  3%|▎ | 145/4480 [00:53<27:19, 2.64it/s]
146
  3%|▎ | 146/4480 [00:53<25:50, 2.80it/s]
147
  3%|▎ | 147/4480 [00:54<26:06, 2.77it/s]
148
  3%|▎ | 148/4480 [00:54<28:09, 2.56it/s]
149
  3%|▎ | 149/4480 [00:54<25:11, 2.87it/s]
150
  3%|▎ | 150/4480 [00:55<24:56, 2.89it/s]
151
  3%|▎ | 151/4480 [00:55<25:44, 2.80it/s]
152
  3%|▎ | 152/4480 [00:55<24:55, 2.89it/s]
153
  3%|▎ | 153/4480 [00:56<24:43, 2.92it/s]
154
  3%|▎ | 154/4480 [00:56<26:18, 2.74it/s]
155
  3%|▎ | 155/4480 [00:57<26:55, 2.68it/s]
156
  3%|▎ | 156/4480 [00:57<24:56, 2.89it/s]
157
  4%|▎ | 157/4480 [00:57<23:56, 3.01it/s]
158
  4%|▎ | 158/4480 [00:57<23:58, 3.00it/s]
159
  4%|▎ | 159/4480 [00:58<25:32, 2.82it/s]
160
  4%|▎ | 160/4480 [00:58<23:23, 3.08it/s]
161
  4%|▎ | 161/4480 [00:59<31:10, 2.31it/s]
162
  4%|▎ | 162/4480 [00:59<28:51, 2.49it/s]
163
  4%|▎ | 163/4480 [01:00<30:49, 2.33it/s]
164
  4%|▎ | 164/4480 [01:00<29:43, 2.42it/s]
165
  4%|▎ | 165/4480 [01:00<29:25, 2.44it/s]
166
  4%|▎ | 166/4480 [01:01<29:31, 2.44it/s]
167
  4%|▎ | 167/4480 [01:01<29:34, 2.43it/s]
168
  4%|▍ | 168/4480 [01:02<28:35, 2.51it/s]
169
  4%|▍ | 169/4480 [01:02<28:08, 2.55it/s]
170
  4%|▍ | 170/4480 [01:02<29:51, 2.41it/s]
171
  4%|▍ | 171/4480 [01:03<28:51, 2.49it/s]
172
  4%|▍ | 172/4480 [01:03<28:14, 2.54it/s]
173
  4%|▍ | 173/4480 [01:04<31:39, 2.27it/s]
174
  4%|▍ | 174/4480 [01:04<29:28, 2.43it/s]
175
  4%|▍ | 175/4480 [01:04<27:20, 2.62it/s]
176
  4%|▍ | 176/4480 [01:05<29:32, 2.43it/s]
177
  4%|▍ | 177/4480 [01:05<27:30, 2.61it/s]
178
  4%|▍ | 178/4480 [01:06<26:36, 2.69it/s]
179
  4%|▍ | 179/4480 [01:06<25:08, 2.85it/s]
180
  4%|▍ | 180/4480 [01:06<25:26, 2.82it/s]
181
  4%|▍ | 181/4480 [01:07<25:06, 2.85it/s]
182
  4%|▍ | 182/4480 [01:07<25:35, 2.80it/s]
183
  4%|▍ | 183/4480 [01:07<25:33, 2.80it/s]
184
  4%|▍ | 184/4480 [01:08<25:09, 2.85it/s]
185
  4%|▍ | 185/4480 [01:08<23:36, 3.03it/s]
186
  4%|▍ | 186/4480 [01:08<23:48, 3.01it/s]
187
  4%|▍ | 187/4480 [01:09<27:59, 2.56it/s]
188
  4%|▍ | 188/4480 [01:09<28:01, 2.55it/s]
189
  4%|▍ | 189/4480 [01:10<31:35, 2.26it/s]
190
  4%|▍ | 190/4480 [01:10<31:02, 2.30it/s]
191
  4%|▍ | 191/4480 [01:11<30:53, 2.31it/s]
192
  4%|▍ | 192/4480 [01:11<30:25, 2.35it/s]
193
  4%|▍ | 193/4480 [01:11<27:03, 2.64it/s]
194
  4%|▍ | 194/4480 [01:12<26:22, 2.71it/s]
195
  4%|▍ | 195/4480 [01:12<28:28, 2.51it/s]
196
  4%|▍ | 196/4480 [01:12<27:15, 2.62it/s]
197
  4%|▍ | 197/4480 [01:13<28:00, 2.55it/s]
198
  4%|▍ | 198/4480 [01:13<26:24, 2.70it/s]
199
  4%|▍ | 199/4480 [01:13<26:10, 2.73it/s]
200
  4%|▍ | 200/4480 [01:14<24:50, 2.87it/s]
201
  4%|▍ | 201/4480 [01:14<26:46, 2.66it/s]
202
  5%|▍ | 202/4480 [01:15<25:58, 2.74it/s]
203
  5%|▍ | 203/4480 [01:15<30:23, 2.35it/s]
204
  5%|▍ | 204/4480 [01:16<29:15, 2.44it/s]
205
  5%|▍ | 205/4480 [01:16<28:43, 2.48it/s]
206
  5%|▍ | 206/4480 [01:16<29:46, 2.39it/s]
207
  5%|▍ | 207/4480 [01:17<28:00, 2.54it/s]
208
  5%|▍ | 208/4480 [01:17<28:39, 2.49it/s]
209
  5%|▍ | 209/4480 [01:18<31:11, 2.28it/s]
210
  5%|▍ | 210/4480 [01:18<28:02, 2.54it/s]
211
  5%|▍ | 211/4480 [01:18<26:41, 2.67it/s]
212
  5%|▍ | 212/4480 [01:19<25:53, 2.75it/s]
213
  5%|▍ | 213/4480 [01:19<27:32, 2.58it/s]
214
  5%|▍ | 214/4480 [01:19<26:51, 2.65it/s]
215
  5%|▍ | 215/4480 [01:20<24:20, 2.92it/s]
216
  5%|▍ | 216/4480 [01:20<28:15, 2.52it/s]
217
  5%|▍ | 217/4480 [01:21<27:36, 2.57it/s]
218
  5%|▍ | 218/4480 [01:21<26:30, 2.68it/s]
219
  5%|▍ | 219/4480 [01:21<25:09, 2.82it/s]
220
  5%|▍ | 220/4480 [01:21<23:34, 3.01it/s]
221
  5%|▍ | 221/4480 [01:22<26:54, 2.64it/s]
222
  5%|▍ | 222/4480 [01:22<26:57, 2.63it/s]
223
  5%|▍ | 223/4480 [01:23<26:57, 2.63it/s]
224
  5%|▌ | 224/4480 [01:23<28:06, 2.52it/s]
225
  5%|▌ | 225/4480 [01:24<28:12, 2.51it/s]
226
  5%|▌ | 226/4480 [01:24<27:19, 2.59it/s]
227
  5%|▌ | 227/4480 [01:24<24:48, 2.86it/s]
228
  5%|▌ | 228/4480 [01:25<24:25, 2.90it/s]
229
  5%|▌ | 229/4480 [01:25<29:38, 2.39it/s]
230
  5%|▌ | 230/4480 [01:26<33:43, 2.10it/s]
231
  5%|▌ | 231/4480 [01:26<31:08, 2.27it/s]
232
  5%|▌ | 232/4480 [01:26<29:50, 2.37it/s]
233
  5%|▌ | 233/4480 [01:27<28:29, 2.48it/s]
234
  5%|▌ | 234/4480 [01:27<26:36, 2.66it/s]
235
  5%|▌ | 235/4480 [01:27<25:50, 2.74it/s]
236
  5%|▌ | 236/4480 [01:28<23:42, 2.98it/s]
237
  5%|▌ | 237/4480 [01:28<25:03, 2.82it/s]
238
  5%|▌ | 238/4480 [01:28<25:28, 2.77it/s]
239
  5%|▌ | 239/4480 [01:29<24:08, 2.93it/s]
240
  5%|▌ | 240/4480 [01:29<26:09, 2.70it/s]
241
  5%|▌ | 241/4480 [01:30<25:28, 2.77it/s]
242
  5%|▌ | 242/4480 [01:30<28:03, 2.52it/s]
243
  5%|▌ | 243/4480 [01:31<31:01, 2.28it/s]
244
  5%|▌ | 244/4480 [01:31<28:50, 2.45it/s]
245
  5%|▌ | 245/4480 [01:31<27:57, 2.53it/s]
246
  5%|▌ | 246/4480 [01:32<27:41, 2.55it/s]
247
  6%|▌ | 247/4480 [01:32<26:01, 2.71it/s]
248
  6%|▌ | 248/4480 [01:32<27:11, 2.59it/s]
249
  6%|▌ | 249/4480 [01:33<29:16, 2.41it/s]
250
  6%|▌ | 250/4480 [01:33<29:34, 2.38it/s]
251
  6%|▌ | 251/4480 [01:34<29:48, 2.36it/s]
252
  6%|▌ | 252/4480 [01:34<27:11, 2.59it/s]
253
  6%|▌ | 253/4480 [01:34<25:23, 2.77it/s]
254
  6%|▌ | 254/4480 [01:35<27:49, 2.53it/s]
255
  6%|▌ | 255/4480 [01:35<27:50, 2.53it/s]
256
  6%|▌ | 256/4480 [01:36<27:55, 2.52it/s]
257
  6%|▌ | 257/4480 [01:36<28:58, 2.43it/s]
258
  6%|▌ | 258/4480 [01:36<26:38, 2.64it/s]
259
  6%|▌ | 259/4480 [01:37<24:14, 2.90it/s]
260
  6%|▌ | 260/4480 [01:37<23:31, 2.99it/s]
261
  6%|▌ | 261/4480 [01:37<23:23, 3.01it/s]
262
  6%|▌ | 262/4480 [01:38<24:08, 2.91it/s]
263
  6%|▌ | 263/4480 [01:38<24:19, 2.89it/s]
264
  6%|▌ | 264/4480 [01:38<23:39, 2.97it/s]
265
  6%|▌ | 265/4480 [01:39<24:04, 2.92it/s]
266
  6%|▌ | 266/4480 [01:39<26:08, 2.69it/s]
267
  6%|▌ | 267/4480 [01:40<26:31, 2.65it/s]
268
  6%|▌ | 268/4480 [01:40<27:01, 2.60it/s]
269
  6%|▌ | 269/4480 [01:40<24:13, 2.90it/s]
270
  6%|▌ | 270/4480 [01:40<23:21, 3.00it/s]
271
  6%|▌ | 271/4480 [01:41<22:32, 3.11it/s]
272
  6%|▌ | 272/4480 [01:41<24:53, 2.82it/s]
273
  6%|▌ | 273/4480 [01:42<25:37, 2.74it/s]
274
  6%|▌ | 274/4480 [01:42<25:24, 2.76it/s]
275
  6%|▌ | 275/4480 [01:42<23:07, 3.03it/s]
276
  6%|▌ | 276/4480 [01:42<22:08, 3.16it/s]
277
  6%|▌ | 277/4480 [01:43<28:01, 2.50it/s]
278
  6%|▌ | 278/4480 [01:43<27:53, 2.51it/s]
279
  6%|▌ | 279/4480 [01:44<26:38, 2.63it/s]
280
  6%|▋ | 280/4480 [01:44<28:34, 2.45it/s]
281
  6%|▋ | 281/4480 [01:45<28:37, 2.45it/s]
282
  6%|▋ | 282/4480 [01:45<26:38, 2.63it/s]
283
  6%|▋ | 283/4480 [01:45<26:15, 2.66it/s]
284
  6%|▋ | 284/4480 [01:46<25:05, 2.79it/s]
285
  6%|▋ | 285/4480 [01:46<24:09, 2.89it/s]
286
  6%|▋ | 286/4480 [01:46<23:48, 2.94it/s]
287
  6%|▋ | 287/4480 [01:47<25:43, 2.72it/s]
288
  6%|▋ | 288/4480 [01:47<24:32, 2.85it/s]
289
  6%|▋ | 289/4480 [01:48<26:44, 2.61it/s]
290
  6%|▋ | 290/4480 [01:48<24:31, 2.85it/s]
291
  6%|▋ | 291/4480 [01:48<24:09, 2.89it/s]
292
  7%|▋ | 292/4480 [01:48<24:16, 2.88it/s]
293
  7%|▋ | 293/4480 [01:49<25:05, 2.78it/s]
294
  7%|▋ | 294/4480 [01:49<23:20, 2.99it/s]
295
  7%|▋ | 295/4480 [01:50<23:57, 2.91it/s]
296
  7%|▋ | 296/4480 [01:50<25:32, 2.73it/s]
297
  7%|▋ | 297/4480 [01:50<26:29, 2.63it/s]
298
  7%|▋ | 298/4480 [01:51<26:56, 2.59it/s]
299
  7%|▋ | 299/4480 [01:51<26:20, 2.65it/s]
300
  7%|▋ | 300/4480 [01:51<26:33, 2.62it/s]
301
  7%|▋ | 301/4480 [01:52<25:37, 2.72it/s]
302
  7%|▋ | 302/4480 [01:52<24:44, 2.81it/s]
303
  7%|▋ | 303/4480 [01:52<24:11, 2.88it/s]
304
  7%|▋ | 304/4480 [01:53<24:15, 2.87it/s]
305
  7%|▋ | 305/4480 [01:53<21:53, 3.18it/s]
306
  7%|▋ | 306/4480 [01:53<20:20, 3.42it/s]
307
  7%|▋ | 307/4480 [01:54<21:38, 3.21it/s]
308
  7%|▋ | 308/4480 [01:54<21:18, 3.26it/s]
309
  7%|▋ | 309/4480 [01:54<21:50, 3.18it/s]
310
  7%|▋ | 310/4480 [01:55<20:48, 3.34it/s]
311
  7%|▋ | 311/4480 [01:55<22:58, 3.02it/s]
312
  7%|▋ | 312/4480 [01:55<23:29, 2.96it/s]
313
  7%|▋ | 313/4480 [01:56<24:55, 2.79it/s]
314
  7%|▋ | 314/4480 [01:56<27:16, 2.55it/s]
315
  7%|▋ | 315/4480 [01:57<26:04, 2.66it/s]
316
  7%|▋ | 316/4480 [01:57<29:39, 2.34it/s]
317
  7%|▋ | 317/4480 [01:57<27:06, 2.56it/s]
318
  7%|▋ | 318/4480 [01:58<26:32, 2.61it/s]
319
  7%|▋ | 319/4480 [01:58<25:06, 2.76it/s]
320
  7%|▋ | 320/4480 [01:58<26:29, 2.62it/s]
321
  7%|▋ | 321/4480 [01:59<27:00, 2.57it/s]
322
  7%|▋ | 322/4480 [01:59<28:27, 2.44it/s]
323
  7%|▋ | 323/4480 [02:00<27:55, 2.48it/s]
324
  7%|▋ | 324/4480 [02:00<27:53, 2.48it/s]
325
  7%|▋ | 325/4480 [02:01<27:34, 2.51it/s]
326
  7%|▋ | 326/4480 [02:01<26:56, 2.57it/s]
327
  7%|▋ | 327/4480 [02:01<26:27, 2.62it/s]
328
  7%|▋ | 328/4480 [02:02<26:38, 2.60it/s]
329
  7%|▋ | 329/4480 [02:02<27:01, 2.56it/s]
330
  7%|▋ | 330/4480 [02:02<26:19, 2.63it/s]
331
  7%|▋ | 331/4480 [02:03<27:25, 2.52it/s]
332
  7%|▋ | 332/4480 [02:03<26:34, 2.60it/s]
333
  7%|▋ | 333/4480 [02:04<25:43, 2.69it/s]
334
  7%|▋ | 334/4480 [02:04<28:22, 2.44it/s]
335
  7%|▋ | 335/4480 [02:04<25:24, 2.72it/s]
336
  8%|▊ | 336/4480 [02:05<23:13, 2.97it/s]
337
  8%|▊ | 337/4480 [02:05<25:39, 2.69it/s]
338
  8%|▊ | 338/4480 [02:05<25:55, 2.66it/s]
339
  8%|▊ | 339/4480 [02:06<25:20, 2.72it/s]
340
  8%|▊ | 340/4480 [02:06<29:12, 2.36it/s]
341
  8%|▊ | 341/4480 [02:07<28:56, 2.38it/s]
342
  8%|▊ | 342/4480 [02:07<27:18, 2.53it/s]
343
  8%|▊ | 343/4480 [02:07<26:17, 2.62it/s]
344
  8%|▊ | 344/4480 [02:08<24:50, 2.77it/s]
345
  8%|▊ | 345/4480 [02:08<23:19, 2.95it/s]
346
  8%|▊ | 346/4480 [02:09<26:18, 2.62it/s]
347
  8%|▊ | 347/4480 [02:09<24:52, 2.77it/s]
348
  8%|▊ | 348/4480 [02:10<32:01, 2.15it/s]
349
  8%|▊ | 349/4480 [02:10<27:47, 2.48it/s]
350
  8%|▊ | 350/4480 [02:10<26:33, 2.59it/s]
351
  8%|▊ | 351/4480 [02:11<26:06, 2.64it/s]
352
  8%|▊ | 352/4480 [02:11<26:13, 2.62it/s]
353
  8%|▊ | 353/4480 [02:11<24:48, 2.77it/s]
354
  8%|▊ | 354/4480 [02:12<26:07, 2.63it/s]
355
  8%|▊ | 355/4480 [02:12<24:18, 2.83it/s]
356
  8%|▊ | 356/4480 [02:12<25:29, 2.70it/s]
357
  8%|▊ | 357/4480 [02:13<25:39, 2.68it/s]
358
  8%|▊ | 358/4480 [02:13<25:49, 2.66it/s]
359
  8%|▊ | 359/4480 [02:14<29:37, 2.32it/s]
360
  8%|▊ | 360/4480 [02:14<27:43, 2.48it/s]
361
  8%|▊ | 361/4480 [02:14<26:43, 2.57it/s]
362
  8%|▊ | 362/4480 [02:15<26:27, 2.59it/s]
363
  8%|▊ | 363/4480 [02:15<25:35, 2.68it/s]
364
  8%|▊ | 364/4480 [02:15<25:29, 2.69it/s]
365
  8%|▊ | 365/4480 [02:16<25:11, 2.72it/s]
366
  8%|▊ | 366/4480 [02:16<23:31, 2.91it/s]
367
  8%|▊ | 367/4480 [02:16<24:39, 2.78it/s]
368
  8%|▊ | 368/4480 [02:17<23:11, 2.95it/s]
369
  8%|▊ | 369/4480 [02:17<23:02, 2.97it/s]
370
  8%|▊ | 370/4480 [02:17<23:08, 2.96it/s]
371
  8%|▊ | 371/4480 [02:18<24:48, 2.76it/s]
372
  8%|▊ | 372/4480 [02:18<23:33, 2.91it/s]
373
  8%|▊ | 373/4480 [02:18<22:58, 2.98it/s]
374
  8%|▊ | 374/4480 [02:19<24:29, 2.79it/s]
375
  8%|▊ | 375/4480 [02:19<23:40, 2.89it/s]
376
  8%|▊ | 376/4480 [02:20<23:28, 2.91it/s]
377
  8%|▊ | 377/4480 [02:20<23:46, 2.88it/s]
378
  8%|▊ | 378/4480 [02:20<24:12, 2.82it/s]
379
  8%|▊ | 379/4480 [02:21<23:02, 2.97it/s]
380
  8%|▊ | 380/4480 [02:21<22:01, 3.10it/s]
381
  9%|▊ | 381/4480 [02:21<21:01, 3.25it/s]
382
  9%|▊ | 382/4480 [02:22<23:03, 2.96it/s]
383
  9%|▊ | 383/4480 [02:22<24:25, 2.80it/s]
384
  9%|▊ | 384/4480 [02:22<24:56, 2.74it/s]
385
  9%|▊ | 385/4480 [02:23<23:12, 2.94it/s]
386
  9%|▊ | 386/4480 [02:23<23:14, 2.94it/s]
387
  9%|▊ | 387/4480 [02:23<22:27, 3.04it/s]
388
  9%|▊ | 388/4480 [02:24<23:38, 2.88it/s]
389
  9%|▊ | 389/4480 [02:24<26:11, 2.60it/s]
390
  9%|▊ | 390/4480 [02:24<23:59, 2.84it/s]
391
  9%|▊ | 391/4480 [02:25<24:31, 2.78it/s]
392
  9%|▉ | 392/4480 [02:25<23:50, 2.86it/s]
393
  9%|▉ | 393/4480 [02:25<24:42, 2.76it/s]
394
  9%|▉ | 394/4480 [02:26<24:43, 2.75it/s]
395
  9%|▉ | 395/4480 [02:26<24:10, 2.82it/s]
396
  9%|▉ | 396/4480 [02:27<27:16, 2.50it/s]
397
  9%|▉ | 397/4480 [02:27<26:52, 2.53it/s]
398
  9%|▉ | 398/4480 [02:27<24:58, 2.72it/s]
399
  9%|▉ | 399/4480 [02:28<25:32, 2.66it/s]
400
  9%|▉ | 400/4480 [02:28<25:13, 2.70it/s]
401
  9%|▉ | 401/4480 [02:28<22:55, 2.96it/s]
402
  9%|▉ | 402/4480 [02:29<25:10, 2.70it/s]
403
  9%|▉ | 403/4480 [02:29<25:13, 2.69it/s]
404
  9%|▉ | 404/4480 [02:30<25:15, 2.69it/s]
405
  9%|▉ | 405/4480 [02:30<28:21, 2.39it/s]
406
  9%|▉ | 406/4480 [02:30<24:35, 2.76it/s]
407
  9%|▉ | 407/4480 [02:31<24:30, 2.77it/s]
408
  9%|▉ | 408/4480 [02:31<25:41, 2.64it/s]
409
  9%|▉ | 409/4480 [02:32<30:03, 2.26it/s]
410
  9%|▉ | 410/4480 [02:32<27:13, 2.49it/s]
411
  9%|▉ | 411/4480 [02:32<26:56, 2.52it/s]
412
  9%|▉ | 412/4480 [02:33<24:51, 2.73it/s]
413
  9%|▉ | 413/4480 [02:33<25:04, 2.70it/s]
414
  9%|▉ | 414/4480 [02:33<25:37, 2.64it/s]
415
  9%|▉ | 415/4480 [02:34<24:49, 2.73it/s]
416
  9%|▉ | 416/4480 [02:34<26:02, 2.60it/s]
417
  9%|▉ | 417/4480 [02:35<29:20, 2.31it/s]
418
  9%|▉ | 418/4480 [02:35<31:13, 2.17it/s]
419
  9%|▉ | 419/4480 [02:36<29:03, 2.33it/s]
420
  9%|▉ | 420/4480 [02:36<28:41, 2.36it/s]
421
  9%|▉ | 421/4480 [02:36<27:51, 2.43it/s]
422
  9%|▉ | 422/4480 [02:37<34:14, 1.98it/s]
423
  9%|▉ | 423/4480 [02:38<32:52, 2.06it/s]
424
  9%|▉ | 424/4480 [02:38<32:04, 2.11it/s]
425
  9%|▉ | 425/4480 [02:38<29:52, 2.26it/s]
426
  10%|▉ | 426/4480 [02:39<28:03, 2.41it/s]
427
  10%|▉ | 427/4480 [02:39<26:39, 2.53it/s]
428
  10%|▉ | 428/4480 [02:39<25:56, 2.60it/s]
429
  10%|▉ | 429/4480 [02:40<25:09, 2.68it/s]
430
  10%|▉ | 430/4480 [02:40<25:42, 2.62it/s]
431
  10%|▉ | 431/4480 [02:41<24:50, 2.72it/s]
432
  10%|▉ | 432/4480 [02:41<23:36, 2.86it/s]
433
  10%|▉ | 433/4480 [02:41<26:43, 2.52it/s]
434
  10%|▉ | 434/4480 [02:42<24:37, 2.74it/s]
435
  10%|▉ | 435/4480 [02:42<24:14, 2.78it/s]
436
  10%|▉ | 436/4480 [02:42<24:10, 2.79it/s]
437
  10%|▉ | 437/4480 [02:43<23:16, 2.89it/s]
438
  10%|▉ | 438/4480 [02:43<22:28, 3.00it/s]
439
  10%|▉ | 439/4480 [02:43<24:31, 2.75it/s]
440
  10%|▉ | 440/4480 [02:44<23:08, 2.91it/s]
441
  10%|▉ | 441/4480 [02:44<22:38, 2.97it/s]
442
  10%|▉ | 442/4480 [02:44<23:36, 2.85it/s]
443
  10%|▉ | 443/4480 [02:45<24:33, 2.74it/s]
444
  10%|▉ | 444/4480 [02:45<24:04, 2.79it/s]
445
  10%|▉ | 445/4480 [02:46<24:30, 2.74it/s]
446
  10%|▉ | 446/4480 [02:46<22:49, 2.95it/s]
447
  10%|▉ | 447/4480 [02:46<22:59, 2.92it/s]
448
  10%|█ | 448/4480 [02:47<22:54, 2.93it/s][INFO|trainer.py:811] 2024-09-09 14:17:54,861 >> The following columns in the evaluation set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: id, tokens, ner_tags. If id, tokens, ner_tags are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
 
 
 
 
 
 
449
  0%| | 0/869 [00:00<?, ?it/s]
 
450
  1%| | 10/869 [00:00<00:09, 92.79it/s]
 
451
  2%|▏ | 20/869 [00:00<00:10, 80.90it/s]
 
452
  3%|▎ | 29/869 [00:00<00:10, 77.67it/s]
 
453
  4%|▍ | 37/869 [00:00<00:11, 75.22it/s]
 
454
  5%|▌ | 46/869 [00:00<00:10, 78.48it/s]
 
455
  6%|▋ | 55/869 [00:00<00:10, 80.85it/s]
 
456
  7%|▋ | 64/869 [00:00<00:10, 76.32it/s]
 
457
  8%|▊ | 72/869 [00:00<00:10, 75.42it/s]
 
458
  9%|▉ | 81/869 [00:01<00:09, 79.55it/s]
 
459
  10%|█ | 90/869 [00:01<00:09, 82.34it/s]
 
460
  12%|█▏ | 100/869 [00:01<00:08, 85.84it/s]
 
461
  13%|█▎ | 109/869 [00:01<00:09, 81.70it/s]
 
462
  14%|█▎ | 118/869 [00:01<00:09, 81.22it/s]
 
463
  15%|█▍ | 127/869 [00:01<00:09, 79.96it/s]
 
464
  16%|█▌ | 136/869 [00:01<00:09, 81.27it/s]
 
465
  17%|█▋ | 145/869 [00:01<00:09, 76.67it/s]
 
466
  18%|█▊ | 154/869 [00:01<00:09, 78.89it/s]
 
467
  19%|█▉ | 163/869 [00:02<00:08, 79.25it/s]
 
468
  20%|█▉ | 171/869 [00:02<00:09, 77.29it/s]
 
469
  21%|██ | 179/869 [00:02<00:09, 76.38it/s]
 
470
  22%|██▏ | 188/869 [00:02<00:08, 77.83it/s]
 
471
  23%|██▎ | 196/869 [00:02<00:08, 75.39it/s]
 
472
  24%|██▎ | 205/869 [00:02<00:08, 77.74it/s]
 
473
  25%|██▍ | 214/869 [00:02<00:08, 79.15it/s]
 
474
  26%|██▌ | 223/869 [00:02<00:08, 80.51it/s]
 
475
  27%|██▋ | 232/869 [00:02<00:08, 77.06it/s]
 
476
  28%|██▊ | 240/869 [00:03<00:08, 76.98it/s]
 
477
  29%|██▊ | 248/869 [00:03<00:08, 72.14it/s]
 
478
  30%|██▉ | 257/869 [00:03<00:08, 75.25it/s]
 
479
  30%|███ | 265/869 [00:03<00:08, 74.46it/s]
 
480
  31%|███▏ | 273/869 [00:03<00:07, 74.61it/s]
 
481
  32%|███▏ | 281/869 [00:03<00:07, 73.92it/s]
 
482
  33%|███▎ | 289/869 [00:03<00:07, 73.26it/s]
 
483
  34%|███▍ | 297/869 [00:03<00:07, 74.39it/s]
 
484
  35%|███▌ | 305/869 [00:03<00:07, 71.09it/s]
 
485
  36%|███▌ | 313/869 [00:04<00:07, 72.71it/s]
 
486
  37%|███▋ | 321/869 [00:04<00:07, 72.16it/s]
 
487
  38%|███▊ | 330/869 [00:04<00:07, 76.38it/s]
 
488
  39%|███▉ | 339/869 [00:04<00:06, 78.09it/s]
 
489
  40%|███▉ | 347/869 [00:04<00:07, 72.56it/s]
 
490
  41%|████ | 355/869 [00:04<00:06, 73.67it/s]
 
491
  42%|████▏ | 364/869 [00:04<00:06, 77.58it/s]
 
492
  43%|████▎ | 373/869 [00:04<00:06, 75.01it/s]
 
493
  44%|████▍ | 381/869 [00:04<00:06, 76.13it/s]
 
494
  45%|████▍ | 389/869 [00:05<00:06, 70.53it/s]
 
495
  46%|████▌ | 398/869 [00:05<00:06, 73.42it/s]
 
496
  47%|████▋ | 407/869 [00:05<00:06, 76.02it/s]
 
497
  48%|████▊ | 416/869 [00:05<00:05, 78.88it/s]
 
498
  49%|████▉ | 425/869 [00:05<00:05, 79.96it/s]
 
499
  50%|████▉ | 434/869 [00:05<00:05, 80.34it/s]
 
500
  51%|█████ | 443/869 [00:05<00:05, 75.42it/s]
 
501
  52%|█████▏ | 452/869 [00:05<00:05, 78.65it/s]
 
502
  53%|█████▎ | 460/869 [00:05<00:05, 77.89it/s]
 
503
  54%|█████▍ | 468/869 [00:06<00:05, 77.51it/s]
 
504
  55%|█████▌ | 478/869 [00:06<00:04, 82.03it/s]
 
505
  56%|█████▌ | 487/869 [00:06<00:04, 82.20it/s]
 
506
  57%|█████▋ | 496/869 [00:06<00:04, 76.78it/s]
 
507
  58%|█████▊ | 504/869 [00:06<00:04, 74.30it/s]
 
508
  59%|█████▉ | 512/869 [00:06<00:04, 75.36it/s]
 
509
  60%|█████▉ | 521/869 [00:06<00:04, 78.56it/s]
 
510
  61%|██████ | 529/869 [00:06<00:04, 72.22it/s]
 
511
  62%|██████▏ | 537/869 [00:06<00:04, 73.11it/s]
 
512
  63%|██████▎ | 545/869 [00:07<00:04, 71.36it/s]
 
513
  64%|██████▍ | 554/869 [00:07<00:04, 74.37it/s]
 
514
  65%|██████▍ | 562/869 [00:07<00:04, 75.80it/s]
 
515
  66%|██████▌ | 570/869 [00:07<00:04, 74.62it/s]
 
516
  67%|██████▋ | 579/869 [00:07<00:03, 77.57it/s]
 
517
  68%|██████▊ | 587/869 [00:07<00:03, 74.27it/s]
 
518
  68%|██████▊ | 595/869 [00:07<00:03, 75.65it/s]
 
519
  70%|██████▉ | 604/869 [00:07<00:03, 78.50it/s]
 
520
  70%|███████ | 612/869 [00:07<00:03, 77.23it/s]
 
521
  71%|███████▏ | 620/869 [00:08<00:03, 77.57it/s]
 
522
  72%|███████▏ | 628/869 [00:08<00:03, 75.04it/s]
 
523
  73%|███████▎ | 636/869 [00:08<00:03, 73.98it/s]
 
524
  74%|███████▍ | 645/869 [00:08<00:02, 77.26it/s]
 
525
  75%|███████▌ | 654/869 [00:08<00:02, 78.96it/s]
 
526
  76%|███████▌ | 662/869 [00:08<00:02, 78.16it/s]
 
527
  77%|███████▋ | 671/869 [00:08<00:02, 81.02it/s]
 
528
  78%|███████▊ | 680/869 [00:08<00:02, 82.95it/s]
 
529
  79%|███████▉ | 689/869 [00:08<00:02, 71.57it/s]
 
530
  80%|████████ | 697/869 [00:09<00:02, 72.76it/s]
 
531
  81%|████████ | 705/869 [00:09<00:02, 73.06it/s]
 
532
  82%|████████▏ | 714/869 [00:09<00:02, 76.13it/s]
 
533
  83%|████████▎ | 722/869 [00:09<00:01, 76.22it/s]
 
534
  84%|████████▍ | 731/869 [00:09<00:01, 77.06it/s]
 
535
  85%|████████▌ | 739/869 [00:09<00:01, 77.04it/s]
 
536
  86%|████████▌ | 747/869 [00:09<00:01, 77.31it/s]
 
537
  87%|████████▋ | 755/869 [00:09<00:01, 75.96it/s]
 
538
  88%|████████▊ | 764/869 [00:09<00:01, 79.21it/s]
 
539
  89%|████████▉ | 772/869 [00:10<00:01, 73.60it/s]
 
540
  90%|████████▉ | 780/869 [00:10<00:01, 64.89it/s]
 
541
  91%|█████████ | 788/869 [00:10<00:01, 68.63it/s]
 
542
  92%|█████████▏| 797/869 [00:10<00:00, 72.49it/s]
 
543
  93%|█████████▎| 805/869 [00:10<00:00, 73.39it/s]
 
544
  94%|█████████▎| 814/869 [00:10<00:00, 75.71it/s]
 
545
  95%|█████████▍| 822/869 [00:10<00:00, 75.42it/s]
 
546
  96%|█████████▌| 831/869 [00:10<00:00, 76.65it/s]
 
547
  97%|█████████▋| 840/869 [00:10<00:00, 78.44it/s]
 
548
  98%|█████████▊| 849/869 [00:11<00:00, 80.04it/s]
 
549
  99%|█████████▊| 858/869 [00:11<00:00, 79.59it/s]
 
550
 
 
551
 
552
  10%|█ | 448/4480 [03:02<22:54, 2.93it/s]
 
 
553
  [INFO|trainer.py:3503] 2024-09-09 14:18:09,952 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-448
 
 
 
 
 
 
 
554
  10%|█ | 449/4480 [03:06<6:41:43, 5.98s/it]
555
  10%|█ | 450/4480 [03:06<4:51:00, 4.33s/it]
556
  10%|█ | 451/4480 [03:07<3:31:43, 3.15s/it]
557
  10%|█ | 452/4480 [03:07<2:36:10, 2.33s/it]
558
  10%|█ | 453/4480 [03:07<1:54:40, 1.71s/it]
559
  10%|█ | 454/4480 [03:08<1:28:07, 1.31s/it]
560
  10%|█ | 455/4480 [03:08<1:08:58, 1.03s/it]
561
  10%|█ | 456/4480 [03:08<53:19, 1.26it/s]
562
  10%|█ | 457/4480 [03:09<43:53, 1.53it/s]
563
  10%|█ | 458/4480 [03:09<37:31, 1.79it/s]
564
  10%|█ | 459/4480 [03:09<38:22, 1.75it/s]
565
  10%|█ | 460/4480 [03:10<33:39, 1.99it/s]
566
  10%|█ | 461/4480 [03:10<31:32, 2.12it/s]
567
  10%|█ | 462/4480 [03:11<28:45, 2.33it/s]
568
  10%|█ | 463/4480 [03:11<27:17, 2.45it/s]
569
  10%|█ | 464/4480 [03:11<26:13, 2.55it/s]
570
  10%|█ | 465/4480 [03:12<25:11, 2.66it/s]
571
  10%|█ | 466/4480 [03:12<23:50, 2.81it/s]
572
  10%|█ | 467/4480 [03:12<23:50, 2.81it/s]
573
  10%|█ | 468/4480 [03:13<27:53, 2.40it/s]
574
  10%|█ | 469/4480 [03:13<25:14, 2.65it/s]
575
  10%|█ | 470/4480 [03:13<24:07, 2.77it/s]
576
  11%|█ | 471/4480 [03:14<23:45, 2.81it/s]
577
  11%|█ | 472/4480 [03:14<23:26, 2.85it/s]
578
  11%|█ | 473/4480 [03:15<24:05, 2.77it/s]
579
  11%|█ | 474/4480 [03:15<24:20, 2.74it/s]
580
  11%|█ | 475/4480 [03:15<25:03, 2.66it/s]
581
  11%|█ | 476/4480 [03:16<23:49, 2.80it/s]
582
  11%|█ | 477/4480 [03:16<23:51, 2.80it/s]
583
  11%|█ | 478/4480 [03:16<22:26, 2.97it/s]
584
  11%|█ | 479/4480 [03:17<21:31, 3.10it/s]
585
  11%|█ | 480/4480 [03:17<21:46, 3.06it/s]
586
  11%|█ | 481/4480 [03:17<23:15, 2.87it/s]
587
  11%|█ | 482/4480 [03:18<24:33, 2.71it/s]
588
  11%|█ | 483/4480 [03:18<24:43, 2.69it/s]
589
  11%|█ | 484/4480 [03:18<25:12, 2.64it/s]
590
  11%|█ | 485/4480 [03:19<24:29, 2.72it/s]
591
  11%|█ | 486/4480 [03:19<27:55, 2.38it/s]
592
  11%|█ | 487/4480 [03:20<32:18, 2.06it/s]
593
  11%|█ | 488/4480 [03:20<31:42, 2.10it/s]
594
  11%|█ | 489/4480 [03:21<28:55, 2.30it/s]
595
  11%|█ | 490/4480 [03:21<27:55, 2.38it/s]
596
  11%|█ | 491/4480 [03:21<25:09, 2.64it/s]
597
  11%|█ | 492/4480 [03:22<24:27, 2.72it/s]
598
  11%|█ | 493/4480 [03:22<24:30, 2.71it/s]
599
  11%|█ | 494/4480 [03:23<23:53, 2.78it/s]
600
  11%|█ | 495/4480 [03:23<23:30, 2.82it/s]
601
  11%|█ | 496/4480 [03:23<23:04, 2.88it/s]
602
  11%|█ | 497/4480 [03:24<23:29, 2.82it/s]
603
  11%|█ | 498/4480 [03:24<23:06, 2.87it/s]
604
  11%|█ | 499/4480 [03:24<22:46, 2.91it/s]
605
  11%|█ | 500/4480 [03:25<27:16, 2.43it/s]
606
 
607
  11%|█ | 500/4480 [03:25<27:16, 2.43it/s]
608
  11%|█ | 501/4480 [03:25<31:27, 2.11it/s]
609
  11%|█ | 502/4480 [03:26<28:12, 2.35it/s]
610
  11%|█ | 503/4480 [03:26<26:23, 2.51it/s]
611
  11%|█▏ | 504/4480 [03:26<25:09, 2.63it/s]
612
  11%|█▏ | 505/4480 [03:27<24:50, 2.67it/s]
613
  11%|█▏ | 506/4480 [03:27<27:31, 2.41it/s]
614
  11%|█▏ | 507/4480 [03:28<24:50, 2.66it/s]
615
  11%|█▏ | 508/4480 [03:28<27:23, 2.42it/s]
616
  11%|█▏ | 509/4480 [03:28<24:41, 2.68it/s]
617
  11%|█▏ | 510/4480 [03:29<23:15, 2.85it/s]
618
  11%|█▏ | 511/4480 [03:29<22:12, 2.98it/s]
619
  11%|█▏ | 512/4480 [03:29<23:53, 2.77it/s]
620
  11%|█▏ | 513/4480 [03:30<22:50, 2.89it/s]
621
  11%|█▏ | 514/4480 [03:30<23:24, 2.82it/s]
622
  11%|█▏ | 515/4480 [03:30<21:48, 3.03it/s]
623
  12%|█▏ | 516/4480 [03:31<21:58, 3.01it/s]
624
  12%|█▏ | 517/4480 [03:31<21:40, 3.05it/s]
625
  12%|█▏ | 518/4480 [03:31<23:52, 2.77it/s]
626
  12%|█▏ | 519/4480 [03:32<22:42, 2.91it/s]
627
  12%|█▏ | 520/4480 [03:32<22:14, 2.97it/s]
628
  12%|█▏ | 521/4480 [03:32<21:35, 3.06it/s]
629
  12%|█▏ | 522/4480 [03:33<23:50, 2.77it/s]
630
  12%|█▏ | 523/4480 [03:33<24:23, 2.70it/s]
631
  12%|█▏ | 524/4480 [03:33<21:43, 3.03it/s]
632
  12%|█▏ | 525/4480 [03:34<23:16, 2.83it/s]
633
  12%|█▏ | 526/4480 [03:34<23:03, 2.86it/s]
634
  12%|█▏ | 527/4480 [03:34<22:30, 2.93it/s]
635
  12%|█▏ | 528/4480 [03:35<21:39, 3.04it/s]
636
  12%|█▏ | 529/4480 [03:35<23:01, 2.86it/s]
637
  12%|█▏ | 530/4480 [03:36<23:29, 2.80it/s]
638
  12%|█▏ | 531/4480 [03:36<25:11, 2.61it/s]
639
  12%|█▏ | 532/4480 [03:36<24:50, 2.65it/s]
640
  12%|█▏ | 533/4480 [03:37<28:27, 2.31it/s]
641
  12%|█▏ | 534/4480 [03:37<27:49, 2.36it/s]
642
  12%|█▏ | 535/4480 [03:38<27:50, 2.36it/s]
643
  12%|█▏ | 536/4480 [03:38<25:21, 2.59it/s]
644
  12%|█▏ | 537/4480 [03:38<26:08, 2.51it/s]
645
  12%|█▏ | 538/4480 [03:39<25:05, 2.62it/s]
646
  12%|█▏ | 539/4480 [03:39<25:29, 2.58it/s]
647
  12%|█▏ | 540/4480 [03:40<25:05, 2.62it/s]
648
  12%|█▏ | 541/4480 [03:40<24:07, 2.72it/s]
649
  12%|█▏ | 542/4480 [03:40<22:54, 2.86it/s]
650
  12%|█▏ | 543/4480 [03:41<21:59, 2.98it/s]
651
  12%|█▏ | 544/4480 [03:41<25:18, 2.59it/s]
652
  12%|█▏ | 545/4480 [03:41<25:08, 2.61it/s]
653
  12%|█▏ | 546/4480 [03:42<27:46, 2.36it/s]
654
  12%|█▏ | 547/4480 [03:42<26:14, 2.50it/s]
655
  12%|█▏ | 548/4480 [03:43<25:27, 2.57it/s]
656
  12%|█▏ | 549/4480 [03:43<26:18, 2.49it/s]
657
  12%|█▏ | 550/4480 [03:44<28:02, 2.34it/s]
658
  12%|█▏ | 551/4480 [03:44<27:01, 2.42it/s]
659
  12%|█▏ | 552/4480 [03:44<29:30, 2.22it/s]
660
  12%|█▏ | 553/4480 [03:45<26:33, 2.46it/s]
661
  12%|█▏ | 554/4480 [03:45<24:58, 2.62it/s]
662
  12%|█▏ | 555/4480 [03:45<23:37, 2.77it/s]
663
  12%|█▏ | 556/4480 [03:46<25:37, 2.55it/s]
664
  12%|█▏ | 557/4480 [03:46<24:21, 2.68it/s]
665
  12%|█▏ | 558/4480 [03:46<22:27, 2.91it/s]
666
  12%|█▏ | 559/4480 [03:47<21:36, 3.02it/s]
667
  12%|█▎ | 560/4480 [03:47<21:46, 3.00it/s]
668
  13%|█▎ | 561/4480 [03:47<22:41, 2.88it/s]
669
  13%|█▎ | 562/4480 [03:48<23:15, 2.81it/s]
670
  13%|█▎ | 563/4480 [03:49<29:23, 2.22it/s]
671
  13%|█▎ | 564/4480 [03:49<28:08, 2.32it/s]
672
  13%|█▎ | 565/4480 [03:49<28:23, 2.30it/s]
673
  13%|█▎ | 566/4480 [03:50<26:58, 2.42it/s]
674
  13%|█▎ | 567/4480 [03:50<27:07, 2.40it/s]
675
  13%|█▎ | 568/4480 [03:51<26:20, 2.48it/s]
676
  13%|█▎ | 569/4480 [03:51<25:58, 2.51it/s]
677
  13%|█▎ | 570/4480 [03:51<23:38, 2.76it/s]
 
1
+ 2024-09-09 14:14:39.290280: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2
+ 2024-09-09 14:14:39.308004: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:485] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
3
+ 2024-09-09 14:14:39.329151: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:8454] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
4
+ 2024-09-09 14:14:39.335520: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1452] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
5
+ 2024-09-09 14:14:39.350729: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
6
+ To enable the following instructions: AVX2 AVX512F AVX512_VNNI FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.
7
+ 2024-09-09 14:14:40.598840: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT
8
+ /usr/local/lib/python3.10/dist-packages/transformers/training_args.py:1525: FutureWarning: `evaluation_strategy` is deprecated and will be removed in version 4.46 of 🤗 Transformers. Use `eval_strategy` instead
9
+ warnings.warn(
10
+ 09/09/2024 14:14:42 - WARNING - __main__ - Process rank: 0, device: cuda:0, n_gpu: 1distributed training: True, 16-bits training: False
11
+ 09/09/2024 14:14:42 - INFO - __main__ - Training/evaluation parameters TrainingArguments(
12
+ _n_gpu=1,
13
+ accelerator_config={'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None, 'use_configured_state': False},
14
+ adafactor=False,
15
+ adam_beta1=0.9,
16
+ adam_beta2=0.999,
17
+ adam_epsilon=1e-08,
18
+ auto_find_batch_size=False,
19
+ batch_eval_metrics=False,
20
+ bf16=False,
21
+ bf16_full_eval=False,
22
+ data_seed=None,
23
+ dataloader_drop_last=False,
24
+ dataloader_num_workers=0,
25
+ dataloader_persistent_workers=False,
26
+ dataloader_pin_memory=True,
27
+ dataloader_prefetch_factor=None,
28
+ ddp_backend=None,
29
+ ddp_broadcast_buffers=None,
30
+ ddp_bucket_cap_mb=None,
31
+ ddp_find_unused_parameters=None,
32
+ ddp_timeout=1800,
33
+ debug=[],
34
+ deepspeed=None,
35
+ disable_tqdm=False,
36
+ dispatch_batches=None,
37
+ do_eval=True,
38
+ do_predict=True,
39
+ do_train=True,
40
+ eval_accumulation_steps=None,
41
+ eval_delay=0,
42
+ eval_do_concat_batches=True,
43
+ eval_on_start=False,
44
+ eval_steps=None,
45
+ eval_strategy=epoch,
46
+ eval_use_gather_object=False,
47
+ evaluation_strategy=epoch,
48
+ fp16=False,
49
+ fp16_backend=auto,
50
+ fp16_full_eval=False,
51
+ fp16_opt_level=O1,
52
+ fsdp=[],
53
+ fsdp_config={'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False},
54
+ fsdp_min_num_params=0,
55
+ fsdp_transformer_layer_cls_to_wrap=None,
56
+ full_determinism=False,
57
+ gradient_accumulation_steps=2,
58
+ gradient_checkpointing=False,
59
+ gradient_checkpointing_kwargs=None,
60
+ greater_is_better=True,
61
+ group_by_length=False,
62
+ half_precision_backend=auto,
63
+ hub_always_push=False,
64
+ hub_model_id=None,
65
+ hub_private_repo=False,
66
+ hub_strategy=every_save,
67
+ hub_token=<HUB_TOKEN>,
68
+ ignore_data_skip=False,
69
+ include_inputs_for_metrics=False,
70
+ include_num_input_tokens_seen=False,
71
+ include_tokens_per_second=False,
72
+ jit_mode_eval=False,
73
+ label_names=None,
74
+ label_smoothing_factor=0.0,
75
+ learning_rate=5e-05,
76
+ length_column_name=length,
77
+ load_best_model_at_end=True,
78
+ local_rank=0,
79
+ log_level=passive,
80
+ log_level_replica=warning,
81
+ log_on_each_node=True,
82
+ logging_dir=/content/dissertation/scripts/ner/output/tb,
83
+ logging_first_step=False,
84
+ logging_nan_inf_filter=True,
85
+ logging_steps=500,
86
+ logging_strategy=steps,
87
+ lr_scheduler_kwargs={},
88
+ lr_scheduler_type=linear,
89
+ max_grad_norm=1.0,
90
+ max_steps=-1,
91
+ metric_for_best_model=f1,
92
+ mp_parameters=,
93
+ neftune_noise_alpha=None,
94
+ no_cuda=False,
95
+ num_train_epochs=10.0,
96
+ optim=adamw_torch,
97
+ optim_args=None,
98
+ optim_target_modules=None,
99
+ output_dir=/content/dissertation/scripts/ner/output,
100
+ overwrite_output_dir=True,
101
+ past_index=-1,
102
+ per_device_eval_batch_size=8,
103
+ per_device_train_batch_size=32,
104
+ prediction_loss_only=False,
105
+ push_to_hub=True,
106
+ push_to_hub_model_id=None,
107
+ push_to_hub_organization=None,
108
+ push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
109
+ ray_scope=last,
110
+ remove_unused_columns=True,
111
+ report_to=['tensorboard'],
112
+ restore_callback_states_from_checkpoint=False,
113
+ resume_from_checkpoint=None,
114
+ run_name=/content/dissertation/scripts/ner/output,
115
+ save_on_each_node=False,
116
+ save_only_model=False,
117
+ save_safetensors=True,
118
+ save_steps=500,
119
+ save_strategy=epoch,
120
+ save_total_limit=None,
121
+ seed=42,
122
+ skip_memory_metrics=True,
123
+ split_batches=None,
124
+ tf32=None,
125
+ torch_compile=False,
126
+ torch_compile_backend=None,
127
+ torch_compile_mode=None,
128
+ torch_empty_cache_steps=None,
129
+ torchdynamo=None,
130
+ tpu_metrics_debug=False,
131
+ tpu_num_cores=None,
132
+ use_cpu=False,
133
+ use_ipex=False,
134
+ use_legacy_prediction_loop=False,
135
+ use_mps_device=False,
136
+ warmup_ratio=0.0,
137
+ warmup_steps=0,
138
+ weight_decay=0.0,
139
+ )
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+ [INFO|configuration_utils.py:733] 2024-09-09 14:15:00,004 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/config.json
148
+ [INFO|configuration_utils.py:800] 2024-09-09 14:15:00,008 >> Model config BertConfig {
149
+ "_name_or_path": "michiyasunaga/BioLinkBERT-base",
150
+ "architectures": [
151
+ "BertModel"
152
+ ],
153
+ "attention_probs_dropout_prob": 0.1,
154
+ "classifier_dropout": null,
155
+ "finetuning_task": "ner",
156
+ "gradient_checkpointing": false,
157
+ "hidden_act": "gelu",
158
+ "hidden_dropout_prob": 0.1,
159
+ "hidden_size": 768,
160
+ "id2label": {
161
+ "0": "O",
162
+ "1": "B-FARMACO",
163
+ "2": "I-FARMACO"
164
+ },
165
+ "initializer_range": 0.02,
166
+ "intermediate_size": 3072,
167
+ "label2id": {
168
+ "B-FARMACO": 1,
169
+ "I-FARMACO": 2,
170
+ "O": 0
171
+ },
172
+ "layer_norm_eps": 1e-12,
173
+ "max_position_embeddings": 512,
174
+ "model_type": "bert",
175
+ "num_attention_heads": 12,
176
+ "num_hidden_layers": 12,
177
+ "pad_token_id": 0,
178
+ "position_embedding_type": "absolute",
179
+ "transformers_version": "4.44.2",
180
+ "type_vocab_size": 2,
181
+ "use_cache": true,
182
+ "vocab_size": 28895
183
+ }
184
+
185
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 14:15:00,242 >> loading file vocab.txt from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/vocab.txt
186
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 14:15:00,242 >> loading file tokenizer.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/tokenizer.json
187
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 14:15:00,242 >> loading file added_tokens.json from cache at None
188
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 14:15:00,242 >> loading file special_tokens_map.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/special_tokens_map.json
189
+ [INFO|tokenization_utils_base.py:2269] 2024-09-09 14:15:00,242 >> loading file tokenizer_config.json from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/tokenizer_config.json
190
+ /usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884
191
+ warnings.warn(
192
+ [INFO|modeling_utils.py:3678] 2024-09-09 14:15:00,548 >> loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--michiyasunaga--BioLinkBERT-base/snapshots/b71f5d70f063d1c8f1124070ce86f1ee463ca1fe/pytorch_model.bin
193
+ [INFO|modeling_utils.py:4497] 2024-09-09 14:15:00,628 >> Some weights of the model checkpoint at michiyasunaga/BioLinkBERT-base were not used when initializing BertForTokenClassification: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
194
+ - This IS expected if you are initializing BertForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
195
+ - This IS NOT expected if you are initializing BertForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
196
+ [WARNING|modeling_utils.py:4509] 2024-09-09 14:15:00,628 >> Some weights of BertForTokenClassification were not initialized from the model checkpoint at michiyasunaga/BioLinkBERT-base and are newly initialized: ['classifier.bias', 'classifier.weight']
197
+ You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
198
+
199
+
200
+
201
+ /content/dissertation/scripts/ner/run_ner_train.py:397: FutureWarning: load_metric is deprecated and will be removed in the next major version of datasets. Use 'evaluate.load' instead, from the new library 🤗 Evaluate: https://huggingface.co/docs/evaluate
202
+ metric = load_metric("seqeval", trust_remote_code=True)
203
+ [INFO|trainer.py:811] 2024-09-09 14:15:07,256 >> The following columns in the training set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: id, tokens, ner_tags. If id, tokens, ner_tags are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
204
+ [INFO|trainer.py:2134] 2024-09-09 14:15:07,820 >> ***** Running training *****
205
+ [INFO|trainer.py:2135] 2024-09-09 14:15:07,820 >> Num examples = 28,668
206
+ [INFO|trainer.py:2136] 2024-09-09 14:15:07,820 >> Num Epochs = 10
207
+ [INFO|trainer.py:2137] 2024-09-09 14:15:07,820 >> Instantaneous batch size per device = 32
208
+ [INFO|trainer.py:2140] 2024-09-09 14:15:07,820 >> Total train batch size (w. parallel, distributed & accumulation) = 64
209
+ [INFO|trainer.py:2141] 2024-09-09 14:15:07,820 >> Gradient Accumulation steps = 2
210
+ [INFO|trainer.py:2142] 2024-09-09 14:15:07,820 >> Total optimization steps = 4,480
211
+ [INFO|trainer.py:2143] 2024-09-09 14:15:07,820 >> Number of trainable parameters = 107,644,419
212
+
213
  0%| | 0/4480 [00:00<?, ?it/s]
214
  0%| | 1/4480 [00:01<1:27:13, 1.17s/it]
215
  0%| | 2/4480 [00:01<58:18, 1.28it/s]
216
  0%| | 3/4480 [00:01<42:36, 1.75it/s]
217
  0%| | 4/4480 [00:02<40:37, 1.84it/s]
218
  0%| | 5/4480 [00:02<38:44, 1.93it/s]
219
  0%| | 6/4480 [00:03<38:28, 1.94it/s]
220
  0%| | 7/4480 [00:04<40:28, 1.84it/s]
221
  0%| | 8/4480 [00:04<33:34, 2.22it/s]
222
  0%| | 9/4480 [00:05<43:45, 1.70it/s]
223
  0%| | 10/4480 [00:05<37:41, 1.98it/s]
224
  0%| | 11/4480 [00:05<33:46, 2.21it/s]
225
  0%| | 12/4480 [00:06<29:48, 2.50it/s]
226
  0%| | 13/4480 [00:06<27:25, 2.71it/s]
227
  0%| | 14/4480 [00:06<26:26, 2.81it/s]
228
  0%| | 15/4480 [00:07<27:19, 2.72it/s]
229
  0%| | 16/4480 [00:07<26:01, 2.86it/s]
230
  0%| | 17/4480 [00:07<25:55, 2.87it/s]
231
  0%| | 18/4480 [00:08<25:52, 2.87it/s]
232
  0%| | 19/4480 [00:08<26:25, 2.81it/s]
233
  0%| | 20/4480 [00:09<29:47, 2.50it/s]
234
  0%| | 21/4480 [00:09<27:56, 2.66it/s]
235
  0%| | 22/4480 [00:09<26:06, 2.85it/s]
236
  1%| | 23/4480 [00:10<29:12, 2.54it/s]
237
  1%| | 24/4480 [00:10<29:18, 2.53it/s]
238
  1%| | 25/4480 [00:10<28:01, 2.65it/s]
239
  1%| | 26/4480 [00:11<27:24, 2.71it/s]
240
  1%| | 27/4480 [00:11<26:48, 2.77it/s]
241
  1%| | 28/4480 [00:11<24:44, 3.00it/s]
242
  1%| | 29/4480 [00:12<23:45, 3.12it/s]
243
  1%| | 30/4480 [00:12<24:01, 3.09it/s]
244
  1%| | 31/4480 [00:12<25:11, 2.94it/s]
245
  1%| | 32/4480 [00:13<31:17, 2.37it/s]
246
  1%| | 33/4480 [00:13<29:50, 2.48it/s]
247
  1%| | 34/4480 [00:14<28:19, 2.62it/s]
248
  1%| | 35/4480 [00:14<27:06, 2.73it/s]
249
  1%| | 36/4480 [00:14<25:14, 2.93it/s]
250
  1%| | 37/4480 [00:15<25:46, 2.87it/s]
251
  1%| | 38/4480 [00:15<25:39, 2.89it/s]
252
  1%| | 39/4480 [00:15<25:19, 2.92it/s]
253
  1%| | 40/4480 [00:16<23:37, 3.13it/s]
254
  1%| | 41/4480 [00:16<26:05, 2.84it/s]
255
  1%| | 42/4480 [00:16<27:16, 2.71it/s]
256
  1%| | 43/4480 [00:17<27:36, 2.68it/s]
257
  1%| | 44/4480 [00:17<25:25, 2.91it/s]
258
  1%| | 45/4480 [00:17<26:45, 2.76it/s]
259
  1%| | 46/4480 [00:18<27:15, 2.71it/s]
260
  1%| | 47/4480 [00:18<24:30, 3.01it/s]
261
  1%| | 48/4480 [00:18<23:58, 3.08it/s]
262
  1%| | 49/4480 [00:19<27:39, 2.67it/s]
263
  1%| | 50/4480 [00:19<27:03, 2.73it/s]
264
  1%| | 51/4480 [00:20<26:51, 2.75it/s]
265
  1%| | 52/4480 [00:20<26:28, 2.79it/s]
266
  1%| | 53/4480 [00:20<25:58, 2.84it/s]
267
  1%| | 54/4480 [00:21<25:34, 2.88it/s]
268
  1%| | 55/4480 [00:21<26:41, 2.76it/s]
269
  1%|▏ | 56/4480 [00:21<25:43, 2.87it/s]
270
  1%|▏ | 57/4480 [00:22<25:10, 2.93it/s]
271
  1%|▏ | 58/4480 [00:22<24:48, 2.97it/s]
272
  1%|▏ | 59/4480 [00:22<27:00, 2.73it/s]
273
  1%|▏ | 60/4480 [00:23<25:08, 2.93it/s]
274
  1%|▏ | 61/4480 [00:23<23:47, 3.10it/s]
275
  1%|▏ | 62/4480 [00:23<24:58, 2.95it/s]
276
  1%|▏ | 63/4480 [00:24<25:04, 2.94it/s]
277
  1%|▏ | 64/4480 [00:24<25:28, 2.89it/s]
278
  1%|▏ | 65/4480 [00:24<26:23, 2.79it/s]
279
  1%|▏ | 66/4480 [00:25<27:05, 2.72it/s]
280
  1%|▏ | 67/4480 [00:25<24:30, 3.00it/s]
281
  2%|▏ | 68/4480 [00:26<27:07, 2.71it/s]
282
  2%|▏ | 69/4480 [00:26<24:36, 2.99it/s]
283
  2%|▏ | 70/4480 [00:26<23:24, 3.14it/s]
284
  2%|▏ | 71/4480 [00:26<23:37, 3.11it/s]
285
  2%|▏ | 72/4480 [00:27<25:38, 2.87it/s]
286
  2%|▏ | 73/4480 [00:27<25:22, 2.89it/s]
287
  2%|▏ | 74/4480 [00:28<29:49, 2.46it/s]
288
  2%|▏ | 75/4480 [00:28<27:22, 2.68it/s]
289
  2%|▏ | 76/4480 [00:28<28:53, 2.54it/s]
290
  2%|▏ | 77/4480 [00:29<26:12, 2.80it/s]
291
  2%|▏ | 78/4480 [00:29<25:33, 2.87it/s]
292
  2%|▏ | 79/4480 [00:29<24:38, 2.98it/s]
293
  2%|▏ | 80/4480 [00:30<23:06, 3.17it/s]
294
  2%|▏ | 81/4480 [00:30<21:32, 3.40it/s]
295
  2%|▏ | 82/4480 [00:30<23:59, 3.06it/s]
296
  2%|▏ | 83/4480 [00:31<25:23, 2.89it/s]
297
  2%|▏ | 84/4480 [00:31<23:38, 3.10it/s]
298
  2%|▏ | 85/4480 [00:31<26:33, 2.76it/s]
299
  2%|▏ | 86/4480 [00:32<25:19, 2.89it/s]
300
  2%|▏ | 87/4480 [00:32<26:24, 2.77it/s]
301
  2%|▏ | 88/4480 [00:32<26:14, 2.79it/s]
302
  2%|▏ | 89/4480 [00:33<27:43, 2.64it/s]
303
  2%|▏ | 90/4480 [00:33<27:35, 2.65it/s]
304
  2%|▏ | 91/4480 [00:34<26:44, 2.73it/s]
305
  2%|▏ | 92/4480 [00:34<25:58, 2.82it/s]
306
  2%|▏ | 93/4480 [00:34<29:40, 2.46it/s]
307
  2%|▏ | 94/4480 [00:35<31:01, 2.36it/s]
308
  2%|▏ | 95/4480 [00:35<28:40, 2.55it/s]
309
  2%|▏ | 96/4480 [00:36<29:02, 2.52it/s]
310
  2%|▏ | 97/4480 [00:36<27:33, 2.65it/s]
311
  2%|▏ | 98/4480 [00:36<25:41, 2.84it/s]
312
  2%|▏ | 99/4480 [00:37<25:00, 2.92it/s]
313
  2%|▏ | 100/4480 [00:37<24:27, 2.98it/s]
314
  2%|▏ | 101/4480 [00:37<23:31, 3.10it/s]
315
  2%|▏ | 102/4480 [00:38<25:30, 2.86it/s]
316
  2%|▏ | 103/4480 [00:38<26:52, 2.72it/s]
317
  2%|▏ | 104/4480 [00:38<27:32, 2.65it/s]
318
  2%|▏ | 105/4480 [00:39<27:49, 2.62it/s]
319
  2%|▏ | 106/4480 [00:39<28:57, 2.52it/s]
320
  2%|▏ | 107/4480 [00:40<29:45, 2.45it/s]
321
  2%|▏ | 108/4480 [00:40<29:21, 2.48it/s]
322
  2%|▏ | 109/4480 [00:41<30:06, 2.42it/s]
323
  2%|▏ | 110/4480 [00:41<28:50, 2.52it/s]
324
  2%|▏ | 111/4480 [00:41<26:51, 2.71it/s]
325
  2%|▎ | 112/4480 [00:42<26:40, 2.73it/s]
326
  3%|▎ | 113/4480 [00:42<25:18, 2.88it/s]
327
  3%|▎ | 114/4480 [00:42<24:22, 2.98it/s]
328
  3%|▎ | 115/4480 [00:42<24:30, 2.97it/s]
329
  3%|▎ | 116/4480 [00:43<23:50, 3.05it/s]
330
  3%|▎ | 117/4480 [00:43<24:04, 3.02it/s]
331
  3%|▎ | 118/4480 [00:43<25:05, 2.90it/s]
332
  3%|▎ | 119/4480 [00:44<26:54, 2.70it/s]
333
  3%|▎ | 120/4480 [00:44<26:18, 2.76it/s]
334
  3%|▎ | 121/4480 [00:45<25:48, 2.81it/s]
335
  3%|▎ | 122/4480 [00:45<24:31, 2.96it/s]
336
  3%|▎ | 123/4480 [00:45<24:25, 2.97it/s]
337
  3%|▎ | 124/4480 [00:46<26:24, 2.75it/s]
338
  3%|▎ | 125/4480 [00:46<24:42, 2.94it/s]
339
  3%|▎ | 126/4480 [00:46<24:37, 2.95it/s]
340
  3%|▎ | 127/4480 [00:47<23:19, 3.11it/s]
341
  3%|▎ | 128/4480 [00:47<24:13, 2.99it/s]
342
  3%|▎ | 129/4480 [00:47<25:24, 2.85it/s]
343
  3%|▎ | 130/4480 [00:48<26:42, 2.71it/s]
344
  3%|▎ | 131/4480 [00:48<25:07, 2.88it/s]
345
  3%|▎ | 132/4480 [00:48<22:49, 3.18it/s]
346
  3%|▎ | 133/4480 [00:49<23:09, 3.13it/s]
347
  3%|▎ | 134/4480 [00:49<22:16, 3.25it/s]
348
  3%|▎ | 135/4480 [00:49<24:13, 2.99it/s]
349
  3%|▎ | 136/4480 [00:50<29:11, 2.48it/s]
350
  3%|▎ | 137/4480 [00:50<27:13, 2.66it/s]
351
  3%|▎ | 138/4480 [00:50<25:49, 2.80it/s]
352
  3%|▎ | 139/4480 [00:51<23:35, 3.07it/s]
353
  3%|▎ | 140/4480 [00:51<26:01, 2.78it/s]
354
  3%|▎ | 141/4480 [00:51<24:42, 2.93it/s]
355
  3%|▎ | 142/4480 [00:52<25:08, 2.88it/s]
356
  3%|▎ | 143/4480 [00:52<24:12, 2.99it/s]
357
  3%|▎ | 144/4480 [00:53<25:47, 2.80it/s]
358
  3%|▎ | 145/4480 [00:53<27:19, 2.64it/s]
359
  3%|▎ | 146/4480 [00:53<25:50, 2.80it/s]
360
  3%|▎ | 147/4480 [00:54<26:06, 2.77it/s]
361
  3%|▎ | 148/4480 [00:54<28:09, 2.56it/s]
362
  3%|▎ | 149/4480 [00:54<25:11, 2.87it/s]
363
  3%|▎ | 150/4480 [00:55<24:56, 2.89it/s]
364
  3%|▎ | 151/4480 [00:55<25:44, 2.80it/s]
365
  3%|▎ | 152/4480 [00:55<24:55, 2.89it/s]
366
  3%|▎ | 153/4480 [00:56<24:43, 2.92it/s]
367
  3%|▎ | 154/4480 [00:56<26:18, 2.74it/s]
368
  3%|▎ | 155/4480 [00:57<26:55, 2.68it/s]
369
  3%|▎ | 156/4480 [00:57<24:56, 2.89it/s]
370
  4%|▎ | 157/4480 [00:57<23:56, 3.01it/s]
371
  4%|▎ | 158/4480 [00:57<23:58, 3.00it/s]
372
  4%|▎ | 159/4480 [00:58<25:32, 2.82it/s]
373
  4%|▎ | 160/4480 [00:58<23:23, 3.08it/s]
374
  4%|▎ | 161/4480 [00:59<31:10, 2.31it/s]
375
  4%|▎ | 162/4480 [00:59<28:51, 2.49it/s]
376
  4%|▎ | 163/4480 [01:00<30:49, 2.33it/s]
377
  4%|▎ | 164/4480 [01:00<29:43, 2.42it/s]
378
  4%|▎ | 165/4480 [01:00<29:25, 2.44it/s]
379
  4%|▎ | 166/4480 [01:01<29:31, 2.44it/s]
380
  4%|▎ | 167/4480 [01:01<29:34, 2.43it/s]
381
  4%|▍ | 168/4480 [01:02<28:35, 2.51it/s]
382
  4%|▍ | 169/4480 [01:02<28:08, 2.55it/s]
383
  4%|▍ | 170/4480 [01:02<29:51, 2.41it/s]
384
  4%|▍ | 171/4480 [01:03<28:51, 2.49it/s]
385
  4%|▍ | 172/4480 [01:03<28:14, 2.54it/s]
386
  4%|▍ | 173/4480 [01:04<31:39, 2.27it/s]
387
  4%|▍ | 174/4480 [01:04<29:28, 2.43it/s]
388
  4%|▍ | 175/4480 [01:04<27:20, 2.62it/s]
389
  4%|▍ | 176/4480 [01:05<29:32, 2.43it/s]
390
  4%|▍ | 177/4480 [01:05<27:30, 2.61it/s]
391
  4%|▍ | 178/4480 [01:06<26:36, 2.69it/s]
392
  4%|▍ | 179/4480 [01:06<25:08, 2.85it/s]
393
  4%|▍ | 180/4480 [01:06<25:26, 2.82it/s]
394
  4%|▍ | 181/4480 [01:07<25:06, 2.85it/s]
395
  4%|▍ | 182/4480 [01:07<25:35, 2.80it/s]
396
  4%|▍ | 183/4480 [01:07<25:33, 2.80it/s]
397
  4%|▍ | 184/4480 [01:08<25:09, 2.85it/s]
398
  4%|▍ | 185/4480 [01:08<23:36, 3.03it/s]
399
  4%|▍ | 186/4480 [01:08<23:48, 3.01it/s]
400
  4%|▍ | 187/4480 [01:09<27:59, 2.56it/s]
401
  4%|▍ | 188/4480 [01:09<28:01, 2.55it/s]
402
  4%|▍ | 189/4480 [01:10<31:35, 2.26it/s]
403
  4%|▍ | 190/4480 [01:10<31:02, 2.30it/s]
404
  4%|▍ | 191/4480 [01:11<30:53, 2.31it/s]
405
  4%|▍ | 192/4480 [01:11<30:25, 2.35it/s]
406
  4%|▍ | 193/4480 [01:11<27:03, 2.64it/s]
407
  4%|▍ | 194/4480 [01:12<26:22, 2.71it/s]
408
  4%|▍ | 195/4480 [01:12<28:28, 2.51it/s]
409
  4%|▍ | 196/4480 [01:12<27:15, 2.62it/s]
410
  4%|▍ | 197/4480 [01:13<28:00, 2.55it/s]
411
  4%|▍ | 198/4480 [01:13<26:24, 2.70it/s]
412
  4%|▍ | 199/4480 [01:13<26:10, 2.73it/s]
413
  4%|▍ | 200/4480 [01:14<24:50, 2.87it/s]
414
  4%|▍ | 201/4480 [01:14<26:46, 2.66it/s]
415
  5%|▍ | 202/4480 [01:15<25:58, 2.74it/s]
416
  5%|▍ | 203/4480 [01:15<30:23, 2.35it/s]
417
  5%|▍ | 204/4480 [01:16<29:15, 2.44it/s]
418
  5%|▍ | 205/4480 [01:16<28:43, 2.48it/s]
419
  5%|▍ | 206/4480 [01:16<29:46, 2.39it/s]
420
  5%|▍ | 207/4480 [01:17<28:00, 2.54it/s]
421
  5%|▍ | 208/4480 [01:17<28:39, 2.49it/s]
422
  5%|▍ | 209/4480 [01:18<31:11, 2.28it/s]
423
  5%|▍ | 210/4480 [01:18<28:02, 2.54it/s]
424
  5%|▍ | 211/4480 [01:18<26:41, 2.67it/s]
425
  5%|▍ | 212/4480 [01:19<25:53, 2.75it/s]
426
  5%|▍ | 213/4480 [01:19<27:32, 2.58it/s]
427
  5%|▍ | 214/4480 [01:19<26:51, 2.65it/s]
428
  5%|▍ | 215/4480 [01:20<24:20, 2.92it/s]
429
  5%|▍ | 216/4480 [01:20<28:15, 2.52it/s]
430
  5%|▍ | 217/4480 [01:21<27:36, 2.57it/s]
431
  5%|▍ | 218/4480 [01:21<26:30, 2.68it/s]
432
  5%|▍ | 219/4480 [01:21<25:09, 2.82it/s]
433
  5%|▍ | 220/4480 [01:21<23:34, 3.01it/s]
434
  5%|▍ | 221/4480 [01:22<26:54, 2.64it/s]
435
  5%|▍ | 222/4480 [01:22<26:57, 2.63it/s]
436
  5%|▍ | 223/4480 [01:23<26:57, 2.63it/s]
437
  5%|▌ | 224/4480 [01:23<28:06, 2.52it/s]
438
  5%|▌ | 225/4480 [01:24<28:12, 2.51it/s]
439
  5%|▌ | 226/4480 [01:24<27:19, 2.59it/s]
440
  5%|▌ | 227/4480 [01:24<24:48, 2.86it/s]
441
  5%|▌ | 228/4480 [01:25<24:25, 2.90it/s]
442
  5%|▌ | 229/4480 [01:25<29:38, 2.39it/s]
443
  5%|▌ | 230/4480 [01:26<33:43, 2.10it/s]
444
  5%|▌ | 231/4480 [01:26<31:08, 2.27it/s]
445
  5%|▌ | 232/4480 [01:26<29:50, 2.37it/s]
446
  5%|▌ | 233/4480 [01:27<28:29, 2.48it/s]
447
  5%|▌ | 234/4480 [01:27<26:36, 2.66it/s]
448
  5%|▌ | 235/4480 [01:27<25:50, 2.74it/s]
449
  5%|▌ | 236/4480 [01:28<23:42, 2.98it/s]
450
  5%|▌ | 237/4480 [01:28<25:03, 2.82it/s]
451
  5%|▌ | 238/4480 [01:28<25:28, 2.77it/s]
452
  5%|▌ | 239/4480 [01:29<24:08, 2.93it/s]
453
  5%|▌ | 240/4480 [01:29<26:09, 2.70it/s]
454
  5%|▌ | 241/4480 [01:30<25:28, 2.77it/s]
455
  5%|▌ | 242/4480 [01:30<28:03, 2.52it/s]
456
  5%|▌ | 243/4480 [01:31<31:01, 2.28it/s]
457
  5%|▌ | 244/4480 [01:31<28:50, 2.45it/s]
458
  5%|▌ | 245/4480 [01:31<27:57, 2.53it/s]
459
  5%|▌ | 246/4480 [01:32<27:41, 2.55it/s]
460
  6%|▌ | 247/4480 [01:32<26:01, 2.71it/s]
461
  6%|▌ | 248/4480 [01:32<27:11, 2.59it/s]
462
  6%|▌ | 249/4480 [01:33<29:16, 2.41it/s]
463
  6%|▌ | 250/4480 [01:33<29:34, 2.38it/s]
464
  6%|▌ | 251/4480 [01:34<29:48, 2.36it/s]
465
  6%|▌ | 252/4480 [01:34<27:11, 2.59it/s]
466
  6%|▌ | 253/4480 [01:34<25:23, 2.77it/s]
467
  6%|▌ | 254/4480 [01:35<27:49, 2.53it/s]
468
  6%|▌ | 255/4480 [01:35<27:50, 2.53it/s]
469
  6%|▌ | 256/4480 [01:36<27:55, 2.52it/s]
470
  6%|▌ | 257/4480 [01:36<28:58, 2.43it/s]
471
  6%|▌ | 258/4480 [01:36<26:38, 2.64it/s]
472
  6%|▌ | 259/4480 [01:37<24:14, 2.90it/s]
473
  6%|▌ | 260/4480 [01:37<23:31, 2.99it/s]
474
  6%|▌ | 261/4480 [01:37<23:23, 3.01it/s]
475
  6%|▌ | 262/4480 [01:38<24:08, 2.91it/s]
476
  6%|▌ | 263/4480 [01:38<24:19, 2.89it/s]
477
  6%|▌ | 264/4480 [01:38<23:39, 2.97it/s]
478
  6%|▌ | 265/4480 [01:39<24:04, 2.92it/s]
479
  6%|▌ | 266/4480 [01:39<26:08, 2.69it/s]
480
  6%|▌ | 267/4480 [01:40<26:31, 2.65it/s]
481
  6%|▌ | 268/4480 [01:40<27:01, 2.60it/s]
482
  6%|▌ | 269/4480 [01:40<24:13, 2.90it/s]
483
  6%|▌ | 270/4480 [01:40<23:21, 3.00it/s]
484
  6%|▌ | 271/4480 [01:41<22:32, 3.11it/s]
485
  6%|▌ | 272/4480 [01:41<24:53, 2.82it/s]
486
  6%|▌ | 273/4480 [01:42<25:37, 2.74it/s]
487
  6%|▌ | 274/4480 [01:42<25:24, 2.76it/s]
488
  6%|▌ | 275/4480 [01:42<23:07, 3.03it/s]
489
  6%|▌ | 276/4480 [01:42<22:08, 3.16it/s]
490
  6%|▌ | 277/4480 [01:43<28:01, 2.50it/s]
491
  6%|▌ | 278/4480 [01:43<27:53, 2.51it/s]
492
  6%|▌ | 279/4480 [01:44<26:38, 2.63it/s]
493
  6%|▋ | 280/4480 [01:44<28:34, 2.45it/s]
494
  6%|▋ | 281/4480 [01:45<28:37, 2.45it/s]
495
  6%|▋ | 282/4480 [01:45<26:38, 2.63it/s]
496
  6%|▋ | 283/4480 [01:45<26:15, 2.66it/s]
497
  6%|▋ | 284/4480 [01:46<25:05, 2.79it/s]
498
  6%|▋ | 285/4480 [01:46<24:09, 2.89it/s]
499
  6%|▋ | 286/4480 [01:46<23:48, 2.94it/s]
500
  6%|▋ | 287/4480 [01:47<25:43, 2.72it/s]
501
  6%|▋ | 288/4480 [01:47<24:32, 2.85it/s]
502
  6%|▋ | 289/4480 [01:48<26:44, 2.61it/s]
503
  6%|▋ | 290/4480 [01:48<24:31, 2.85it/s]
504
  6%|▋ | 291/4480 [01:48<24:09, 2.89it/s]
505
  7%|▋ | 292/4480 [01:48<24:16, 2.88it/s]
506
  7%|▋ | 293/4480 [01:49<25:05, 2.78it/s]
507
  7%|▋ | 294/4480 [01:49<23:20, 2.99it/s]
508
  7%|▋ | 295/4480 [01:50<23:57, 2.91it/s]
509
  7%|▋ | 296/4480 [01:50<25:32, 2.73it/s]
510
  7%|▋ | 297/4480 [01:50<26:29, 2.63it/s]
511
  7%|▋ | 298/4480 [01:51<26:56, 2.59it/s]
512
  7%|▋ | 299/4480 [01:51<26:20, 2.65it/s]
513
  7%|▋ | 300/4480 [01:51<26:33, 2.62it/s]
514
  7%|▋ | 301/4480 [01:52<25:37, 2.72it/s]
515
  7%|▋ | 302/4480 [01:52<24:44, 2.81it/s]
516
  7%|▋ | 303/4480 [01:52<24:11, 2.88it/s]
517
  7%|▋ | 304/4480 [01:53<24:15, 2.87it/s]
518
  7%|▋ | 305/4480 [01:53<21:53, 3.18it/s]
519
  7%|▋ | 306/4480 [01:53<20:20, 3.42it/s]
520
  7%|▋ | 307/4480 [01:54<21:38, 3.21it/s]
521
  7%|▋ | 308/4480 [01:54<21:18, 3.26it/s]
522
  7%|▋ | 309/4480 [01:54<21:50, 3.18it/s]
523
  7%|▋ | 310/4480 [01:55<20:48, 3.34it/s]
524
  7%|▋ | 311/4480 [01:55<22:58, 3.02it/s]
525
  7%|▋ | 312/4480 [01:55<23:29, 2.96it/s]
526
  7%|▋ | 313/4480 [01:56<24:55, 2.79it/s]
527
  7%|▋ | 314/4480 [01:56<27:16, 2.55it/s]
528
  7%|▋ | 315/4480 [01:57<26:04, 2.66it/s]
529
  7%|▋ | 316/4480 [01:57<29:39, 2.34it/s]
530
  7%|▋ | 317/4480 [01:57<27:06, 2.56it/s]
531
  7%|▋ | 318/4480 [01:58<26:32, 2.61it/s]
532
  7%|▋ | 319/4480 [01:58<25:06, 2.76it/s]
533
  7%|▋ | 320/4480 [01:58<26:29, 2.62it/s]
534
  7%|▋ | 321/4480 [01:59<27:00, 2.57it/s]
535
  7%|▋ | 322/4480 [01:59<28:27, 2.44it/s]
536
  7%|▋ | 323/4480 [02:00<27:55, 2.48it/s]
537
  7%|▋ | 324/4480 [02:00<27:53, 2.48it/s]
538
  7%|▋ | 325/4480 [02:01<27:34, 2.51it/s]
539
  7%|▋ | 326/4480 [02:01<26:56, 2.57it/s]
540
  7%|▋ | 327/4480 [02:01<26:27, 2.62it/s]
541
  7%|▋ | 328/4480 [02:02<26:38, 2.60it/s]
542
  7%|▋ | 329/4480 [02:02<27:01, 2.56it/s]
543
  7%|▋ | 330/4480 [02:02<26:19, 2.63it/s]
544
  7%|▋ | 331/4480 [02:03<27:25, 2.52it/s]
545
  7%|▋ | 332/4480 [02:03<26:34, 2.60it/s]
546
  7%|▋ | 333/4480 [02:04<25:43, 2.69it/s]
547
  7%|▋ | 334/4480 [02:04<28:22, 2.44it/s]
548
  7%|▋ | 335/4480 [02:04<25:24, 2.72it/s]
549
  8%|▊ | 336/4480 [02:05<23:13, 2.97it/s]
550
  8%|▊ | 337/4480 [02:05<25:39, 2.69it/s]
551
  8%|▊ | 338/4480 [02:05<25:55, 2.66it/s]
552
  8%|▊ | 339/4480 [02:06<25:20, 2.72it/s]
553
  8%|▊ | 340/4480 [02:06<29:12, 2.36it/s]
554
  8%|▊ | 341/4480 [02:07<28:56, 2.38it/s]
555
  8%|▊ | 342/4480 [02:07<27:18, 2.53it/s]
556
  8%|▊ | 343/4480 [02:07<26:17, 2.62it/s]
557
  8%|▊ | 344/4480 [02:08<24:50, 2.77it/s]
558
  8%|▊ | 345/4480 [02:08<23:19, 2.95it/s]
559
  8%|▊ | 346/4480 [02:09<26:18, 2.62it/s]
560
  8%|▊ | 347/4480 [02:09<24:52, 2.77it/s]
561
  8%|▊ | 348/4480 [02:10<32:01, 2.15it/s]
562
  8%|▊ | 349/4480 [02:10<27:47, 2.48it/s]
563
  8%|▊ | 350/4480 [02:10<26:33, 2.59it/s]
564
  8%|▊ | 351/4480 [02:11<26:06, 2.64it/s]
565
  8%|▊ | 352/4480 [02:11<26:13, 2.62it/s]
566
  8%|▊ | 353/4480 [02:11<24:48, 2.77it/s]
567
  8%|▊ | 354/4480 [02:12<26:07, 2.63it/s]
568
  8%|▊ | 355/4480 [02:12<24:18, 2.83it/s]
569
  8%|▊ | 356/4480 [02:12<25:29, 2.70it/s]
570
  8%|▊ | 357/4480 [02:13<25:39, 2.68it/s]
571
  8%|▊ | 358/4480 [02:13<25:49, 2.66it/s]
572
  8%|▊ | 359/4480 [02:14<29:37, 2.32it/s]
573
  8%|▊ | 360/4480 [02:14<27:43, 2.48it/s]
574
  8%|▊ | 361/4480 [02:14<26:43, 2.57it/s]
575
  8%|▊ | 362/4480 [02:15<26:27, 2.59it/s]
576
  8%|▊ | 363/4480 [02:15<25:35, 2.68it/s]
577
  8%|▊ | 364/4480 [02:15<25:29, 2.69it/s]
578
  8%|▊ | 365/4480 [02:16<25:11, 2.72it/s]
579
  8%|▊ | 366/4480 [02:16<23:31, 2.91it/s]
580
  8%|▊ | 367/4480 [02:16<24:39, 2.78it/s]
581
  8%|▊ | 368/4480 [02:17<23:11, 2.95it/s]
582
  8%|▊ | 369/4480 [02:17<23:02, 2.97it/s]
583
  8%|▊ | 370/4480 [02:17<23:08, 2.96it/s]
584
  8%|▊ | 371/4480 [02:18<24:48, 2.76it/s]
585
  8%|▊ | 372/4480 [02:18<23:33, 2.91it/s]
586
  8%|▊ | 373/4480 [02:18<22:58, 2.98it/s]
587
  8%|▊ | 374/4480 [02:19<24:29, 2.79it/s]
588
  8%|▊ | 375/4480 [02:19<23:40, 2.89it/s]
589
  8%|▊ | 376/4480 [02:20<23:28, 2.91it/s]
590
  8%|▊ | 377/4480 [02:20<23:46, 2.88it/s]
591
  8%|▊ | 378/4480 [02:20<24:12, 2.82it/s]
592
  8%|▊ | 379/4480 [02:21<23:02, 2.97it/s]
593
  8%|▊ | 380/4480 [02:21<22:01, 3.10it/s]
594
  9%|▊ | 381/4480 [02:21<21:01, 3.25it/s]
595
  9%|▊ | 382/4480 [02:22<23:03, 2.96it/s]
596
  9%|▊ | 383/4480 [02:22<24:25, 2.80it/s]
597
  9%|▊ | 384/4480 [02:22<24:56, 2.74it/s]
598
  9%|▊ | 385/4480 [02:23<23:12, 2.94it/s]
599
  9%|▊ | 386/4480 [02:23<23:14, 2.94it/s]
600
  9%|▊ | 387/4480 [02:23<22:27, 3.04it/s]
601
  9%|▊ | 388/4480 [02:24<23:38, 2.88it/s]
602
  9%|▊ | 389/4480 [02:24<26:11, 2.60it/s]
603
  9%|▊ | 390/4480 [02:24<23:59, 2.84it/s]
604
  9%|▊ | 391/4480 [02:25<24:31, 2.78it/s]
605
  9%|▉ | 392/4480 [02:25<23:50, 2.86it/s]
606
  9%|▉ | 393/4480 [02:25<24:42, 2.76it/s]
607
  9%|▉ | 394/4480 [02:26<24:43, 2.75it/s]
608
  9%|▉ | 395/4480 [02:26<24:10, 2.82it/s]
609
  9%|▉ | 396/4480 [02:27<27:16, 2.50it/s]
610
  9%|▉ | 397/4480 [02:27<26:52, 2.53it/s]
611
  9%|▉ | 398/4480 [02:27<24:58, 2.72it/s]
612
  9%|▉ | 399/4480 [02:28<25:32, 2.66it/s]
613
  9%|▉ | 400/4480 [02:28<25:13, 2.70it/s]
614
  9%|▉ | 401/4480 [02:28<22:55, 2.96it/s]
615
  9%|▉ | 402/4480 [02:29<25:10, 2.70it/s]
616
  9%|▉ | 403/4480 [02:29<25:13, 2.69it/s]
617
  9%|▉ | 404/4480 [02:30<25:15, 2.69it/s]
618
  9%|▉ | 405/4480 [02:30<28:21, 2.39it/s]
619
  9%|▉ | 406/4480 [02:30<24:35, 2.76it/s]
620
  9%|▉ | 407/4480 [02:31<24:30, 2.77it/s]
621
  9%|▉ | 408/4480 [02:31<25:41, 2.64it/s]
622
  9%|▉ | 409/4480 [02:32<30:03, 2.26it/s]
623
  9%|▉ | 410/4480 [02:32<27:13, 2.49it/s]
624
  9%|▉ | 411/4480 [02:32<26:56, 2.52it/s]
625
  9%|▉ | 412/4480 [02:33<24:51, 2.73it/s]
626
  9%|▉ | 413/4480 [02:33<25:04, 2.70it/s]
627
  9%|▉ | 414/4480 [02:33<25:37, 2.64it/s]
628
  9%|▉ | 415/4480 [02:34<24:49, 2.73it/s]
629
  9%|▉ | 416/4480 [02:34<26:02, 2.60it/s]
630
  9%|▉ | 417/4480 [02:35<29:20, 2.31it/s]
631
  9%|▉ | 418/4480 [02:35<31:13, 2.17it/s]
632
  9%|▉ | 419/4480 [02:36<29:03, 2.33it/s]
633
  9%|▉ | 420/4480 [02:36<28:41, 2.36it/s]
634
  9%|▉ | 421/4480 [02:36<27:51, 2.43it/s]
635
  9%|▉ | 422/4480 [02:37<34:14, 1.98it/s]
636
  9%|▉ | 423/4480 [02:38<32:52, 2.06it/s]
637
  9%|▉ | 424/4480 [02:38<32:04, 2.11it/s]
638
  9%|▉ | 425/4480 [02:38<29:52, 2.26it/s]
639
  10%|▉ | 426/4480 [02:39<28:03, 2.41it/s]
640
  10%|▉ | 427/4480 [02:39<26:39, 2.53it/s]
641
  10%|▉ | 428/4480 [02:39<25:56, 2.60it/s]
642
  10%|▉ | 429/4480 [02:40<25:09, 2.68it/s]
643
  10%|▉ | 430/4480 [02:40<25:42, 2.62it/s]
644
  10%|▉ | 431/4480 [02:41<24:50, 2.72it/s]
645
  10%|▉ | 432/4480 [02:41<23:36, 2.86it/s]
646
  10%|▉ | 433/4480 [02:41<26:43, 2.52it/s]
647
  10%|▉ | 434/4480 [02:42<24:37, 2.74it/s]
648
  10%|▉ | 435/4480 [02:42<24:14, 2.78it/s]
649
  10%|▉ | 436/4480 [02:42<24:10, 2.79it/s]
650
  10%|▉ | 437/4480 [02:43<23:16, 2.89it/s]
651
  10%|▉ | 438/4480 [02:43<22:28, 3.00it/s]
652
  10%|▉ | 439/4480 [02:43<24:31, 2.75it/s]
653
  10%|▉ | 440/4480 [02:44<23:08, 2.91it/s]
654
  10%|▉ | 441/4480 [02:44<22:38, 2.97it/s]
655
  10%|▉ | 442/4480 [02:44<23:36, 2.85it/s]
656
  10%|▉ | 443/4480 [02:45<24:33, 2.74it/s]
657
  10%|▉ | 444/4480 [02:45<24:04, 2.79it/s]
658
  10%|▉ | 445/4480 [02:46<24:30, 2.74it/s]
659
  10%|▉ | 446/4480 [02:46<22:49, 2.95it/s]
660
  10%|▉ | 447/4480 [02:46<22:59, 2.92it/s]
661
  10%|█ | 448/4480 [02:47<22:54, 2.93it/s][INFO|trainer.py:811] 2024-09-09 14:17:54,861 >> The following columns in the evaluation set don't have a corresponding argument in `BertForTokenClassification.forward` and have been ignored: id, tokens, ner_tags. If id, tokens, ner_tags are not expected by `BertForTokenClassification.forward`, you can safely ignore this message.
662
+ [INFO|trainer.py:3819] 2024-09-09 14:17:54,863 >>
663
+ ***** Running Evaluation *****
664
+ [INFO|trainer.py:3821] 2024-09-09 14:17:54,863 >> Num examples = 6946
665
+ [INFO|trainer.py:3824] 2024-09-09 14:17:54,863 >> Batch size = 8
666
+
667
+
668
  0%| | 0/869 [00:00<?, ?it/s]
669
+
670
  1%| | 10/869 [00:00<00:09, 92.79it/s]
671
+
672
  2%|▏ | 20/869 [00:00<00:10, 80.90it/s]
673
+
674
  3%|▎ | 29/869 [00:00<00:10, 77.67it/s]
675
+
676
  4%|▍ | 37/869 [00:00<00:11, 75.22it/s]
677
+
678
  5%|▌ | 46/869 [00:00<00:10, 78.48it/s]
679
+
680
  6%|▋ | 55/869 [00:00<00:10, 80.85it/s]
681
+
682
  7%|▋ | 64/869 [00:00<00:10, 76.32it/s]
683
+
684
  8%|▊ | 72/869 [00:00<00:10, 75.42it/s]
685
+
686
  9%|▉ | 81/869 [00:01<00:09, 79.55it/s]
687
+
688
  10%|█ | 90/869 [00:01<00:09, 82.34it/s]
689
+
690
  12%|█▏ | 100/869 [00:01<00:08, 85.84it/s]
691
+
692
  13%|█▎ | 109/869 [00:01<00:09, 81.70it/s]
693
+
694
  14%|█▎ | 118/869 [00:01<00:09, 81.22it/s]
695
+
696
  15%|█▍ | 127/869 [00:01<00:09, 79.96it/s]
697
+
698
  16%|█▌ | 136/869 [00:01<00:09, 81.27it/s]
699
+
700
  17%|█▋ | 145/869 [00:01<00:09, 76.67it/s]
701
+
702
  18%|█▊ | 154/869 [00:01<00:09, 78.89it/s]
703
+
704
  19%|█▉ | 163/869 [00:02<00:08, 79.25it/s]
705
+
706
  20%|█▉ | 171/869 [00:02<00:09, 77.29it/s]
707
+
708
  21%|██ | 179/869 [00:02<00:09, 76.38it/s]
709
+
710
  22%|██▏ | 188/869 [00:02<00:08, 77.83it/s]
711
+
712
  23%|██▎ | 196/869 [00:02<00:08, 75.39it/s]
713
+
714
  24%|██▎ | 205/869 [00:02<00:08, 77.74it/s]
715
+
716
  25%|██▍ | 214/869 [00:02<00:08, 79.15it/s]
717
+
718
  26%|██▌ | 223/869 [00:02<00:08, 80.51it/s]
719
+
720
  27%|██▋ | 232/869 [00:02<00:08, 77.06it/s]
721
+
722
  28%|██▊ | 240/869 [00:03<00:08, 76.98it/s]
723
+
724
  29%|██▊ | 248/869 [00:03<00:08, 72.14it/s]
725
+
726
  30%|██▉ | 257/869 [00:03<00:08, 75.25it/s]
727
+
728
  30%|███ | 265/869 [00:03<00:08, 74.46it/s]
729
+
730
  31%|███▏ | 273/869 [00:03<00:07, 74.61it/s]
731
+
732
  32%|███▏ | 281/869 [00:03<00:07, 73.92it/s]
733
+
734
  33%|███▎ | 289/869 [00:03<00:07, 73.26it/s]
735
+
736
  34%|███▍ | 297/869 [00:03<00:07, 74.39it/s]
737
+
738
  35%|███▌ | 305/869 [00:03<00:07, 71.09it/s]
739
+
740
  36%|███▌ | 313/869 [00:04<00:07, 72.71it/s]
741
+
742
  37%|███▋ | 321/869 [00:04<00:07, 72.16it/s]
743
+
744
  38%|███▊ | 330/869 [00:04<00:07, 76.38it/s]
745
+
746
  39%|███▉ | 339/869 [00:04<00:06, 78.09it/s]
747
+
748
  40%|███▉ | 347/869 [00:04<00:07, 72.56it/s]
749
+
750
  41%|████ | 355/869 [00:04<00:06, 73.67it/s]
751
+
752
  42%|████▏ | 364/869 [00:04<00:06, 77.58it/s]
753
+
754
  43%|████▎ | 373/869 [00:04<00:06, 75.01it/s]
755
+
756
  44%|████▍ | 381/869 [00:04<00:06, 76.13it/s]
757
+
758
  45%|████▍ | 389/869 [00:05<00:06, 70.53it/s]
759
+
760
  46%|████▌ | 398/869 [00:05<00:06, 73.42it/s]
761
+
762
  47%|████▋ | 407/869 [00:05<00:06, 76.02it/s]
763
+
764
  48%|████▊ | 416/869 [00:05<00:05, 78.88it/s]
765
+
766
  49%|████▉ | 425/869 [00:05<00:05, 79.96it/s]
767
+
768
  50%|████▉ | 434/869 [00:05<00:05, 80.34it/s]
769
+
770
  51%|█████ | 443/869 [00:05<00:05, 75.42it/s]
771
+
772
  52%|█████▏ | 452/869 [00:05<00:05, 78.65it/s]
773
+
774
  53%|█████▎ | 460/869 [00:05<00:05, 77.89it/s]
775
+
776
  54%|█████▍ | 468/869 [00:06<00:05, 77.51it/s]
777
+
778
  55%|█████▌ | 478/869 [00:06<00:04, 82.03it/s]
779
+
780
  56%|█████▌ | 487/869 [00:06<00:04, 82.20it/s]
781
+
782
  57%|█████▋ | 496/869 [00:06<00:04, 76.78it/s]
783
+
784
  58%|█████▊ | 504/869 [00:06<00:04, 74.30it/s]
785
+
786
  59%|█████▉ | 512/869 [00:06<00:04, 75.36it/s]
787
+
788
  60%|█████▉ | 521/869 [00:06<00:04, 78.56it/s]
789
+
790
  61%|██████ | 529/869 [00:06<00:04, 72.22it/s]
791
+
792
  62%|██████▏ | 537/869 [00:06<00:04, 73.11it/s]
793
+
794
  63%|██████▎ | 545/869 [00:07<00:04, 71.36it/s]
795
+
796
  64%|██████▍ | 554/869 [00:07<00:04, 74.37it/s]
797
+
798
  65%|██████▍ | 562/869 [00:07<00:04, 75.80it/s]
799
+
800
  66%|██████▌ | 570/869 [00:07<00:04, 74.62it/s]
801
+
802
  67%|██████▋ | 579/869 [00:07<00:03, 77.57it/s]
803
+
804
  68%|██████▊ | 587/869 [00:07<00:03, 74.27it/s]
805
+
806
  68%|██████▊ | 595/869 [00:07<00:03, 75.65it/s]
807
+
808
  70%|██████▉ | 604/869 [00:07<00:03, 78.50it/s]
809
+
810
  70%|███████ | 612/869 [00:07<00:03, 77.23it/s]
811
+
812
  71%|███████▏ | 620/869 [00:08<00:03, 77.57it/s]
813
+
814
  72%|███████▏ | 628/869 [00:08<00:03, 75.04it/s]
815
+
816
  73%|███████▎ | 636/869 [00:08<00:03, 73.98it/s]
817
+
818
  74%|███████▍ | 645/869 [00:08<00:02, 77.26it/s]
819
+
820
  75%|███████▌ | 654/869 [00:08<00:02, 78.96it/s]
821
+
822
  76%|███████▌ | 662/869 [00:08<00:02, 78.16it/s]
823
+
824
  77%|███████▋ | 671/869 [00:08<00:02, 81.02it/s]
825
+
826
  78%|███████▊ | 680/869 [00:08<00:02, 82.95it/s]
827
+
828
  79%|███████▉ | 689/869 [00:08<00:02, 71.57it/s]
829
+
830
  80%|████████ | 697/869 [00:09<00:02, 72.76it/s]
831
+
832
  81%|████████ | 705/869 [00:09<00:02, 73.06it/s]
833
+
834
  82%|████████▏ | 714/869 [00:09<00:02, 76.13it/s]
835
+
836
  83%|████████▎ | 722/869 [00:09<00:01, 76.22it/s]
837
+
838
  84%|████████▍ | 731/869 [00:09<00:01, 77.06it/s]
839
+
840
  85%|████████▌ | 739/869 [00:09<00:01, 77.04it/s]
841
+
842
  86%|████████▌ | 747/869 [00:09<00:01, 77.31it/s]
843
+
844
  87%|████████▋ | 755/869 [00:09<00:01, 75.96it/s]
845
+
846
  88%|████████▊ | 764/869 [00:09<00:01, 79.21it/s]
847
+
848
  89%|████████▉ | 772/869 [00:10<00:01, 73.60it/s]
849
+
850
  90%|████████▉ | 780/869 [00:10<00:01, 64.89it/s]
851
+
852
  91%|█████████ | 788/869 [00:10<00:01, 68.63it/s]
853
+
854
  92%|█████████▏| 797/869 [00:10<00:00, 72.49it/s]
855
+
856
  93%|█████████▎| 805/869 [00:10<00:00, 73.39it/s]
857
+
858
  94%|█████████▎| 814/869 [00:10<00:00, 75.71it/s]
859
+
860
  95%|█████████▍| 822/869 [00:10<00:00, 75.42it/s]
861
+
862
  96%|█████████▌| 831/869 [00:10<00:00, 76.65it/s]
863
+
864
  97%|█████████▋| 840/869 [00:10<00:00, 78.44it/s]
865
+
866
  98%|█████████▊| 849/869 [00:11<00:00, 80.04it/s]
867
+
868
  99%|█████████▊| 858/869 [00:11<00:00, 79.59it/s]
869
+
870
 
871
+
872
 
873
  10%|█ | 448/4480 [03:02<22:54, 2.93it/s]
874
+
875
+
876
  [INFO|trainer.py:3503] 2024-09-09 14:18:09,952 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-448
877
+ [INFO|configuration_utils.py:472] 2024-09-09 14:18:09,953 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-448/config.json
878
+ [INFO|modeling_utils.py:2799] 2024-09-09 14:18:10,847 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-448/model.safetensors
879
+ [INFO|tokenization_utils_base.py:2684] 2024-09-09 14:18:10,848 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-448/tokenizer_config.json
880
+ [INFO|tokenization_utils_base.py:2693] 2024-09-09 14:18:10,848 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-448/special_tokens_map.json
881
+ [INFO|tokenization_utils_base.py:2684] 2024-09-09 14:18:13,510 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json
882
+ [INFO|tokenization_utils_base.py:2693] 2024-09-09 14:18:13,510 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json
883
+
884
  10%|█ | 449/4480 [03:06<6:41:43, 5.98s/it]
885
  10%|█ | 450/4480 [03:06<4:51:00, 4.33s/it]
886
  10%|█ | 451/4480 [03:07<3:31:43, 3.15s/it]
887
  10%|█ | 452/4480 [03:07<2:36:10, 2.33s/it]
888
  10%|█ | 453/4480 [03:07<1:54:40, 1.71s/it]
889
  10%|█ | 454/4480 [03:08<1:28:07, 1.31s/it]
890
  10%|█ | 455/4480 [03:08<1:08:58, 1.03s/it]
891
  10%|█ | 456/4480 [03:08<53:19, 1.26it/s]
892
  10%|█ | 457/4480 [03:09<43:53, 1.53it/s]
893
  10%|█ | 458/4480 [03:09<37:31, 1.79it/s]
894
  10%|█ | 459/4480 [03:09<38:22, 1.75it/s]
895
  10%|█ | 460/4480 [03:10<33:39, 1.99it/s]
896
  10%|█ | 461/4480 [03:10<31:32, 2.12it/s]
897
  10%|█ | 462/4480 [03:11<28:45, 2.33it/s]
898
  10%|█ | 463/4480 [03:11<27:17, 2.45it/s]
899
  10%|█ | 464/4480 [03:11<26:13, 2.55it/s]
900
  10%|█ | 465/4480 [03:12<25:11, 2.66it/s]
901
  10%|█ | 466/4480 [03:12<23:50, 2.81it/s]
902
  10%|█ | 467/4480 [03:12<23:50, 2.81it/s]
903
  10%|█ | 468/4480 [03:13<27:53, 2.40it/s]
904
  10%|█ | 469/4480 [03:13<25:14, 2.65it/s]
905
  10%|█ | 470/4480 [03:13<24:07, 2.77it/s]
906
  11%|█ | 471/4480 [03:14<23:45, 2.81it/s]
907
  11%|█ | 472/4480 [03:14<23:26, 2.85it/s]
908
  11%|█ | 473/4480 [03:15<24:05, 2.77it/s]
909
  11%|█ | 474/4480 [03:15<24:20, 2.74it/s]
910
  11%|█ | 475/4480 [03:15<25:03, 2.66it/s]
911
  11%|█ | 476/4480 [03:16<23:49, 2.80it/s]
912
  11%|█ | 477/4480 [03:16<23:51, 2.80it/s]
913
  11%|█ | 478/4480 [03:16<22:26, 2.97it/s]
914
  11%|█ | 479/4480 [03:17<21:31, 3.10it/s]
915
  11%|█ | 480/4480 [03:17<21:46, 3.06it/s]
916
  11%|█ | 481/4480 [03:17<23:15, 2.87it/s]
917
  11%|█ | 482/4480 [03:18<24:33, 2.71it/s]
918
  11%|█ | 483/4480 [03:18<24:43, 2.69it/s]
919
  11%|█ | 484/4480 [03:18<25:12, 2.64it/s]
920
  11%|█ | 485/4480 [03:19<24:29, 2.72it/s]
921
  11%|█ | 486/4480 [03:19<27:55, 2.38it/s]
922
  11%|█ | 487/4480 [03:20<32:18, 2.06it/s]
923
  11%|█ | 488/4480 [03:20<31:42, 2.10it/s]
924
  11%|█ | 489/4480 [03:21<28:55, 2.30it/s]
925
  11%|█ | 490/4480 [03:21<27:55, 2.38it/s]
926
  11%|█ | 491/4480 [03:21<25:09, 2.64it/s]
927
  11%|█ | 492/4480 [03:22<24:27, 2.72it/s]
928
  11%|█ | 493/4480 [03:22<24:30, 2.71it/s]
929
  11%|█ | 494/4480 [03:23<23:53, 2.78it/s]
930
  11%|█ | 495/4480 [03:23<23:30, 2.82it/s]
931
  11%|█ | 496/4480 [03:23<23:04, 2.88it/s]
932
  11%|█ | 497/4480 [03:24<23:29, 2.82it/s]
933
  11%|█ | 498/4480 [03:24<23:06, 2.87it/s]
934
  11%|█ | 499/4480 [03:24<22:46, 2.91it/s]
935
  11%|█ | 500/4480 [03:25<27:16, 2.43it/s]
936
 
937
  11%|█ | 500/4480 [03:25<27:16, 2.43it/s]
938
  11%|█ | 501/4480 [03:25<31:27, 2.11it/s]
939
  11%|█ | 502/4480 [03:26<28:12, 2.35it/s]
940
  11%|█ | 503/4480 [03:26<26:23, 2.51it/s]
941
  11%|█▏ | 504/4480 [03:26<25:09, 2.63it/s]
942
  11%|█▏ | 505/4480 [03:27<24:50, 2.67it/s]
943
  11%|█▏ | 506/4480 [03:27<27:31, 2.41it/s]
944
  11%|█▏ | 507/4480 [03:28<24:50, 2.66it/s]
945
  11%|█▏ | 508/4480 [03:28<27:23, 2.42it/s]
946
  11%|█▏ | 509/4480 [03:28<24:41, 2.68it/s]
947
  11%|█▏ | 510/4480 [03:29<23:15, 2.85it/s]
948
  11%|█▏ | 511/4480 [03:29<22:12, 2.98it/s]
949
  11%|█▏ | 512/4480 [03:29<23:53, 2.77it/s]
950
  11%|█▏ | 513/4480 [03:30<22:50, 2.89it/s]
951
  11%|█▏ | 514/4480 [03:30<23:24, 2.82it/s]
952
  11%|█▏ | 515/4480 [03:30<21:48, 3.03it/s]
953
  12%|█▏ | 516/4480 [03:31<21:58, 3.01it/s]
954
  12%|█▏ | 517/4480 [03:31<21:40, 3.05it/s]
955
  12%|█▏ | 518/4480 [03:31<23:52, 2.77it/s]
956
  12%|█▏ | 519/4480 [03:32<22:42, 2.91it/s]
957
  12%|█▏ | 520/4480 [03:32<22:14, 2.97it/s]
958
  12%|█▏ | 521/4480 [03:32<21:35, 3.06it/s]
959
  12%|█▏ | 522/4480 [03:33<23:50, 2.77it/s]
960
  12%|█▏ | 523/4480 [03:33<24:23, 2.70it/s]
961
  12%|█▏ | 524/4480 [03:33<21:43, 3.03it/s]
962
  12%|█▏ | 525/4480 [03:34<23:16, 2.83it/s]
963
  12%|█▏ | 526/4480 [03:34<23:03, 2.86it/s]
964
  12%|█▏ | 527/4480 [03:34<22:30, 2.93it/s]
965
  12%|█▏ | 528/4480 [03:35<21:39, 3.04it/s]
966
  12%|█▏ | 529/4480 [03:35<23:01, 2.86it/s]
967
  12%|█▏ | 530/4480 [03:36<23:29, 2.80it/s]
968
  12%|█▏ | 531/4480 [03:36<25:11, 2.61it/s]
969
  12%|█▏ | 532/4480 [03:36<24:50, 2.65it/s]
970
  12%|█▏ | 533/4480 [03:37<28:27, 2.31it/s]
971
  12%|█▏ | 534/4480 [03:37<27:49, 2.36it/s]
972
  12%|█▏ | 535/4480 [03:38<27:50, 2.36it/s]
973
  12%|█▏ | 536/4480 [03:38<25:21, 2.59it/s]
974
  12%|█▏ | 537/4480 [03:38<26:08, 2.51it/s]
975
  12%|█▏ | 538/4480 [03:39<25:05, 2.62it/s]
976
  12%|█▏ | 539/4480 [03:39<25:29, 2.58it/s]
977
  12%|█▏ | 540/4480 [03:40<25:05, 2.62it/s]
978
  12%|█▏ | 541/4480 [03:40<24:07, 2.72it/s]
979
  12%|█▏ | 542/4480 [03:40<22:54, 2.86it/s]
980
  12%|█▏ | 543/4480 [03:41<21:59, 2.98it/s]
981
  12%|█▏ | 544/4480 [03:41<25:18, 2.59it/s]
982
  12%|█▏ | 545/4480 [03:41<25:08, 2.61it/s]
983
  12%|█▏ | 546/4480 [03:42<27:46, 2.36it/s]
984
  12%|█▏ | 547/4480 [03:42<26:14, 2.50it/s]
985
  12%|█▏ | 548/4480 [03:43<25:27, 2.57it/s]
986
  12%|█▏ | 549/4480 [03:43<26:18, 2.49it/s]
987
  12%|█▏ | 550/4480 [03:44<28:02, 2.34it/s]
988
  12%|█▏ | 551/4480 [03:44<27:01, 2.42it/s]
989
  12%|█▏ | 552/4480 [03:44<29:30, 2.22it/s]
990
  12%|█▏ | 553/4480 [03:45<26:33, 2.46it/s]
991
  12%|█▏ | 554/4480 [03:45<24:58, 2.62it/s]
992
  12%|█▏ | 555/4480 [03:45<23:37, 2.77it/s]
993
  12%|█▏ | 556/4480 [03:46<25:37, 2.55it/s]
994
  12%|█▏ | 557/4480 [03:46<24:21, 2.68it/s]
995
  12%|█▏ | 558/4480 [03:46<22:27, 2.91it/s]
996
  12%|█▏ | 559/4480 [03:47<21:36, 3.02it/s]
997
  12%|█▎ | 560/4480 [03:47<21:46, 3.00it/s]
998
  13%|█▎ | 561/4480 [03:47<22:41, 2.88it/s]
999
  13%|█▎ | 562/4480 [03:48<23:15, 2.81it/s]
1000
  13%|█▎ | 563/4480 [03:49<29:23, 2.22it/s]
1001
  13%|█▎ | 564/4480 [03:49<28:08, 2.32it/s]
1002
  13%|█▎ | 565/4480 [03:49<28:23, 2.30it/s]
1003
  13%|█▎ | 566/4480 [03:50<26:58, 2.42it/s]
1004
  13%|█▎ | 567/4480 [03:50<27:07, 2.40it/s]
1005
  13%|█▎ | 568/4480 [03:51<26:20, 2.48it/s]
1006
  13%|█▎ | 569/4480 [03:51<25:58, 2.51it/s]
1007
  13%|█▎ | 570/4480 [03:51<23:38, 2.76it/s]
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9.989615784008308,
3
+ "total_flos": 1.3132946802550608e+16,
4
+ "train_loss": 0.0027612092573652642,
5
+ "train_runtime": 2084.9871,
6
+ "train_samples": 30812,
7
+ "train_samples_per_second": 147.78,
8
+ "train_steps_per_second": 2.307
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,225 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9323447636700648,
3
+ "best_model_checkpoint": "/content/dissertation/scripts/ner/output/checkpoint-4333",
4
+ "epoch": 9.989615784008308,
5
+ "eval_steps": 500,
6
+ "global_step": 4810,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.9989615784008308,
13
+ "eval_accuracy": 0.9987441743644127,
14
+ "eval_f1": 0.9291628334866606,
15
+ "eval_loss": 0.004182814620435238,
16
+ "eval_precision": 0.9173478655767484,
17
+ "eval_recall": 0.9412861136999068,
18
+ "eval_runtime": 15.1684,
19
+ "eval_samples_per_second": 457.925,
20
+ "eval_steps_per_second": 57.29,
21
+ "step": 481
22
+ },
23
+ {
24
+ "epoch": 1.0384215991692627,
25
+ "grad_norm": 0.07515838742256165,
26
+ "learning_rate": 4.48024948024948e-05,
27
+ "loss": 0.0156,
28
+ "step": 500
29
+ },
30
+ {
31
+ "epoch": 2.0,
32
+ "eval_accuracy": 0.9986464990372004,
33
+ "eval_f1": 0.9189439555349699,
34
+ "eval_loss": 0.004935940261930227,
35
+ "eval_precision": 0.9134438305709024,
36
+ "eval_recall": 0.9245107176141659,
37
+ "eval_runtime": 15.18,
38
+ "eval_samples_per_second": 457.575,
39
+ "eval_steps_per_second": 57.246,
40
+ "step": 963
41
+ },
42
+ {
43
+ "epoch": 2.0768431983385254,
44
+ "grad_norm": 0.005299085285514593,
45
+ "learning_rate": 3.9604989604989604e-05,
46
+ "loss": 0.0039,
47
+ "step": 1000
48
+ },
49
+ {
50
+ "epoch": 2.9989615784008308,
51
+ "eval_accuracy": 0.9985627773281612,
52
+ "eval_f1": 0.9191873589164785,
53
+ "eval_loss": 0.005292736925184727,
54
+ "eval_precision": 0.8914185639229422,
55
+ "eval_recall": 0.9487418452935694,
56
+ "eval_runtime": 15.1155,
57
+ "eval_samples_per_second": 459.529,
58
+ "eval_steps_per_second": 57.491,
59
+ "step": 1444
60
+ },
61
+ {
62
+ "epoch": 3.115264797507788,
63
+ "grad_norm": 0.06427361071109772,
64
+ "learning_rate": 3.4407484407484405e-05,
65
+ "loss": 0.0024,
66
+ "step": 1500
67
+ },
68
+ {
69
+ "epoch": 4.0,
70
+ "eval_accuracy": 0.9984720788100354,
71
+ "eval_f1": 0.9167412712623096,
72
+ "eval_loss": 0.0061088865622878075,
73
+ "eval_precision": 0.8819982773471146,
74
+ "eval_recall": 0.9543336439888164,
75
+ "eval_runtime": 15.4198,
76
+ "eval_samples_per_second": 450.46,
77
+ "eval_steps_per_second": 56.356,
78
+ "step": 1926
79
+ },
80
+ {
81
+ "epoch": 4.153686396677051,
82
+ "grad_norm": 0.04428843781352043,
83
+ "learning_rate": 2.920997920997921e-05,
84
+ "loss": 0.0017,
85
+ "step": 2000
86
+ },
87
+ {
88
+ "epoch": 4.998961578400831,
89
+ "eval_accuracy": 0.9986046381826807,
90
+ "eval_f1": 0.9254284390921722,
91
+ "eval_loss": 0.007444376591593027,
92
+ "eval_precision": 0.919889502762431,
93
+ "eval_recall": 0.9310344827586207,
94
+ "eval_runtime": 15.1205,
95
+ "eval_samples_per_second": 459.377,
96
+ "eval_steps_per_second": 57.472,
97
+ "step": 2407
98
+ },
99
+ {
100
+ "epoch": 5.192107995846314,
101
+ "grad_norm": 0.004208261147141457,
102
+ "learning_rate": 2.4012474012474013e-05,
103
+ "loss": 0.0011,
104
+ "step": 2500
105
+ },
106
+ {
107
+ "epoch": 6.0,
108
+ "eval_accuracy": 0.9985767309463344,
109
+ "eval_f1": 0.9266943291839557,
110
+ "eval_loss": 0.007942954078316689,
111
+ "eval_precision": 0.916970802919708,
112
+ "eval_recall": 0.9366262814538676,
113
+ "eval_runtime": 15.1887,
114
+ "eval_samples_per_second": 457.314,
115
+ "eval_steps_per_second": 57.214,
116
+ "step": 2889
117
+ },
118
+ {
119
+ "epoch": 6.230529595015576,
120
+ "grad_norm": 0.004876282997429371,
121
+ "learning_rate": 1.8814968814968818e-05,
122
+ "loss": 0.0007,
123
+ "step": 3000
124
+ },
125
+ {
126
+ "epoch": 6.998961578400831,
127
+ "eval_accuracy": 0.9986744062735468,
128
+ "eval_f1": 0.9254004576659038,
129
+ "eval_loss": 0.006659395061433315,
130
+ "eval_precision": 0.9091726618705036,
131
+ "eval_recall": 0.9422180801491147,
132
+ "eval_runtime": 15.1599,
133
+ "eval_samples_per_second": 458.182,
134
+ "eval_steps_per_second": 57.322,
135
+ "step": 3370
136
+ },
137
+ {
138
+ "epoch": 7.268951194184839,
139
+ "grad_norm": 0.0032651671208441257,
140
+ "learning_rate": 1.3617463617463619e-05,
141
+ "loss": 0.0005,
142
+ "step": 3500
143
+ },
144
+ {
145
+ "epoch": 8.0,
146
+ "eval_accuracy": 0.9986674294644602,
147
+ "eval_f1": 0.9275092936802974,
148
+ "eval_loss": 0.007326104678213596,
149
+ "eval_precision": 0.9249304911955515,
150
+ "eval_recall": 0.9301025163094129,
151
+ "eval_runtime": 15.1332,
152
+ "eval_samples_per_second": 458.991,
153
+ "eval_steps_per_second": 57.423,
154
+ "step": 3852
155
+ },
156
+ {
157
+ "epoch": 8.307372793354102,
158
+ "grad_norm": 0.0013715826207771897,
159
+ "learning_rate": 8.419958419958421e-06,
160
+ "loss": 0.0004,
161
+ "step": 4000
162
+ },
163
+ {
164
+ "epoch": 8.99896157840083,
165
+ "eval_accuracy": 0.9987162671280663,
166
+ "eval_f1": 0.9323447636700648,
167
+ "eval_loss": 0.008018395863473415,
168
+ "eval_precision": 0.9271889400921659,
169
+ "eval_recall": 0.9375582479030755,
170
+ "eval_runtime": 15.4151,
171
+ "eval_samples_per_second": 450.598,
172
+ "eval_steps_per_second": 56.373,
173
+ "step": 4333
174
+ },
175
+ {
176
+ "epoch": 9.345794392523365,
177
+ "grad_norm": 0.005300257820636034,
178
+ "learning_rate": 3.2224532224532228e-06,
179
+ "loss": 0.0002,
180
+ "step": 4500
181
+ },
182
+ {
183
+ "epoch": 9.989615784008308,
184
+ "eval_accuracy": 0.9987092903189797,
185
+ "eval_f1": 0.9315448658649399,
186
+ "eval_loss": 0.007857992313802242,
187
+ "eval_precision": 0.9247015610651974,
188
+ "eval_recall": 0.9384902143522833,
189
+ "eval_runtime": 15.1843,
190
+ "eval_samples_per_second": 457.447,
191
+ "eval_steps_per_second": 57.23,
192
+ "step": 4810
193
+ },
194
+ {
195
+ "epoch": 9.989615784008308,
196
+ "step": 4810,
197
+ "total_flos": 1.3132946802550608e+16,
198
+ "train_loss": 0.0027612092573652642,
199
+ "train_runtime": 2084.9871,
200
+ "train_samples_per_second": 147.78,
201
+ "train_steps_per_second": 2.307
202
+ }
203
+ ],
204
+ "logging_steps": 500,
205
+ "max_steps": 4810,
206
+ "num_input_tokens_seen": 0,
207
+ "num_train_epochs": 10,
208
+ "save_steps": 500,
209
+ "stateful_callbacks": {
210
+ "TrainerControl": {
211
+ "args": {
212
+ "should_epoch_stop": false,
213
+ "should_evaluate": false,
214
+ "should_log": false,
215
+ "should_save": true,
216
+ "should_training_stop": true
217
+ },
218
+ "attributes": {}
219
+ }
220
+ },
221
+ "total_flos": 1.3132946802550608e+16,
222
+ "train_batch_size": 32,
223
+ "trial_name": null,
224
+ "trial_params": null
225
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13556e6c97b2f39e25d5830ab0bc61ce81f807bcf643d150d23dd97c2f606c57
3
+ size 5240
vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.txt ADDED
The diff for this file is too large to render. See raw diff