joshuaphua committed on
Commit
8ec2bc2
1 Parent(s): 3c8b334

Training in progress, epoch 1

Browse files
Files changed (5) hide show
  1. README.md +11 -11
  2. config.json +13 -1
  3. pytorch_model.bin +2 -2
  4. tokenizer_config.json +1 -0
  5. training_args.bin +1 -1
README.md CHANGED
@@ -25,16 +25,16 @@ model-index:
25
  metrics:
26
  - name: Precision
27
  type: precision
28
- value: 0.8764705882352941
29
  - name: Recall
30
  type: recall
31
- value: 0.8969546742209632
32
  - name: F1
33
  type: f1
34
- value: 0.8865943297164859
35
  - name: Accuracy
36
  type: accuracy
37
- value: 0.975923333692258
38
  ---
39
 
40
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -44,11 +44,11 @@ should probably proofread and complete it, then remove this comment. -->
44
 
45
  This model is a fine-tuned version of [dslim/distilbert-NER](https://huggingface.co/dslim/distilbert-NER) on the conll2003 dataset.
46
  It achieves the following results on the evaluation set:
47
- - Loss: 0.1908
48
- - Precision: 0.8765
49
- - Recall: 0.8970
50
- - F1: 0.8866
51
- - Accuracy: 0.9759
52
 
53
  ## Model description
54
 
@@ -79,8 +79,8 @@ The following hyperparameters were used during training:
79
 
80
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
81
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
82
- | 0.0568 | 1.0 | 3922 | 0.1877 | 0.8678 | 0.8893 | 0.8785 | 0.9740 |
83
- | 0.0314 | 2.0 | 7844 | 0.1908 | 0.8765 | 0.8970 | 0.8866 | 0.9759 |
84
 
85
 
86
  ### Framework versions
 
25
  metrics:
26
  - name: Precision
27
  type: precision
28
+ value: 0.8488967343336276
29
  - name: Recall
30
  type: recall
31
+ value: 0.8514518413597734
32
  - name: F1
33
  type: f1
34
+ value: 0.8501723680721294
35
  - name: Accuracy
36
  type: accuracy
37
+ value: 0.9675675675675676
38
  ---
39
 
40
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
44
 
45
  This model is a fine-tuned version of [dslim/distilbert-NER](https://huggingface.co/dslim/distilbert-NER) on the conll2003 dataset.
46
  It achieves the following results on the evaluation set:
47
+ - Loss: nan
48
+ - Precision: 0.8489
49
+ - Recall: 0.8515
50
+ - F1: 0.8502
51
+ - Accuracy: 0.9676
52
 
53
  ## Model description
54
 
 
79
 
80
  | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 | Accuracy |
81
  |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
82
+ | 0.0773 | 1.0 | 3922 | nan | 0.8505 | 0.8461 | 0.8483 | 0.9668 |
83
+ | 0.0487 | 2.0 | 7844 | nan | 0.8489 | 0.8515 | 0.8502 | 0.9676 |
84
 
85
 
86
  ### Framework versions
config.json CHANGED
@@ -17,18 +17,30 @@
17
  "5": "B-LOC",
18
  "6": "I-LOC",
19
  "7": "B-MISC",
20
- "8": "I-MISC"
 
 
 
 
 
 
21
  },
22
  "initializer_range": 0.02,
23
  "label2id": {
 
24
  "B-LOC": 5,
 
25
  "B-MISC": 7,
26
  "B-ORG": 3,
27
  "B-PER": 1,
 
 
28
  "I-LOC": 6,
 
29
  "I-MISC": 8,
30
  "I-ORG": 4,
31
  "I-PER": 2,
 
32
  "O": 0
33
  },
34
  "max_position_embeddings": 512,
 
17
  "5": "B-LOC",
18
  "6": "I-LOC",
19
  "7": "B-MISC",
20
+ "8": "I-MISC",
21
+ "9": "B-JOB",
22
+ "10": "I-JOB",
23
+ "11": "B-MAJ",
24
+ "12": "I-MAJ",
25
+ "13": "B-SKILL",
26
+ "14": "I-SKILL"
27
  },
28
  "initializer_range": 0.02,
29
  "label2id": {
30
+ "B-JOB": 9,
31
  "B-LOC": 5,
32
+ "B-MAJ": 11,
33
  "B-MISC": 7,
34
  "B-ORG": 3,
35
  "B-PER": 1,
36
+ "B-SKILL": 13,
37
+ "I-JOB": 10,
38
  "I-LOC": 6,
39
+ "I-MAJ": 12,
40
  "I-MISC": 8,
41
  "I-ORG": 4,
42
  "I-PER": 2,
43
+ "I-SKILL": 14,
44
  "O": 0
45
  },
46
  "max_position_embeddings": 512,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08123b2ccbb1766e374a7117a9d612fc6de821d99a70a6dd5a802a9a896656a6
3
- size 260825186
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f48f65569c6d4d2debaefcefa7094a70189a3b1ec61489ef18523d684837010c
3
+ size 260843682
tokenizer_config.json CHANGED
@@ -45,6 +45,7 @@
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": false,
47
  "do_lower_case": false,
 
48
  "mask_token": "[MASK]",
49
  "max_length": 512,
50
  "model_max_length": 512,
 
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": false,
47
  "do_lower_case": false,
48
+ "ignore_mismatched_sizes": true,
49
  "mask_token": "[MASK]",
50
  "max_length": 512,
51
  "model_max_length": 512,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5dc0ef45ea2eb42c6608e194b3813cc705419c2bd0159649d14f608688f4fd3
3
  size 4472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ccaef9483fc239c2eab3324b34ce65e985a51200fb7d2254edabd926c3451b8
3
  size 4472