TusharGoel committed on
Commit
92c150b
1 Parent(s): b1b8035

Upload 8 files

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "SCUT-DLVCLab/lilt-roberta-en-base",
3
  "architectures": [
4
  "LiltForQuestionAnswering"
5
  ],
 
1
  {
2
+ "_name_or_path": "TusharGoel/LiLT-Document-QA",
3
  "architectures": [
4
  "LiltForQuestionAnswering"
5
  ],
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af19cb0323181b284410f1a59cdcac62819016be9732a0f20c419a6488310f8e
3
  size 520801357
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e47d071230ebb0bb43143469a7ec5cf4f2c16d2dffa29200af02bba9d1ae247
3
  size 520801357
special_tokens_map.json CHANGED
@@ -1,4 +1,11 @@
1
  {
 
 
 
 
 
 
 
2
  "bos_token": "<s>",
3
  "cls_token": "<s>",
4
  "eos_token": "</s>",
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>",
4
+ "<pad>",
5
+ "</s>",
6
+ "<unk>",
7
+ "<mask>"
8
+ ],
9
  "bos_token": "<s>",
10
  "cls_token": "<s>",
11
  "eos_token": "</s>",
tokenizer.json CHANGED
@@ -23,7 +23,7 @@
23
  "single_word": false,
24
  "lstrip": false,
25
  "rstrip": false,
26
- "normalized": true,
27
  "special": true
28
  },
29
  {
@@ -32,7 +32,7 @@
32
  "single_word": false,
33
  "lstrip": false,
34
  "rstrip": false,
35
- "normalized": true,
36
  "special": true
37
  },
38
  {
@@ -41,7 +41,7 @@
41
  "single_word": false,
42
  "lstrip": false,
43
  "rstrip": false,
44
- "normalized": true,
45
  "special": true
46
  },
47
  {
@@ -50,16 +50,16 @@
50
  "single_word": false,
51
  "lstrip": false,
52
  "rstrip": false,
53
- "normalized": true,
54
  "special": true
55
  },
56
  {
57
  "id": 50264,
58
  "content": "<mask>",
59
  "single_word": false,
60
- "lstrip": true,
61
  "rstrip": false,
62
- "normalized": true,
63
  "special": true
64
  }
65
  ],
 
23
  "single_word": false,
24
  "lstrip": false,
25
  "rstrip": false,
26
+ "normalized": false,
27
  "special": true
28
  },
29
  {
 
32
  "single_word": false,
33
  "lstrip": false,
34
  "rstrip": false,
35
+ "normalized": false,
36
  "special": true
37
  },
38
  {
 
41
  "single_word": false,
42
  "lstrip": false,
43
  "rstrip": false,
44
+ "normalized": false,
45
  "special": true
46
  },
47
  {
 
50
  "single_word": false,
51
  "lstrip": false,
52
  "rstrip": false,
53
+ "normalized": false,
54
  "special": true
55
  },
56
  {
57
  "id": 50264,
58
  "content": "<mask>",
59
  "single_word": false,
60
+ "lstrip": false,
61
  "rstrip": false,
62
+ "normalized": false,
63
  "special": true
64
  }
65
  ],
tokenizer_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "0": {
5
  "content": "<s>",
6
  "lstrip": false,
7
- "normalized": true,
8
  "rstrip": false,
9
  "single_word": false,
10
  "special": true
@@ -12,7 +12,7 @@
12
  "1": {
13
  "content": "<pad>",
14
  "lstrip": false,
15
- "normalized": true,
16
  "rstrip": false,
17
  "single_word": false,
18
  "special": true
@@ -20,7 +20,7 @@
20
  "2": {
21
  "content": "</s>",
22
  "lstrip": false,
23
- "normalized": true,
24
  "rstrip": false,
25
  "single_word": false,
26
  "special": true
@@ -28,21 +28,27 @@
28
  "3": {
29
  "content": "<unk>",
30
  "lstrip": false,
31
- "normalized": true,
32
  "rstrip": false,
33
  "single_word": false,
34
  "special": true
35
  },
36
  "50264": {
37
  "content": "<mask>",
38
- "lstrip": true,
39
- "normalized": true,
40
  "rstrip": false,
41
  "single_word": false,
42
  "special": true
43
  }
44
  },
45
- "additional_special_tokens": [],
 
 
 
 
 
 
46
  "bos_token": "<s>",
47
  "clean_up_tokenization_spaces": true,
48
  "cls_token": "<s>",
@@ -55,8 +61,10 @@
55
  "eos_token": "</s>",
56
  "errors": "replace",
57
  "mask_token": "<mask>",
 
58
  "model_max_length": 512,
59
  "only_label_first_subword": true,
 
60
  "pad_token": "<pad>",
61
  "pad_token_box": [
62
  0,
@@ -65,6 +73,8 @@
65
  0
66
  ],
67
  "pad_token_label": -100,
 
 
68
  "sep_token": "</s>",
69
  "sep_token_box": [
70
  0,
@@ -72,7 +82,10 @@
72
  0,
73
  0
74
  ],
 
75
  "tokenizer_class": "LayoutLMv3Tokenizer",
76
  "trim_offsets": true,
 
 
77
  "unk_token": "<unk>"
78
  }
 
4
  "0": {
5
  "content": "<s>",
6
  "lstrip": false,
7
+ "normalized": false,
8
  "rstrip": false,
9
  "single_word": false,
10
  "special": true
 
12
  "1": {
13
  "content": "<pad>",
14
  "lstrip": false,
15
+ "normalized": false,
16
  "rstrip": false,
17
  "single_word": false,
18
  "special": true
 
20
  "2": {
21
  "content": "</s>",
22
  "lstrip": false,
23
+ "normalized": false,
24
  "rstrip": false,
25
  "single_word": false,
26
  "special": true
 
28
  "3": {
29
  "content": "<unk>",
30
  "lstrip": false,
31
+ "normalized": false,
32
  "rstrip": false,
33
  "single_word": false,
34
  "special": true
35
  },
36
  "50264": {
37
  "content": "<mask>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
  "rstrip": false,
41
  "single_word": false,
42
  "special": true
43
  }
44
  },
45
+ "additional_special_tokens": [
46
+ "<s>",
47
+ "<pad>",
48
+ "</s>",
49
+ "<unk>",
50
+ "<mask>"
51
+ ],
52
  "bos_token": "<s>",
53
  "clean_up_tokenization_spaces": true,
54
  "cls_token": "<s>",
 
61
  "eos_token": "</s>",
62
  "errors": "replace",
63
  "mask_token": "<mask>",
64
+ "max_length": 512,
65
  "model_max_length": 512,
66
  "only_label_first_subword": true,
67
+ "pad_to_multiple_of": null,
68
  "pad_token": "<pad>",
69
  "pad_token_box": [
70
  0,
 
73
  0
74
  ],
75
  "pad_token_label": -100,
76
+ "pad_token_type_id": 0,
77
+ "padding_side": "right",
78
  "sep_token": "</s>",
79
  "sep_token_box": [
80
  0,
 
82
  0,
83
  0
84
  ],
85
+ "stride": 0,
86
  "tokenizer_class": "LayoutLMv3Tokenizer",
87
  "trim_offsets": true,
88
+ "truncation_side": "right",
89
+ "truncation_strategy": "only_second",
90
  "unk_token": "<unk>"
91
  }