YooSungHyun committed on
Commit
3b5ca91
•
1 Parent(s): 25d4c6f
README.md ADDED
@@ -0,0 +1,51 @@
+ ---
+ language:
+ - ko
+ metrics:
+ - accuracy
+ pipeline_tag: text-classification
+
+ # Optional. Add this if you want to encode your eval results in a structured way.
+ model-index:
+ - name: ko-answerable
+   results:
+   - task:
+       type: text-classification # Required. Example: automatic-speech-recognition
+       name: text-classification # Optional. Example: Speech Recognition
+     metrics:
+     - type: eval_accuracy
+       value: 0.892
+       name: eval_accuracy
+       verified: false
+     - type: test_accuracy
+       value: 0.837
+       name: test_accuracy
+       verified: false
+ ---
+ # ko-answerable: binary classification of whether a Question can be answered from a Passage
+
+ ## Model Details
+
+ This model was inspired by the answerability model in SelfCheckGPT (https://arxiv.org/abs/2303.08896).
+
+ It was fine-tuned from [monologg/kobigbird-bert-base](https://huggingface.co/monologg/kobigbird-bert-base) as a [BigBirdForSequenceClassification](https://huggingface.co/docs/transformers/v4.33.0/en/model_doc/big_bird#transformers.BigBirdForSequenceClassification).
+
+ Max Seq Len: 4096
+
+ Input Text Style: \<BOS\>Question\<SEP\>Title\<SEP\>Passage\<EOS\>
+
+ Return: 1 = not answerable, 0 = answerable (the sigmoid score can also be used)
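+
+ A minimal inference sketch (assumptions: the checkpoint is loaded by its repo id, written here as `YooSungHyun/ko-answerable`, and the input is assembled by hand in the layout above; softmax over the two logits is used as the score):
+
+ ```python
+ import torch
+ from transformers import AutoModelForSequenceClassification, AutoTokenizer
+
+ repo_id = "YooSungHyun/ko-answerable"  # assumed repo id
+ tokenizer = AutoTokenizer.from_pretrained(repo_id)
+ model = AutoModelForSequenceClassification.from_pretrained(repo_id)
+ model.eval()
+
+ question = "Who wrote the passage?"
+ title = "Example title"
+ passage = "Example passage text..."
+
+ # Assemble the documented layout: <BOS>Question<SEP>Title<SEP>Passage<EOS>
+ text = (f"{tokenizer.bos_token}{question}{tokenizer.sep_token}"
+         f"{title}{tokenizer.sep_token}{passage}{tokenizer.eos_token}")
+ inputs = tokenizer(text, add_special_tokens=False, truncation=True,
+                    max_length=4096, return_tensors="pt")
+
+ with torch.no_grad():
+     logits = model(**inputs).logits  # shape (1, 2); label 1 = not answerable
+
+ score = torch.softmax(logits, dim=-1)[0, 1].item()
+ print(f"P(not answerable) = {score:.3f}")
+ ```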
+
+ Datasets used (from each dataset, examples were randomly sampled at a 50:50 ratio on 'is_impossible' so that the 0/1 labels are balanced; see the sketch below this list):
+
+ 1. KLUE
+ 2. AIHub - book-material machine reading comprehension
+ 3. AIHub - news-article machine reading comprehension
+ 4. AIHub - administrative-document machine reading comprehension
+ 5. Table-based question answering data (received personally from Matthew)
+
+ An `AIHub - machine reading comprehension` dataset also exists, but it was excluded because its structure differs enough to make preprocessing complicated.
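+
+ A sketch of the 50:50 sampling described above (the `is_impossible` field follows the SQuAD-style schema these datasets share; the surrounding loading code is an assumption):
+
+ ```python
+ import random
+
+ def balance_by_is_impossible(examples, seed=42):
+     """Downsample so is_impossible=True (label 1) and
+     is_impossible=False (label 0) end up 50:50."""
+     impossible = [e for e in examples if e["is_impossible"]]
+     answerable = [e for e in examples if not e["is_impossible"]]
+     n = min(len(impossible), len(answerable))
+     rng = random.Random(seed)
+     balanced = rng.sample(impossible, n) + rng.sample(answerable, n)
+     rng.shuffle(balanced)
+     return balanced
+ ```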
+
+ Prediction time: under 0.05 seconds per example on average (on an RTX 3090)
+
+ GPU memory used: about 20 GB (usage grows considerably with long sequences)
all_results.json ADDED
@@ -0,0 +1,7 @@
+ {
+     "epoch": 10.0,
+     "train_loss": 0.07339318460044116,
+     "train_runtime": 488254.3014,
+     "train_samples_per_second": 19.153,
+     "train_steps_per_second": 0.299
+ }
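Back-of-envelope figures derived from the stats above: 488,254 s of training is about 5.7 days; 19.153 samples/s × 488,254 s ≈ 9.35 M samples across 10 epochs, i.e. roughly 935 K examples per epoch; and 19.153 samples/s ÷ 0.299 steps/s ≈ 64, suggesting an effective batch size of about 64.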
config.json ADDED
@@ -0,0 +1,36 @@
+ {
+   "_name_or_path": "monologg/kobigbird-bert-base",
+   "architectures": [
+     "BigBirdForSequenceClassification"
+   ],
+   "attention_probs_dropout_prob": 0.1,
+   "attention_type": "original_full",
+   "block_size": 64,
+   "bos_token_id": 5,
+   "classifier_dropout": null,
+   "eos_token_id": 6,
+   "gradient_checkpointing": false,
+   "hidden_act": "gelu_new",
+   "hidden_dropout_prob": 0.1,
+   "hidden_size": 768,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "layer_norm_eps": 1e-12,
+   "max_position_embeddings": 4096,
+   "model_type": "big_bird",
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "num_random_blocks": 3,
+   "pad_token_id": 0,
+   "position_embedding_type": "absolute",
+   "problem_type": "single_label_classification",
+   "rescale_embeddings": false,
+   "sep_token_id": 3,
+   "tokenizer_class": "BertTokenizer",
+   "torch_dtype": "float32",
+   "transformers_version": "4.32.0",
+   "type_vocab_size": 2,
+   "use_bias": true,
+   "use_cache": true,
+   "vocab_size": 32500
+ }
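One detail worth noting in this config: `attention_type` is `"original_full"`, so all 4096 positions attend densely, which matches the ~20 GB memory figure in the README. A hedged sketch of loading the checkpoint with BigBird's block-sparse attention instead (repo id assumed; sparse attention can change outputs slightly, so accuracy should be re-checked):

```python
from transformers import AutoModelForSequenceClassification

# Assumption: override the config's attention_type at load time.
# BigBird supports "original_full" (dense) and "block_sparse"
# (sparse; much lower memory on long sequences).
model = AutoModelForSequenceClassification.from_pretrained(
    "YooSungHyun/ko-answerable",  # assumed repo id
    attention_type="block_sparse",
)
```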
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d6d0e8c491d76d948cc56b8a8b5b76a6e01f4a28951fde29001066d70afb4b37
+ size 457450105
special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
+ {
+   "bos_token": "<s>",
+   "cls_token": "[CLS]",
+   "eos_token": "</s>",
+   "mask_token": "[MASK]",
+   "pad_token": "[PAD]",
+   "sep_token": "[SEP]",
+   "unk_token": "[UNK]"
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,17 @@
+ {
+   "bos_token": "<s>",
+   "clean_up_tokenization_spaces": true,
+   "cls_token": "[CLS]",
+   "do_basic_tokenize": true,
+   "do_lower_case": false,
+   "eos_token": "</s>",
+   "mask_token": "[MASK]",
+   "model_max_length": 4096,
+   "never_split": null,
+   "pad_token": "[PAD]",
+   "sep_token": "[SEP]",
+   "strip_accents": null,
+   "tokenize_chinese_chars": true,
+   "tokenizer_class": "BertTokenizer",
+   "unk_token": "[UNK]"
+ }
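A quick sanity check that the tokenizer's special tokens line up with the IDs declared in config.json (`bos_token_id: 5`, `sep_token_id: 3`, `eos_token_id: 6`); repo id again assumed:

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("YooSungHyun/ko-answerable")  # assumed repo id

# Expected per config.json: <s> -> 5, [SEP] -> 3, </s> -> 6
for tok in (tokenizer.bos_token, tokenizer.sep_token, tokenizer.eos_token):
    print(tok, tokenizer.convert_tokens_to_ids(tok))
```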
vocab.txt ADDED
The diff for this file is too large to render. See raw diff