djsull committed on
Commit
7db1edf
·
verified ·
1 Parent(s): f880627

djsull/sent_classification

Browse files
README.md CHANGED
@@ -1,6 +1,7 @@
1
  ---
2
  library_name: transformers
3
- base_model: klue/roberta-base
 
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -15,14 +16,14 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # aha_sentence_classification
17
 
18
- This model is a fine-tuned version of [klue/roberta-base](https://huggingface.co/klue/roberta-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.8977
21
- - Accuracy: 0.6701
22
- - F1 Micro: 0.6701
23
- - F1 Macro: 0.6301
24
- - Precision Macro: 0.5833
25
- - Recall Macro: 0.7331
26
 
27
  ## Model description
28
 
@@ -54,16 +55,16 @@ The following hyperparameters were used during training:
54
 
55
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 Micro | F1 Macro | Precision Macro | Recall Macro |
56
  |:-------------:|:------:|:-----:|:---------------:|:--------:|:--------:|:--------:|:---------------:|:------------:|
57
- | 1.3115 | 0.5949 | 1000 | 1.3492 | 0.5285 | 0.5285 | 0.5233 | 0.5079 | 0.6638 |
58
- | 0.9152 | 1.1898 | 2000 | 1.0651 | 0.6243 | 0.6243 | 0.6065 | 0.5681 | 0.7156 |
59
- | 0.8716 | 1.7847 | 3000 | 1.0069 | 0.6374 | 0.6374 | 0.6044 | 0.5635 | 0.7218 |
60
- | 0.7678 | 2.3795 | 4000 | 0.9808 | 0.6293 | 0.6293 | 0.6154 | 0.5790 | 0.7316 |
61
- | 0.7341 | 2.9744 | 5000 | 0.8977 | 0.6701 | 0.6701 | 0.6301 | 0.5833 | 0.7331 |
62
- | 0.6194 | 3.5693 | 6000 | 0.9595 | 0.6499 | 0.6499 | 0.6221 | 0.5894 | 0.7091 |
63
- | 0.4718 | 4.1642 | 7000 | 0.9216 | 0.6731 | 0.6731 | 0.6361 | 0.6053 | 0.6995 |
64
- | 0.4739 | 4.7591 | 8000 | 0.9148 | 0.6739 | 0.6739 | 0.6484 | 0.6171 | 0.7059 |
65
- | 0.433 | 5.3540 | 9000 | 1.0006 | 0.6616 | 0.6616 | 0.6298 | 0.5953 | 0.7092 |
66
- | 0.3989 | 5.9488 | 10000 | 0.9988 | 0.6626 | 0.6626 | 0.6412 | 0.6157 | 0.7024 |
67
 
68
 
69
  ### Framework versions
 
1
  ---
2
  library_name: transformers
3
+ license: apache-2.0
4
+ base_model: skt/A.X-Encoder-base
5
  tags:
6
  - generated_from_trainer
7
  metrics:
 
16
 
17
  # aha_sentence_classification
18
 
19
+ This model is a fine-tuned version of [skt/A.X-Encoder-base](https://huggingface.co/skt/A.X-Encoder-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.8454
22
+ - Accuracy: 0.6900
23
+ - F1 Micro: 0.6900
24
+ - F1 Macro: 0.6503
25
+ - Precision Macro: 0.6078
26
+ - Recall Macro: 0.7221
27
 
28
  ## Model description
29
 
 
55
 
56
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 Micro | F1 Macro | Precision Macro | Recall Macro |
57
  |:-------------:|:------:|:-----:|:---------------:|:--------:|:--------:|:--------:|:---------------:|:------------:|
58
+ | 0.9702 | 0.5949 | 1000 | 1.1520 | 0.5590 | 0.5590 | 0.5444 | 0.5142 | 0.6791 |
59
+ | 0.7293 | 1.1898 | 2000 | 1.0469 | 0.5992 | 0.5992 | 0.5966 | 0.5599 | 0.7238 |
60
+ | 0.7779 | 1.7847 | 3000 | 0.9977 | 0.6278 | 0.6278 | 0.5964 | 0.5646 | 0.7274 |
61
+ | 0.5545 | 2.3795 | 4000 | 0.9847 | 0.6290 | 0.6290 | 0.6208 | 0.5849 | 0.7236 |
62
+ | 0.5692 | 2.9744 | 5000 | 0.8454 | 0.6900 | 0.6900 | 0.6503 | 0.6078 | 0.7221 |
63
+ | 0.3962 | 3.5693 | 6000 | 1.0074 | 0.6488 | 0.6488 | 0.6316 | 0.6093 | 0.7081 |
64
+ | 0.1624 | 4.1642 | 7000 | 1.1059 | 0.6732 | 0.6732 | 0.6533 | 0.6322 | 0.6930 |
65
+ | 0.1816 | 4.7591 | 8000 | 1.1277 | 0.6872 | 0.6872 | 0.6513 | 0.6429 | 0.6690 |
66
+ | 0.0934 | 5.3540 | 9000 | 1.4084 | 0.6882 | 0.6882 | 0.6468 | 0.6380 | 0.6649 |
67
+ | 0.0882 | 5.9488 | 10000 | 1.4941 | 0.6918 | 0.6918 | 0.6450 | 0.6428 | 0.6606 |
68
 
69
 
70
  ### Framework versions
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<pad>": 49999
3
+ }
config.json CHANGED
@@ -1,15 +1,24 @@
1
  {
2
  "architectures": [
3
- "RobertaForSequenceClassification"
4
  ],
5
- "attention_probs_dropout_prob": 0.1,
 
6
  "bos_token_id": 0,
7
- "classifier_dropout": null,
 
 
 
 
 
 
8
  "dtype": "float32",
9
- "eos_token_id": 2,
 
 
 
10
  "gradient_checkpointing": false,
11
- "hidden_act": "gelu",
12
- "hidden_dropout_prob": 0.1,
13
  "hidden_size": 768,
14
  "id2label": {
15
  "0": "\ud575\uc2ec\uc9c8\ubb38",
@@ -29,8 +38,9 @@
29
  "14": "\uc608\uc2dc\ub370\uc774\ud130/\uc99d\ube59",
30
  "15": "\uc758\ubbf8/\ud574\ub2f9\uc0ac\ud56d\uc5c6\uc74c"
31
  },
 
32
  "initializer_range": 0.02,
33
- "intermediate_size": 3072,
34
  "label2id": {
35
  "\uadfc\uac70/\uc124\uba85": 7,
36
  "\ub300\uc548/\ube44\uad50": 10,
@@ -50,16 +60,23 @@
50
  "\ud575\uc2ec\uc9c8\ubb38": 0
51
  },
52
  "layer_norm_eps": 1e-05,
53
- "max_position_embeddings": 514,
54
- "model_type": "roberta",
 
 
 
 
 
 
55
  "num_attention_heads": 12,
56
- "num_hidden_layers": 12,
57
- "pad_token_id": 1,
58
  "position_embedding_type": "absolute",
59
  "problem_type": "single_label_classification",
60
- "tokenizer_class": "BertTokenizer",
 
 
 
61
  "transformers_version": "4.56.1",
62
- "type_vocab_size": 1,
63
- "use_cache": true,
64
- "vocab_size": 32000
65
  }
 
1
  {
2
  "architectures": [
3
+ "ModernBertForSequenceClassification"
4
  ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
  "bos_token_id": 0,
8
+ "classifier_activation": "gelu",
9
+ "classifier_bias": false,
10
+ "classifier_dropout": 0.0,
11
+ "classifier_pooling": "mean",
12
+ "cls_token_id": 0,
13
+ "decoder_bias": true,
14
+ "deterministic_flash_attn": false,
15
  "dtype": "float32",
16
+ "embedding_dropout": 0.0,
17
+ "eos_token_id": 1,
18
+ "global_attn_every_n_layers": 3,
19
+ "global_rope_theta": 160000,
20
  "gradient_checkpointing": false,
21
+ "hidden_activation": "gelu",
 
22
  "hidden_size": 768,
23
  "id2label": {
24
  "0": "\ud575\uc2ec\uc9c8\ubb38",
 
38
  "14": "\uc608\uc2dc\ub370\uc774\ud130/\uc99d\ube59",
39
  "15": "\uc758\ubbf8/\ud574\ub2f9\uc0ac\ud56d\uc5c6\uc74c"
40
  },
41
+ "initializer_cutoff_factor": 2.0,
42
  "initializer_range": 0.02,
43
+ "intermediate_size": 1152,
44
  "label2id": {
45
  "\uadfc\uac70/\uc124\uba85": 7,
46
  "\ub300\uc548/\ube44\uad50": 10,
 
60
  "\ud575\uc2ec\uc9c8\ubb38": 0
61
  },
62
  "layer_norm_eps": 1e-05,
63
+ "local_attention": 128,
64
+ "local_rope_theta": 10000.0,
65
+ "max_position_embeddings": 16384,
66
+ "mlp_bias": false,
67
+ "mlp_dropout": 0.0,
68
+ "model_type": "modernbert",
69
+ "norm_bias": false,
70
+ "norm_eps": 1e-05,
71
  "num_attention_heads": 12,
72
+ "num_hidden_layers": 22,
73
+ "pad_token_id": 49999,
74
  "position_embedding_type": "absolute",
75
  "problem_type": "single_label_classification",
76
+ "repad_logits_with_grad": false,
77
+ "sep_token_id": 1,
78
+ "sparse_pred_ignore_index": -100,
79
+ "sparse_prediction": false,
80
  "transformers_version": "4.56.1",
81
+ "vocab_size": 50000
 
 
82
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5029cc5e5c4f78dbe3082b65b81081564ee6b3cb0782b23de8341e0360a0ff23
3
- size 442545808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5163bed608f7349e76f6422df8f7c1262a06bb926993bf328bfba2d806281f12
3
+ size 597352360
special_tokens_map.json CHANGED
@@ -1,48 +1,48 @@
1
  {
2
  "bos_token": {
3
- "content": "[CLS]",
4
  "lstrip": false,
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
8
  },
9
  "cls_token": {
10
- "content": "[CLS]",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "eos_token": {
17
- "content": "[SEP]",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
21
  "single_word": false
22
  },
23
  "mask_token": {
24
- "content": "[MASK]",
25
  "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  },
30
  "pad_token": {
31
- "content": "[PAD]",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
  "sep_token": {
38
- "content": "[SEP]",
39
  "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
42
  "single_word": false
43
  },
44
  "unk_token": {
45
- "content": "[UNK]",
46
  "lstrip": false,
47
  "normalized": false,
48
  "rstrip": false,
 
1
  {
2
  "bos_token": {
3
+ "content": "<s>",
4
  "lstrip": false,
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
8
  },
9
  "cls_token": {
10
+ "content": "<cls>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
  "eos_token": {
17
+ "content": "<\\s>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
21
  "single_word": false
22
  },
23
  "mask_token": {
24
+ "content": "<mask>",
25
  "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  },
30
  "pad_token": {
31
+ "content": "<pad>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
  "sep_token": {
38
+ "content": "<sep>",
39
  "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
42
  "single_word": false
43
  },
44
  "unk_token": {
45
+ "content": "<unk>",
46
  "lstrip": false,
47
  "normalized": false,
48
  "rstrip": false,
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
- "content": "[CLS]",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
@@ -9,7 +9,7 @@
9
  "special": true
10
  },
11
  "1": {
12
- "content": "[PAD]",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
@@ -17,7 +17,7 @@
17
  "special": true
18
  },
19
  "2": {
20
- "content": "[SEP]",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
@@ -25,7 +25,7 @@
25
  "special": true
26
  },
27
  "3": {
28
- "content": "[UNK]",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
@@ -33,7 +33,271 @@
33
  "special": true
34
  },
35
  "4": {
36
- "content": "[MASK]",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
@@ -41,20 +305,18 @@
41
  "special": true
42
  }
43
  },
44
- "bos_token": "[CLS]",
45
- "clean_up_tokenization_spaces": false,
46
- "cls_token": "[CLS]",
47
- "do_basic_tokenize": true,
48
  "do_lower_case": false,
49
- "eos_token": "[SEP]",
50
  "extra_special_tokens": {},
51
- "mask_token": "[MASK]",
52
- "model_max_length": 512,
53
- "never_split": null,
54
- "pad_token": "[PAD]",
55
- "sep_token": "[SEP]",
56
  "strip_accents": null,
57
  "tokenize_chinese_chars": true,
58
  "tokenizer_class": "BertTokenizer",
59
- "unk_token": "[UNK]"
60
  }
 
1
  {
2
  "added_tokens_decoder": {
3
  "0": {
4
+ "content": "<s>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
 
9
  "special": true
10
  },
11
  "1": {
12
+ "content": "<\\s>",
13
  "lstrip": false,
14
  "normalized": false,
15
  "rstrip": false,
 
17
  "special": true
18
  },
19
  "2": {
20
+ "content": "<unk>",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
 
25
  "special": true
26
  },
27
  "3": {
28
+ "content": "<sep>",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
 
33
  "special": true
34
  },
35
  "4": {
36
+ "content": "<mask>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "5": {
44
+ "content": "<cls>",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "6": {
52
+ "content": "<unused0>",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "7": {
60
+ "content": "<unused1>",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "8": {
68
+ "content": "<unused2>",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ },
75
+ "9": {
76
+ "content": "<unused3>",
77
+ "lstrip": false,
78
+ "normalized": false,
79
+ "rstrip": false,
80
+ "single_word": false,
81
+ "special": true
82
+ },
83
+ "10": {
84
+ "content": "<unused4>",
85
+ "lstrip": false,
86
+ "normalized": false,
87
+ "rstrip": false,
88
+ "single_word": false,
89
+ "special": true
90
+ },
91
+ "11": {
92
+ "content": "<unused5>",
93
+ "lstrip": false,
94
+ "normalized": false,
95
+ "rstrip": false,
96
+ "single_word": false,
97
+ "special": true
98
+ },
99
+ "12": {
100
+ "content": "<unused6>",
101
+ "lstrip": false,
102
+ "normalized": false,
103
+ "rstrip": false,
104
+ "single_word": false,
105
+ "special": true
106
+ },
107
+ "13": {
108
+ "content": "<unused7>",
109
+ "lstrip": false,
110
+ "normalized": false,
111
+ "rstrip": false,
112
+ "single_word": false,
113
+ "special": true
114
+ },
115
+ "14": {
116
+ "content": "<unused8>",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false,
121
+ "special": true
122
+ },
123
+ "15": {
124
+ "content": "<unused9>",
125
+ "lstrip": false,
126
+ "normalized": false,
127
+ "rstrip": false,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "16": {
132
+ "content": "<unused10>",
133
+ "lstrip": false,
134
+ "normalized": false,
135
+ "rstrip": false,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "17": {
140
+ "content": "<unused11>",
141
+ "lstrip": false,
142
+ "normalized": false,
143
+ "rstrip": false,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "18": {
148
+ "content": "<unused12>",
149
+ "lstrip": false,
150
+ "normalized": false,
151
+ "rstrip": false,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "19": {
156
+ "content": "<unused13>",
157
+ "lstrip": false,
158
+ "normalized": false,
159
+ "rstrip": false,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "20": {
164
+ "content": "<unused14>",
165
+ "lstrip": false,
166
+ "normalized": false,
167
+ "rstrip": false,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "21": {
172
+ "content": "<unused15>",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "22": {
180
+ "content": "<unused16>",
181
+ "lstrip": false,
182
+ "normalized": false,
183
+ "rstrip": false,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "23": {
188
+ "content": "<unused17>",
189
+ "lstrip": false,
190
+ "normalized": false,
191
+ "rstrip": false,
192
+ "single_word": false,
193
+ "special": true
194
+ },
195
+ "24": {
196
+ "content": "<unused18>",
197
+ "lstrip": false,
198
+ "normalized": false,
199
+ "rstrip": false,
200
+ "single_word": false,
201
+ "special": true
202
+ },
203
+ "25": {
204
+ "content": "<unused19>",
205
+ "lstrip": false,
206
+ "normalized": false,
207
+ "rstrip": false,
208
+ "single_word": false,
209
+ "special": true
210
+ },
211
+ "26": {
212
+ "content": "<unused20>",
213
+ "lstrip": false,
214
+ "normalized": false,
215
+ "rstrip": false,
216
+ "single_word": false,
217
+ "special": true
218
+ },
219
+ "27": {
220
+ "content": "<unused21>",
221
+ "lstrip": false,
222
+ "normalized": false,
223
+ "rstrip": false,
224
+ "single_word": false,
225
+ "special": true
226
+ },
227
+ "28": {
228
+ "content": "<unused22>",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false,
233
+ "special": true
234
+ },
235
+ "29": {
236
+ "content": "<unused23>",
237
+ "lstrip": false,
238
+ "normalized": false,
239
+ "rstrip": false,
240
+ "single_word": false,
241
+ "special": true
242
+ },
243
+ "30": {
244
+ "content": "<unused24>",
245
+ "lstrip": false,
246
+ "normalized": false,
247
+ "rstrip": false,
248
+ "single_word": false,
249
+ "special": true
250
+ },
251
+ "31": {
252
+ "content": "<unused25>",
253
+ "lstrip": false,
254
+ "normalized": false,
255
+ "rstrip": false,
256
+ "single_word": false,
257
+ "special": true
258
+ },
259
+ "32": {
260
+ "content": "<unused26>",
261
+ "lstrip": false,
262
+ "normalized": false,
263
+ "rstrip": false,
264
+ "single_word": false,
265
+ "special": true
266
+ },
267
+ "33": {
268
+ "content": "<unused27>",
269
+ "lstrip": false,
270
+ "normalized": false,
271
+ "rstrip": false,
272
+ "single_word": false,
273
+ "special": true
274
+ },
275
+ "34": {
276
+ "content": "<unused28>",
277
+ "lstrip": false,
278
+ "normalized": false,
279
+ "rstrip": false,
280
+ "single_word": false,
281
+ "special": true
282
+ },
283
+ "35": {
284
+ "content": "<unused29>",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false,
289
+ "special": true
290
+ },
291
+ "36": {
292
+ "content": "<unused30>",
293
+ "lstrip": false,
294
+ "normalized": false,
295
+ "rstrip": false,
296
+ "single_word": false,
297
+ "special": true
298
+ },
299
+ "49999": {
300
+ "content": "<pad>",
301
  "lstrip": false,
302
  "normalized": false,
303
  "rstrip": false,
 
305
  "special": true
306
  }
307
  },
308
+ "bos_token": "<s>",
309
+ "clean_up_tokenization_spaces": true,
310
+ "cls_token": "<cls>",
 
311
  "do_lower_case": false,
312
+ "eos_token": "<\\s>",
313
  "extra_special_tokens": {},
314
+ "mask_token": "<mask>",
315
+ "model_max_length": 1024,
316
+ "pad_token": "<pad>",
317
+ "sep_token": "<sep>",
 
318
  "strip_accents": null,
319
  "tokenize_chinese_chars": true,
320
  "tokenizer_class": "BertTokenizer",
321
+ "unk_token": "<unk>"
322
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89a1c4e17ad5d25dbf2f8b28524d6251bdac9277288d757f1766e38116fae9a5
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f53086e3bb6cbe98433b44baa7f92d9e808cae3146fd2be289265614a28a4e
3
  size 5905
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff