prithviraj-maurya committed on
Commit
3f808a9
·
verified ·
1 Parent(s): 2014fbd

End of training

Browse files
README.md ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: distilbert-base-uncased
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
+ model-index:
9
+ - name: legalbench_task_classification
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # legalbench_task_classification
17
+
18
+ This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 1.6844
21
+ - Accuracy: 0.9427
22
+
23
+ ## Model description
24
+
25
+ More information needed
26
+
27
+ ## Intended uses & limitations
28
+
29
+ More information needed
30
+
31
+ ## Training and evaluation data
32
+
33
+ More information needed
34
+
35
+ ## Training procedure
36
+
37
+ ### Training hyperparameters
38
+
39
+ The following hyperparameters were used during training:
40
+ - learning_rate: 2e-05
41
+ - train_batch_size: 16
42
+ - eval_batch_size: 16
43
+ - seed: 42
44
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
+ - lr_scheduler_type: linear
46
+ - num_epochs: 2
47
+
48
+ ### Training results
49
+
50
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
+ | No log | 1.0 | 489 | 2.3287 | 0.9008 |
53
+ | 3.5563 | 2.0 | 978 | 1.6844 | 0.9427 |
54
+
55
+
56
+ ### Framework versions
57
+
58
+ - Transformers 4.35.2
59
+ - Pytorch 2.1.0+cu121
60
+ - Datasets 2.17.0
61
+ - Tokenizers 0.15.1
config.json ADDED
@@ -0,0 +1,351 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "label2id": {
12
+ "abercrombie": 0,
13
+ "canada_tax_court_outcomes": 1,
14
+ "citation_prediction_classification": 2,
15
+ "citation_prediction_open": 3,
16
+ "consumer_contracts_qa": 4,
17
+ "contract_nli_confidentiality_of_agreement": 5,
18
+ "contract_nli_explicit_identification": 6,
19
+ "contract_nli_inclusion_of_verbally_conveyed_information": 7,
20
+ "contract_nli_limited_use": 8,
21
+ "contract_nli_no_licensing": 9,
22
+ "contract_nli_notice_on_compelled_disclosure": 10,
23
+ "contract_nli_permissible_acquirement_of_similar_information": 11,
24
+ "contract_nli_permissible_copy": 12,
25
+ "contract_nli_permissible_development_of_similar_information": 13,
26
+ "contract_nli_permissible_post-agreement_possession": 14,
27
+ "contract_nli_return_of_confidential_information": 15,
28
+ "contract_nli_sharing_with_employees": 16,
29
+ "contract_nli_sharing_with_third-parties": 17,
30
+ "contract_nli_survival_of_obligations": 18,
31
+ "contract_qa": 19,
32
+ "corporate_lobbying": 20,
33
+ "cuad_affiliate_license-licensee": 21,
34
+ "cuad_affiliate_license-licensor": 22,
35
+ "cuad_anti-assignment": 23,
36
+ "cuad_audit_rights": 24,
37
+ "cuad_cap_on_liability": 25,
38
+ "cuad_change_of_control": 26,
39
+ "cuad_competitive_restriction_exception": 27,
40
+ "cuad_covenant_not_to_sue": 28,
41
+ "cuad_effective_date": 29,
42
+ "cuad_exclusivity": 30,
43
+ "cuad_expiration_date": 31,
44
+ "cuad_governing_law": 32,
45
+ "cuad_insurance": 33,
46
+ "cuad_ip_ownership_assignment": 34,
47
+ "cuad_irrevocable_or_perpetual_license": 35,
48
+ "cuad_joint_ip_ownership": 36,
49
+ "cuad_license_grant": 37,
50
+ "cuad_liquidated_damages": 38,
51
+ "cuad_minimum_commitment": 39,
52
+ "cuad_most_favored_nation": 40,
53
+ "cuad_no-solicit_of_customers": 41,
54
+ "cuad_no-solicit_of_employees": 42,
55
+ "cuad_non-compete": 43,
56
+ "cuad_non-disparagement": 44,
57
+ "cuad_non-transferable_license": 45,
58
+ "cuad_notice_period_to_terminate_renewal": 46,
59
+ "cuad_post-termination_services": 47,
60
+ "cuad_price_restrictions": 48,
61
+ "cuad_renewal_term": 49,
62
+ "cuad_revenue-profit_sharing": 50,
63
+ "cuad_rofr-rofo-rofn": 51,
64
+ "cuad_source_code_escrow": 52,
65
+ "cuad_termination_for_convenience": 53,
66
+ "cuad_third_party_beneficiary": 54,
67
+ "cuad_uncapped_liability": 55,
68
+ "cuad_unlimited-all-you-can-eat-license": 56,
69
+ "cuad_volume_restriction": 57,
70
+ "cuad_warranty_duration": 58,
71
+ "definition_classification": 59,
72
+ "definition_extraction": 60,
73
+ "diversity_1": 61,
74
+ "diversity_2": 62,
75
+ "diversity_3": 63,
76
+ "diversity_4": 64,
77
+ "diversity_5": 65,
78
+ "diversity_6": 66,
79
+ "function_of_decision_section": 67,
80
+ "hearsay": 68,
81
+ "insurance_policy_interpretation": 69,
82
+ "international_citizenship_questions": 70,
83
+ "jcrew_blocker": 71,
84
+ "learned_hands_benefits": 72,
85
+ "learned_hands_business": 73,
86
+ "learned_hands_consumer": 74,
87
+ "learned_hands_courts": 75,
88
+ "learned_hands_crime": 76,
89
+ "learned_hands_divorce": 77,
90
+ "learned_hands_domestic_violence": 78,
91
+ "learned_hands_education": 79,
92
+ "learned_hands_employment": 80,
93
+ "learned_hands_estates": 81,
94
+ "learned_hands_family": 82,
95
+ "learned_hands_health": 83,
96
+ "learned_hands_housing": 84,
97
+ "learned_hands_immigration": 85,
98
+ "learned_hands_torts": 86,
99
+ "learned_hands_traffic": 87,
100
+ "legal_reasoning_causality": 88,
101
+ "maud_ability_to_consummate_concept_is_subject_to_mae_carveouts": 89,
102
+ "maud_accuracy_of_fundamental_target_rws_bringdown_standard": 90,
103
+ "maud_accuracy_of_target_capitalization_rw_(outstanding_shares)_bringdown_standard_answer": 91,
104
+ "maud_accuracy_of_target_general_rw_bringdown_timing_answer": 92,
105
+ "maud_additional_matching_rights_period_for_modifications_(cor)": 93,
106
+ "maud_application_of_buyer_consent_requirement_(negative_interim_covenant)": 94,
107
+ "maud_buyer_consent_requirement_(ordinary_course)": 95,
108
+ "maud_change_in_law__subject_to_disproportionate_impact_modifier": 96,
109
+ "maud_changes_in_gaap_or_other_accounting_principles__subject_to_disproportionate_impact_modifier": 97,
110
+ "maud_cor_permitted_in_response_to_intervening_event": 98,
111
+ "maud_cor_permitted_with_board_fiduciary_determination_only": 99,
112
+ "maud_cor_standard_(intervening_event)": 100,
113
+ "maud_cor_standard_(superior_offer)": 101,
114
+ "maud_definition_contains_knowledge_requirement_-_answer": 102,
115
+ "maud_definition_includes_asset_deals": 103,
116
+ "maud_definition_includes_stock_deals": 104,
117
+ "maud_fiduciary_exception__board_determination_standard": 105,
118
+ "maud_fiduciary_exception_board_determination_trigger_(no_shop)": 106,
119
+ "maud_financial_point_of_view_is_the_sole_consideration": 107,
120
+ "maud_fls_(mae)_standard": 108,
121
+ "maud_general_economic_and_financial_conditions_subject_to_disproportionate_impact_modifier": 109,
122
+ "maud_includes_consistent_with_past_practice": 110,
123
+ "maud_initial_matching_rights_period_(cor)": 111,
124
+ "maud_initial_matching_rights_period_(ftr)": 112,
125
+ "maud_intervening_event_-_required_to_occur_after_signing_-_answer": 113,
126
+ "maud_knowledge_definition": 114,
127
+ "maud_liability_standard_for_no-shop_breach_by_target_non-do_representatives": 115,
128
+ "maud_ordinary_course_efforts_standard": 116,
129
+ "maud_pandemic_or_other_public_health_event__subject_to_disproportionate_impact_modifier": 117,
130
+ "maud_pandemic_or_other_public_health_event_specific_reference_to_pandemic-related_governmental_responses_or_measures": 118,
131
+ "maud_relational_language_(mae)_applies_to": 119,
132
+ "maud_specific_performance": 120,
133
+ "maud_tail_period_length": 121,
134
+ "maud_type_of_consideration": 122,
135
+ "nys_judicial_ethics": 123,
136
+ "opp115_data_retention": 124,
137
+ "opp115_data_security": 125,
138
+ "opp115_do_not_track": 126,
139
+ "opp115_first_party_collection_use": 127,
140
+ "opp115_international_and_specific_audiences": 128,
141
+ "opp115_policy_change": 129,
142
+ "opp115_third_party_sharing_collection": 130,
143
+ "opp115_user_access,_edit_and_deletion": 131,
144
+ "opp115_user_choice_control": 132,
145
+ "oral_argument_question_purpose": 133,
146
+ "overruling": 134,
147
+ "personal_jurisdiction": 135,
148
+ "privacy_policy_entailment": 136,
149
+ "privacy_policy_qa": 137,
150
+ "proa": 138,
151
+ "sara_entailment": 139,
152
+ "sara_numeric": 140,
153
+ "scalr": 141,
154
+ "ssla_company_defendants": 142,
155
+ "ssla_individual_defendants": 143,
156
+ "ssla_plaintiff": 144,
157
+ "successor_liability": 145,
158
+ "supply_chain_disclosure_best_practice_accountability": 146,
159
+ "supply_chain_disclosure_best_practice_audits": 147,
160
+ "supply_chain_disclosure_best_practice_certification": 148,
161
+ "supply_chain_disclosure_best_practice_training": 149,
162
+ "supply_chain_disclosure_best_practice_verification": 150,
163
+ "supply_chain_disclosure_disclosed_accountability": 151,
164
+ "supply_chain_disclosure_disclosed_audits": 152,
165
+ "supply_chain_disclosure_disclosed_certification": 153,
166
+ "supply_chain_disclosure_disclosed_training": 154,
167
+ "supply_chain_disclosure_disclosed_verification": 155,
168
+ "telemarketing_sales_rule": 156,
169
+ "textualism_tool_dictionaries": 157,
170
+ "textualism_tool_plain": 158,
171
+ "ucc_v_common_law": 159,
172
+ "unfair_tos": 160
173
+ },
174
+ "initializer_range": 0.02,
175
+ "id2label": {
176
+ "0": "abercrombie",
177
+ "1": "canada_tax_court_outcomes",
178
+ "2": "citation_prediction_classification",
179
+ "3": "citation_prediction_open",
180
+ "4": "consumer_contracts_qa",
181
+ "5": "contract_nli_confidentiality_of_agreement",
182
+ "6": "contract_nli_explicit_identification",
183
+ "7": "contract_nli_inclusion_of_verbally_conveyed_information",
184
+ "8": "contract_nli_limited_use",
185
+ "9": "contract_nli_no_licensing",
186
+ "10": "contract_nli_notice_on_compelled_disclosure",
187
+ "11": "contract_nli_permissible_acquirement_of_similar_information",
188
+ "12": "contract_nli_permissible_copy",
189
+ "13": "contract_nli_permissible_development_of_similar_information",
190
+ "14": "contract_nli_permissible_post-agreement_possession",
191
+ "15": "contract_nli_return_of_confidential_information",
192
+ "16": "contract_nli_sharing_with_employees",
193
+ "17": "contract_nli_sharing_with_third-parties",
194
+ "18": "contract_nli_survival_of_obligations",
195
+ "19": "contract_qa",
196
+ "20": "corporate_lobbying",
197
+ "21": "cuad_affiliate_license-licensee",
198
+ "22": "cuad_affiliate_license-licensor",
199
+ "23": "cuad_anti-assignment",
200
+ "24": "cuad_audit_rights",
201
+ "25": "cuad_cap_on_liability",
202
+ "26": "cuad_change_of_control",
203
+ "27": "cuad_competitive_restriction_exception",
204
+ "28": "cuad_covenant_not_to_sue",
205
+ "29": "cuad_effective_date",
206
+ "30": "cuad_exclusivity",
207
+ "31": "cuad_expiration_date",
208
+ "32": "cuad_governing_law",
209
+ "33": "cuad_insurance",
210
+ "34": "cuad_ip_ownership_assignment",
211
+ "35": "cuad_irrevocable_or_perpetual_license",
212
+ "36": "cuad_joint_ip_ownership",
213
+ "37": "cuad_license_grant",
214
+ "38": "cuad_liquidated_damages",
215
+ "39": "cuad_minimum_commitment",
216
+ "40": "cuad_most_favored_nation",
217
+ "41": "cuad_no-solicit_of_customers",
218
+ "42": "cuad_no-solicit_of_employees",
219
+ "43": "cuad_non-compete",
220
+ "44": "cuad_non-disparagement",
221
+ "45": "cuad_non-transferable_license",
222
+ "46": "cuad_notice_period_to_terminate_renewal",
223
+ "47": "cuad_post-termination_services",
224
+ "48": "cuad_price_restrictions",
225
+ "49": "cuad_renewal_term",
226
+ "50": "cuad_revenue-profit_sharing",
227
+ "51": "cuad_rofr-rofo-rofn",
228
+ "52": "cuad_source_code_escrow",
229
+ "53": "cuad_termination_for_convenience",
230
+ "54": "cuad_third_party_beneficiary",
231
+ "55": "cuad_uncapped_liability",
232
+ "56": "cuad_unlimited-all-you-can-eat-license",
233
+ "57": "cuad_volume_restriction",
234
+ "58": "cuad_warranty_duration",
235
+ "59": "definition_classification",
236
+ "60": "definition_extraction",
237
+ "61": "diversity_1",
238
+ "62": "diversity_2",
239
+ "63": "diversity_3",
240
+ "64": "diversity_4",
241
+ "65": "diversity_5",
242
+ "66": "diversity_6",
243
+ "67": "function_of_decision_section",
244
+ "68": "hearsay",
245
+ "69": "insurance_policy_interpretation",
246
+ "70": "international_citizenship_questions",
247
+ "71": "jcrew_blocker",
248
+ "72": "learned_hands_benefits",
249
+ "73": "learned_hands_business",
250
+ "74": "learned_hands_consumer",
251
+ "75": "learned_hands_courts",
252
+ "76": "learned_hands_crime",
253
+ "77": "learned_hands_divorce",
254
+ "78": "learned_hands_domestic_violence",
255
+ "79": "learned_hands_education",
256
+ "80": "learned_hands_employment",
257
+ "81": "learned_hands_estates",
258
+ "82": "learned_hands_family",
259
+ "83": "learned_hands_health",
260
+ "84": "learned_hands_housing",
261
+ "85": "learned_hands_immigration",
262
+ "86": "learned_hands_torts",
263
+ "87": "learned_hands_traffic",
264
+ "88": "legal_reasoning_causality",
265
+ "89": "maud_ability_to_consummate_concept_is_subject_to_mae_carveouts",
266
+ "90": "maud_accuracy_of_fundamental_target_rws_bringdown_standard",
267
+ "91": "maud_accuracy_of_target_capitalization_rw_(outstanding_shares)_bringdown_standard_answer",
268
+ "92": "maud_accuracy_of_target_general_rw_bringdown_timing_answer",
269
+ "93": "maud_additional_matching_rights_period_for_modifications_(cor)",
270
+ "94": "maud_application_of_buyer_consent_requirement_(negative_interim_covenant)",
271
+ "95": "maud_buyer_consent_requirement_(ordinary_course)",
272
+ "96": "maud_change_in_law__subject_to_disproportionate_impact_modifier",
273
+ "97": "maud_changes_in_gaap_or_other_accounting_principles__subject_to_disproportionate_impact_modifier",
274
+ "98": "maud_cor_permitted_in_response_to_intervening_event",
275
+ "99": "maud_cor_permitted_with_board_fiduciary_determination_only",
276
+ "100": "maud_cor_standard_(intervening_event)",
277
+ "101": "maud_cor_standard_(superior_offer)",
278
+ "102": "maud_definition_contains_knowledge_requirement_-_answer",
279
+ "103": "maud_definition_includes_asset_deals",
280
+ "104": "maud_definition_includes_stock_deals",
281
+ "105": "maud_fiduciary_exception__board_determination_standard",
282
+ "106": "maud_fiduciary_exception_board_determination_trigger_(no_shop)",
283
+ "107": "maud_financial_point_of_view_is_the_sole_consideration",
284
+ "108": "maud_fls_(mae)_standard",
285
+ "109": "maud_general_economic_and_financial_conditions_subject_to_disproportionate_impact_modifier",
286
+ "110": "maud_includes_consistent_with_past_practice",
287
+ "111": "maud_initial_matching_rights_period_(cor)",
288
+ "112": "maud_initial_matching_rights_period_(ftr)",
289
+ "113": "maud_intervening_event_-_required_to_occur_after_signing_-_answer",
290
+ "114": "maud_knowledge_definition",
291
+ "115": "maud_liability_standard_for_no-shop_breach_by_target_non-do_representatives",
292
+ "116": "maud_ordinary_course_efforts_standard",
293
+ "117": "maud_pandemic_or_other_public_health_event__subject_to_disproportionate_impact_modifier",
294
+ "118": "maud_pandemic_or_other_public_health_event_specific_reference_to_pandemic-related_governmental_responses_or_measures",
295
+ "119": "maud_relational_language_(mae)_applies_to",
296
+ "120": "maud_specific_performance",
297
+ "121": "maud_tail_period_length",
298
+ "122": "maud_type_of_consideration",
299
+ "123": "nys_judicial_ethics",
300
+ "124": "opp115_data_retention",
301
+ "125": "opp115_data_security",
302
+ "126": "opp115_do_not_track",
303
+ "127": "opp115_first_party_collection_use",
304
+ "128": "opp115_international_and_specific_audiences",
305
+ "129": "opp115_policy_change",
306
+ "130": "opp115_third_party_sharing_collection",
307
+ "131": "opp115_user_access,_edit_and_deletion",
308
+ "132": "opp115_user_choice_control",
309
+ "133": "oral_argument_question_purpose",
310
+ "134": "overruling",
311
+ "135": "personal_jurisdiction",
312
+ "136": "privacy_policy_entailment",
313
+ "137": "privacy_policy_qa",
314
+ "138": "proa",
315
+ "139": "sara_entailment",
316
+ "140": "sara_numeric",
317
+ "141": "scalr",
318
+ "142": "ssla_company_defendants",
319
+ "143": "ssla_individual_defendants",
320
+ "144": "ssla_plaintiff",
321
+ "145": "successor_liability",
322
+ "146": "supply_chain_disclosure_best_practice_accountability",
323
+ "147": "supply_chain_disclosure_best_practice_audits",
324
+ "148": "supply_chain_disclosure_best_practice_certification",
325
+ "149": "supply_chain_disclosure_best_practice_training",
326
+ "150": "supply_chain_disclosure_best_practice_verification",
327
+ "151": "supply_chain_disclosure_disclosed_accountability",
328
+ "152": "supply_chain_disclosure_disclosed_audits",
329
+ "153": "supply_chain_disclosure_disclosed_certification",
330
+ "154": "supply_chain_disclosure_disclosed_training",
331
+ "155": "supply_chain_disclosure_disclosed_verification",
332
+ "156": "telemarketing_sales_rule",
333
+ "157": "textualism_tool_dictionaries",
334
+ "158": "textualism_tool_plain",
335
+ "159": "ucc_v_common_law",
336
+ "160": "unfair_tos"
337
+ },
338
+ "max_position_embeddings": 512,
339
+ "model_type": "distilbert",
340
+ "n_heads": 12,
341
+ "n_layers": 6,
342
+ "pad_token_id": 0,
343
+ "problem_type": "single_label_classification",
344
+ "qa_dropout": 0.1,
345
+ "seq_classif_dropout": 0.2,
346
+ "sinusoidal_pos_embds": false,
347
+ "tie_weights_": true,
348
+ "torch_dtype": "float32",
349
+ "transformers_version": "4.35.2",
350
+ "vocab_size": 30522
351
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26b1af9a724f532581a03daa3b9f39e074385d892a67343b4f97f6054ffdc2b5
3
+ size 268321660
runs/Feb14_17-10-39_fdf0a2dd9181/events.out.tfevents.1707930641.fdf0a2dd9181.3331.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed2b1e3a83b97c8d05f3de48cb6ff07ca3b4f8e2e885cf10a249b2de3599ab12
3
+ size 19945
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 512,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c9b0378fb8606faf50f6eccb48cb8fba64f6580fc2efe614ef5f8c674d5b513
3
+ size 4600
vocab.txt ADDED
The diff for this file is too large to render. See raw diff