hanyp committed on
Commit
b72cbc3
1 Parent(s): 9c3ca7e

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,230 +1,33 @@
1
  {
2
- "_name_or_path": "google/vit-base-patch16-224-in21k",
 
3
  "architectures": [
4
- "ViTForImageClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.0,
7
- "encoder_stride": 16,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.0,
10
- "hidden_size": 768,
11
  "id2label": {
12
- "0": "apple_pie",
13
- "1": "baby_back_ribs",
14
- "10": "bruschetta",
15
- "100": "waffles",
16
- "11": "caesar_salad",
17
- "12": "cannoli",
18
- "13": "caprese_salad",
19
- "14": "carrot_cake",
20
- "15": "ceviche",
21
- "16": "cheesecake",
22
- "17": "cheese_plate",
23
- "18": "chicken_curry",
24
- "19": "chicken_quesadilla",
25
- "2": "baklava",
26
- "20": "chicken_wings",
27
- "21": "chocolate_cake",
28
- "22": "chocolate_mousse",
29
- "23": "churros",
30
- "24": "clam_chowder",
31
- "25": "club_sandwich",
32
- "26": "crab_cakes",
33
- "27": "creme_brulee",
34
- "28": "croque_madame",
35
- "29": "cup_cakes",
36
- "3": "beef_carpaccio",
37
- "30": "deviled_eggs",
38
- "31": "donuts",
39
- "32": "dumplings",
40
- "33": "edamame",
41
- "34": "eggs_benedict",
42
- "35": "escargots",
43
- "36": "falafel",
44
- "37": "filet_mignon",
45
- "38": "fish_and_chips",
46
- "39": "foie_gras",
47
- "4": "beef_tartare",
48
- "40": "french_fries",
49
- "41": "french_onion_soup",
50
- "42": "french_toast",
51
- "43": "fried_calamari",
52
- "44": "fried_rice",
53
- "45": "frozen_yogurt",
54
- "46": "garlic_bread",
55
- "47": "gnocchi",
56
- "48": "greek_salad",
57
- "49": "grilled_cheese_sandwich",
58
- "5": "beet_salad",
59
- "50": "grilled_salmon",
60
- "51": "guacamole",
61
- "52": "gyoza",
62
- "53": "hamburger",
63
- "54": "hot_and_sour_soup",
64
- "55": "hot_dog",
65
- "56": "huevos_rancheros",
66
- "57": "hummus",
67
- "58": "ice_cream",
68
- "59": "lasagna",
69
- "6": "beignets",
70
- "60": "lobster_bisque",
71
- "61": "lobster_roll_sandwich",
72
- "62": "macaroni_and_cheese",
73
- "63": "macarons",
74
- "64": "miso_soup",
75
- "65": "mussels",
76
- "66": "nachos",
77
- "67": "omelette",
78
- "68": "onion_rings",
79
- "69": "oysters",
80
- "7": "bibimbap",
81
- "70": "pad_thai",
82
- "71": "paella",
83
- "72": "pancakes",
84
- "73": "panna_cotta",
85
- "74": "peking_duck",
86
- "75": "pho",
87
- "76": "pizza",
88
- "77": "pork_chop",
89
- "78": "poutine",
90
- "79": "prime_rib",
91
- "8": "bread_pudding",
92
- "80": "pulled_pork_sandwich",
93
- "81": "ramen",
94
- "82": "ravioli",
95
- "83": "red_velvet_cake",
96
- "84": "risotto",
97
- "85": "samosa",
98
- "86": "sashimi",
99
- "87": "scallops",
100
- "88": "seaweed_salad",
101
- "89": "shrimp_and_grits",
102
- "9": "breakfast_burrito",
103
- "90": "spaghetti_bolognese",
104
- "91": "spaghetti_carbonara",
105
- "92": "spring_rolls",
106
- "93": "steak",
107
- "94": "strawberry_shortcake",
108
- "95": "sushi",
109
- "96": "tacos",
110
- "97": "takoyaki",
111
- "98": "tiramisu",
112
- "99": "tuna_tartare"
113
  },
114
- "image_size": 224,
115
  "initializer_range": 0.02,
116
- "intermediate_size": 3072,
117
  "label2id": {
118
- "apple_pie": "0",
119
- "baby_back_ribs": "1",
120
- "baklava": "2",
121
- "beef_carpaccio": "3",
122
- "beef_tartare": "4",
123
- "beet_salad": "5",
124
- "beignets": "6",
125
- "bibimbap": "7",
126
- "bread_pudding": "8",
127
- "breakfast_burrito": "9",
128
- "bruschetta": "10",
129
- "caesar_salad": "11",
130
- "cannoli": "12",
131
- "caprese_salad": "13",
132
- "carrot_cake": "14",
133
- "ceviche": "15",
134
- "cheese_plate": "17",
135
- "cheesecake": "16",
136
- "chicken_curry": "18",
137
- "chicken_quesadilla": "19",
138
- "chicken_wings": "20",
139
- "chocolate_cake": "21",
140
- "chocolate_mousse": "22",
141
- "churros": "23",
142
- "clam_chowder": "24",
143
- "club_sandwich": "25",
144
- "crab_cakes": "26",
145
- "creme_brulee": "27",
146
- "croque_madame": "28",
147
- "cup_cakes": "29",
148
- "deviled_eggs": "30",
149
- "donuts": "31",
150
- "dumplings": "32",
151
- "edamame": "33",
152
- "eggs_benedict": "34",
153
- "escargots": "35",
154
- "falafel": "36",
155
- "filet_mignon": "37",
156
- "fish_and_chips": "38",
157
- "foie_gras": "39",
158
- "french_fries": "40",
159
- "french_onion_soup": "41",
160
- "french_toast": "42",
161
- "fried_calamari": "43",
162
- "fried_rice": "44",
163
- "frozen_yogurt": "45",
164
- "garlic_bread": "46",
165
- "gnocchi": "47",
166
- "greek_salad": "48",
167
- "grilled_cheese_sandwich": "49",
168
- "grilled_salmon": "50",
169
- "guacamole": "51",
170
- "gyoza": "52",
171
- "hamburger": "53",
172
- "hot_and_sour_soup": "54",
173
- "hot_dog": "55",
174
- "huevos_rancheros": "56",
175
- "hummus": "57",
176
- "ice_cream": "58",
177
- "lasagna": "59",
178
- "lobster_bisque": "60",
179
- "lobster_roll_sandwich": "61",
180
- "macaroni_and_cheese": "62",
181
- "macarons": "63",
182
- "miso_soup": "64",
183
- "mussels": "65",
184
- "nachos": "66",
185
- "omelette": "67",
186
- "onion_rings": "68",
187
- "oysters": "69",
188
- "pad_thai": "70",
189
- "paella": "71",
190
- "pancakes": "72",
191
- "panna_cotta": "73",
192
- "peking_duck": "74",
193
- "pho": "75",
194
- "pizza": "76",
195
- "pork_chop": "77",
196
- "poutine": "78",
197
- "prime_rib": "79",
198
- "pulled_pork_sandwich": "80",
199
- "ramen": "81",
200
- "ravioli": "82",
201
- "red_velvet_cake": "83",
202
- "risotto": "84",
203
- "samosa": "85",
204
- "sashimi": "86",
205
- "scallops": "87",
206
- "seaweed_salad": "88",
207
- "shrimp_and_grits": "89",
208
- "spaghetti_bolognese": "90",
209
- "spaghetti_carbonara": "91",
210
- "spring_rolls": "92",
211
- "steak": "93",
212
- "strawberry_shortcake": "94",
213
- "sushi": "95",
214
- "tacos": "96",
215
- "takoyaki": "97",
216
- "tiramisu": "98",
217
- "tuna_tartare": "99",
218
- "waffles": "100"
219
  },
220
- "layer_norm_eps": 1e-12,
221
- "model_type": "vit",
222
- "num_attention_heads": 12,
223
- "num_channels": 3,
224
- "num_hidden_layers": 12,
225
- "patch_size": 16,
226
  "problem_type": "single_label_classification",
227
- "qkv_bias": true,
 
 
 
228
  "torch_dtype": "float32",
229
- "transformers_version": "4.41.2"
 
230
  }
 
1
  {
2
+ "_name_or_path": "distilbert/distilbert-base-uncased",
3
+ "activation": "gelu",
4
  "architectures": [
5
+ "DistilBertForSequenceClassification"
6
  ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
 
11
  "id2label": {
12
+ "0": "NEGATIVE",
13
+ "1": "POSITIVE"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  },
 
15
  "initializer_range": 0.02,
 
16
  "label2id": {
17
+ "NEGATIVE": 0,
18
+ "POSITIVE": 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  },
20
+ "max_position_embeddings": 512,
21
+ "model_type": "distilbert",
22
+ "n_heads": 12,
23
+ "n_layers": 6,
24
+ "pad_token_id": 0,
 
25
  "problem_type": "single_label_classification",
26
+ "qa_dropout": 0.1,
27
+ "seq_classif_dropout": 0.2,
28
+ "sinusoidal_pos_embds": false,
29
+ "tie_weights_": true,
30
  "torch_dtype": "float32",
31
+ "transformers_version": "4.41.2",
32
+ "vocab_size": 30522
33
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46b11f92f75832003347dfd6dcffc9fb90a83e76b6838a307fa3554399628642
3
- size 343528508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50f5e258eeac0b7e963dab2163ba48274a7788daa63ee41b557f00b1f6abb849
3
+ size 267832560
runs/Jun08_12-01-24_dsw-5977-84cbf586f7-2r5n8/events.out.tfevents.1717819286.dsw-5977-84cbf586f7-2r5n8.1165019.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:489ba54b7dda0f8d347a6a865e7ad2b42dcb81d5c1900a1808d306e69c0a3866
3
+ size 5357
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 512,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a92f7ca52febe5ec3ffc3a50169bced0c3b74599992d546c481bd91bcdbc9692
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed79e4fdd694746972bf002368e41c3a780b0b3f4fbe707a723d7d39c10277af
3
  size 5112
vocab.txt ADDED
The diff for this file is too large to render. See raw diff