arzans9 committed on
Commit
0c0faa5
1 Parent(s): d71746f

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "_name_or_path": "microsoft/trocr-small-printed",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
6
  "decoder": {
7
  "_name_or_path": "",
8
  "activation_dropout": 0.0,
9
- "activation_function": "relu",
10
  "add_cross_attention": true,
11
  "architectures": null,
12
  "attention_dropout": 0.0,
@@ -15,12 +15,12 @@
15
  "bos_token_id": 0,
16
  "chunk_size_feed_forward": 0,
17
  "classifier_dropout": 0.0,
18
- "cross_attention_hidden_size": 384,
19
- "d_model": 256,
20
- "decoder_attention_heads": 8,
21
- "decoder_ffn_dim": 1024,
22
  "decoder_layerdrop": 0.0,
23
- "decoder_layers": 6,
24
  "decoder_start_token_id": 2,
25
  "diversity_penalty": 0.0,
26
  "do_sample": false,
@@ -64,14 +64,14 @@
64
  "repetition_penalty": 1.0,
65
  "return_dict": true,
66
  "return_dict_in_generate": false,
67
- "scale_embedding": true,
68
  "sep_token_id": null,
69
  "suppress_tokens": null,
70
  "task_specific_params": null,
71
  "temperature": 1.0,
72
  "tf_legacy_loss": false,
73
  "tie_encoder_decoder": false,
74
- "tie_word_embeddings": false,
75
  "tokenizer_class": null,
76
  "top_k": 50,
77
  "top_p": 1.0,
@@ -81,7 +81,7 @@
81
  "use_bfloat16": false,
82
  "use_cache": false,
83
  "use_learned_position_embeddings": true,
84
- "vocab_size": 64044
85
  },
86
  "decoder_start_token_id": 0,
87
  "early_stopping": true,
@@ -108,14 +108,14 @@
108
  "forced_eos_token_id": null,
109
  "hidden_act": "gelu",
110
  "hidden_dropout_prob": 0.0,
111
- "hidden_size": 384,
112
  "id2label": {
113
  "0": "LABEL_0",
114
  "1": "LABEL_1"
115
  },
116
  "image_size": 384,
117
  "initializer_range": 0.02,
118
- "intermediate_size": 1536,
119
  "is_decoder": false,
120
  "is_encoder_decoder": false,
121
  "label2id": {
@@ -126,9 +126,9 @@
126
  "length_penalty": 1.0,
127
  "max_length": 20,
128
  "min_length": 0,
129
- "model_type": "deit",
130
  "no_repeat_ngram_size": 0,
131
- "num_attention_heads": 6,
132
  "num_beam_groups": 1,
133
  "num_beams": 1,
134
  "num_channels": 3,
@@ -142,7 +142,7 @@
142
  "prefix": null,
143
  "problem_type": null,
144
  "pruned_heads": {},
145
- "qkv_bias": true,
146
  "remove_invalid_values": false,
147
  "repetition_penalty": 1.0,
148
  "return_dict": true,
@@ -173,5 +173,5 @@
173
  "tie_word_embeddings": false,
174
  "torch_dtype": "float32",
175
  "transformers_version": "4.37.2",
176
- "vocab_size": 64044
177
  }
 
1
  {
2
+ "_name_or_path": "microsoft/trocr-base-printed",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
6
  "decoder": {
7
  "_name_or_path": "",
8
  "activation_dropout": 0.0,
9
+ "activation_function": "gelu",
10
  "add_cross_attention": true,
11
  "architectures": null,
12
  "attention_dropout": 0.0,
 
15
  "bos_token_id": 0,
16
  "chunk_size_feed_forward": 0,
17
  "classifier_dropout": 0.0,
18
+ "cross_attention_hidden_size": 768,
19
+ "d_model": 1024,
20
+ "decoder_attention_heads": 16,
21
+ "decoder_ffn_dim": 4096,
22
  "decoder_layerdrop": 0.0,
23
+ "decoder_layers": 12,
24
  "decoder_start_token_id": 2,
25
  "diversity_penalty": 0.0,
26
  "do_sample": false,
 
64
  "repetition_penalty": 1.0,
65
  "return_dict": true,
66
  "return_dict_in_generate": false,
67
+ "scale_embedding": false,
68
  "sep_token_id": null,
69
  "suppress_tokens": null,
70
  "task_specific_params": null,
71
  "temperature": 1.0,
72
  "tf_legacy_loss": false,
73
  "tie_encoder_decoder": false,
74
+ "tie_word_embeddings": true,
75
  "tokenizer_class": null,
76
  "top_k": 50,
77
  "top_p": 1.0,
 
81
  "use_bfloat16": false,
82
  "use_cache": false,
83
  "use_learned_position_embeddings": true,
84
+ "vocab_size": 50265
85
  },
86
  "decoder_start_token_id": 0,
87
  "early_stopping": true,
 
108
  "forced_eos_token_id": null,
109
  "hidden_act": "gelu",
110
  "hidden_dropout_prob": 0.0,
111
+ "hidden_size": 768,
112
  "id2label": {
113
  "0": "LABEL_0",
114
  "1": "LABEL_1"
115
  },
116
  "image_size": 384,
117
  "initializer_range": 0.02,
118
+ "intermediate_size": 3072,
119
  "is_decoder": false,
120
  "is_encoder_decoder": false,
121
  "label2id": {
 
126
  "length_penalty": 1.0,
127
  "max_length": 20,
128
  "min_length": 0,
129
+ "model_type": "vit",
130
  "no_repeat_ngram_size": 0,
131
+ "num_attention_heads": 12,
132
  "num_beam_groups": 1,
133
  "num_beams": 1,
134
  "num_channels": 3,
 
142
  "prefix": null,
143
  "problem_type": null,
144
  "pruned_heads": {},
145
+ "qkv_bias": false,
146
  "remove_invalid_values": false,
147
  "repetition_penalty": 1.0,
148
  "return_dict": true,
 
173
  "tie_word_embeddings": false,
174
  "torch_dtype": "float32",
175
  "transformers_version": "4.37.2",
176
+ "vocab_size": 50265
177
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab21396825da2c05749b63138470d584cf1894d2665aa6b4f03f11600181b618
3
- size 246430696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2176485c60464ed43e6ea87b2e20820e09416310cd571900bb589d6f3937b986
3
+ size 1335747032
preprocessor_config.json CHANGED
@@ -1,9 +1,4 @@
1
  {
2
- "crop_size": {
3
- "height": 224,
4
- "width": 224
5
- },
6
- "do_center_crop": false,
7
  "do_normalize": true,
8
  "do_rescale": true,
9
  "do_resize": true,
@@ -12,13 +7,13 @@
12
  0.5,
13
  0.5
14
  ],
15
- "image_processor_type": "DeiTImageProcessor",
16
  "image_std": [
17
  0.5,
18
  0.5,
19
  0.5
20
  ],
21
- "resample": 3,
22
  "rescale_factor": 0.00392156862745098,
23
  "size": {
24
  "height": 384,
 
1
  {
 
 
 
 
 
2
  "do_normalize": true,
3
  "do_rescale": true,
4
  "do_resize": true,
 
7
  0.5,
8
  0.5
9
  ],
10
+ "image_processor_type": "ViTImageProcessor",
11
  "image_std": [
12
  0.5,
13
  0.5,
14
  0.5
15
  ],
16
+ "resample": 2,
17
  "rescale_factor": 0.00392156862745098,
18
  "size": {
19
  "height": 384,
runs/Apr23_13-15-41_devai/events.out.tfevents.1713878159.devai.1671410.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72db56a933486d3bfff8ddc1a20e65ddc44df3a9fd7a000f3435c0ddec4ff52d
3
- size 39543
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5cdb07707403489099a4810e401f0825c9c2636e14e8ff8bba26480fab3f645
3
+ size 41805
runs/Apr24_03-06-19_devai/events.out.tfevents.1713927982.devai.1955363.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b86a60f8b2e13e4f3b61f6910a2177584eaa25d29568353e1f04be01757212f7
3
+ size 8280
runs/Apr24_03-08-45_devai/events.out.tfevents.1713928128.devai.1955753.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988dde1dcf181fd41a349a5b70f3b23a8fdc9b3c3ea6178d08e84bde839ea9d9
3
+ size 8280
runs/Apr24_03-09-43_devai/events.out.tfevents.1713928186.devai.1956042.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2db3aee3021e02146133b642849a1c63179d71da9430b603f41cf91d46a2b221
3
+ size 8280
runs/Apr24_03-10-37_devai/events.out.tfevents.1713928240.devai.1956278.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5494f78c2644f382361a82460fb63c9b003fac718332557bdc7078216eaa2230
3
+ size 9682
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88bc0f5e73c45520b0025aa402e4a09038a5f619366f21dbb1b7509f3faac844
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c8841bf546d6ddbda5c5ba1380cbd0a9b788a099db5487d6e92d7489a1f0fc3
3
  size 4856