Training in progress, step 100
Browse files
- config.json +1 -1
- model.safetensors +1 -1
- run_cmn.sh +10 -10
- runs/Jan23_05-57-07_ip-172-31-68-44/events.out.tfevents.1705989446.ip-172-31-68-44.20295.0 +3 -0
- tokenizer.json +6 -6
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "qanastek/whisper-small-french-uncased",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 966995080
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3622ab230d796bea00496f6ee443c80ebb2a7d176777ff4817c17d1c4347bb50
|
3 |
size 966995080
|
run_cmn.sh
CHANGED
@@ -1,23 +1,23 @@
|
|
1 |
python3 run_speech_recognition_seq2seq_streaming.py \
|
2 |
-
--model_name_or_path="
|
3 |
--dataset_name="mozilla-foundation/common_voice_16_0" \
|
4 |
-
--dataset_config_name="
|
5 |
-
--language="
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
-
--model_index_name="Whisper Base
|
9 |
-
--max_steps="
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="16" \
|
12 |
-
--per_device_eval_batch_size="
|
13 |
--gradient_accumulation_steps=4 \
|
14 |
--logging_steps="25" \
|
15 |
-
--learning_rate="
|
16 |
-
--warmup_steps="
|
17 |
--evaluation_strategy="steps" \
|
18 |
-
--eval_steps="
|
19 |
--save_strategy="steps" \
|
20 |
-
--save_steps="
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
|
|
1 |
python3 run_speech_recognition_seq2seq_streaming.py \
|
2 |
+
--model_name_or_path="qanastek/whisper-small-french-uncased" \
|
3 |
--dataset_name="mozilla-foundation/common_voice_16_0" \
|
4 |
+
--dataset_config_name="fr" \
|
5 |
+
--language="french" \
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
+
--model_index_name="Whisper Base French" \
|
9 |
+
--max_steps="1000" \
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="16" \
|
12 |
+
--per_device_eval_batch_size="32" \
|
13 |
--gradient_accumulation_steps=4 \
|
14 |
--logging_steps="25" \
|
15 |
+
--learning_rate="5e-7" \
|
16 |
+
--warmup_steps="100" \
|
17 |
--evaluation_strategy="steps" \
|
18 |
+
--eval_steps="100" \
|
19 |
--save_strategy="steps" \
|
20 |
+
--save_steps="100" \
|
21 |
--generation_max_length="225" \
|
22 |
--length_column_name="input_length" \
|
23 |
--max_duration_in_seconds="30" \
|
runs/Jan23_05-57-07_ip-172-31-68-44/events.out.tfevents.1705989446.ip-172-31-68-44.20295.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0486f429675408de46cc06040fcd0b4163ab6cde2d89a5eebc319fd79fdd9b7f
|
3 |
+
size 6071
|
tokenizer.json
CHANGED
@@ -985,7 +985,7 @@
|
|
985 |
},
|
986 |
{
|
987 |
"SpecialToken": {
|
988 |
-
"id": "<|
|
989 |
"type_id": 0
|
990 |
}
|
991 |
},
|
@@ -1023,7 +1023,7 @@
|
|
1023 |
},
|
1024 |
{
|
1025 |
"SpecialToken": {
|
1026 |
-
"id": "<|
|
1027 |
"type_id": 0
|
1028 |
}
|
1029 |
},
|
@@ -1068,13 +1068,13 @@
|
|
1068 |
"<|endoftext|>"
|
1069 |
]
|
1070 |
},
|
1071 |
-
"<|
|
1072 |
-
"id": "<|
|
1073 |
"ids": [
|
1074 |
-
|
1075 |
],
|
1076 |
"tokens": [
|
1077 |
-
"<|
|
1078 |
]
|
1079 |
},
|
1080 |
"<|notimestamps|>": {
|
|
|
985 |
},
|
986 |
{
|
987 |
"SpecialToken": {
|
988 |
+
"id": "<|fr|>",
|
989 |
"type_id": 0
|
990 |
}
|
991 |
},
|
|
|
1023 |
},
|
1024 |
{
|
1025 |
"SpecialToken": {
|
1026 |
+
"id": "<|fr|>",
|
1027 |
"type_id": 0
|
1028 |
}
|
1029 |
},
|
|
|
1068 |
"<|endoftext|>"
|
1069 |
]
|
1070 |
},
|
1071 |
+
"<|fr|>": {
|
1072 |
+
"id": "<|fr|>",
|
1073 |
"ids": [
|
1074 |
+
50265
|
1075 |
],
|
1076 |
"tokens": [
|
1077 |
+
"<|fr|>"
|
1078 |
]
|
1079 |
},
|
1080 |
"<|notimestamps|>": {
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c402a950cc7e208f84081823c51369e4011a49eb775a25599d930a6775401c83
|
3 |
size 4792
|