akhooli committed on
Commit
141d84d
·
verified ·
1 Parent(s): 6533672

End of training

Browse files
README.md CHANGED
@@ -5,7 +5,7 @@ base_model: openai/whisper-small
5
  tags:
6
  - generated_from_trainer
7
  datasets:
8
- - common_voice_17_0
9
  metrics:
10
  - wer
11
  model-index:
@@ -15,8 +15,8 @@ model-index:
15
  name: Automatic Speech Recognition
16
  type: automatic-speech-recognition
17
  dataset:
18
- name: common_voice_17_0
19
- type: common_voice_17_0
20
  config: ar
21
  split: None
22
  args: ar
@@ -31,7 +31,7 @@ should probably proofread and complete it, then remove this comment. -->
31
 
32
  # whisper-small-dar
33
 
34
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the common_voice_17_0 dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.1813
37
  - Wer: 0.3367
 
5
  tags:
6
  - generated_from_trainer
7
  datasets:
8
+ - mozilla-foundation/common_voice_17_0
9
  metrics:
10
  - wer
11
  model-index:
 
15
  name: Automatic Speech Recognition
16
  type: automatic-speech-recognition
17
  dataset:
18
+ name: mozilla-foundation/common_voice_17_0 ar
19
+ type: mozilla-foundation/common_voice_17_0
20
  config: ar
21
  split: None
22
  args: ar
 
31
 
32
  # whisper-small-dar
33
 
34
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the mozilla-foundation/common_voice_17_0 ar dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.1813
37
  - Wer: 0.3367
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 100.0,
3
- "eval_loss": 1.3785362243652344,
4
- "eval_runtime": 12.5874,
5
- "eval_samples": 33,
6
- "eval_samples_per_second": 2.622,
7
- "eval_steps_per_second": 0.159,
8
- "eval_wer": 0.7520215633423181,
9
- "total_flos": 4.617366645252293e+18,
10
- "train_loss": 0.04933440090715885,
11
- "train_runtime": 2429.6725,
12
- "train_samples": 148,
13
- "train_samples_per_second": 6.585,
14
- "train_steps_per_second": 0.206
15
  }
 
1
  {
2
+ "epoch": 2.9673590504451037,
3
+ "eval_loss": 0.18132926523685455,
4
+ "eval_runtime": 479.53,
5
+ "eval_samples": 2296,
6
+ "eval_samples_per_second": 4.788,
7
+ "eval_steps_per_second": 0.15,
8
+ "eval_wer": 0.3367421033522934,
9
+ "total_flos": 9.234732878187725e+18,
10
+ "train_loss": 0.21518024158477783,
11
+ "train_runtime": 7211.1645,
12
+ "train_samples": 10777,
13
+ "train_samples_per_second": 4.438,
14
+ "train_steps_per_second": 0.139
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 100.0,
3
- "eval_loss": 1.3785362243652344,
4
- "eval_runtime": 12.5874,
5
- "eval_samples": 33,
6
- "eval_samples_per_second": 2.622,
7
- "eval_steps_per_second": 0.159,
8
- "eval_wer": 0.7520215633423181
9
  }
 
1
  {
2
+ "epoch": 2.9673590504451037,
3
+ "eval_loss": 0.18132926523685455,
4
+ "eval_runtime": 479.53,
5
+ "eval_samples": 2296,
6
+ "eval_samples_per_second": 4.788,
7
+ "eval_steps_per_second": 0.15,
8
+ "eval_wer": 0.3367421033522934
9
  }
runs/Dec26_16-38-08_83479bdb9181/events.out.tfevents.1735239794.83479bdb9181.76.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b6a8858bb33d35fb0224836209866907cc9edb98d4f86800ccc1280b2194d02
3
+ size 406
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 100.0,
3
- "total_flos": 4.617366645252293e+18,
4
- "train_loss": 0.04933440090715885,
5
- "train_runtime": 2429.6725,
6
- "train_samples": 148,
7
- "train_samples_per_second": 6.585,
8
- "train_steps_per_second": 0.206
9
  }
 
1
  {
2
+ "epoch": 2.9673590504451037,
3
+ "total_flos": 9.234732878187725e+18,
4
+ "train_loss": 0.21518024158477783,
5
+ "train_runtime": 7211.1645,
6
+ "train_samples": 10777,
7
+ "train_samples_per_second": 4.438,
8
+ "train_steps_per_second": 0.139
9
  }
trainer_state.json CHANGED
@@ -1,86 +1,142 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 100.0,
5
- "eval_steps": 100,
6
- "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 20.0,
13
- "eval_loss": 1.218579649925232,
14
- "eval_runtime": 12.9357,
15
- "eval_samples_per_second": 2.551,
16
- "eval_steps_per_second": 0.155,
17
- "eval_wer": 0.7466307277628033,
18
  "step": 100
19
  },
20
  {
21
- "epoch": 40.0,
22
- "eval_loss": 1.3031549453735352,
23
- "eval_runtime": 12.9001,
24
- "eval_samples_per_second": 2.558,
25
- "eval_steps_per_second": 0.155,
26
- "eval_wer": 0.7358490566037735,
27
  "step": 200
28
  },
29
  {
30
- "epoch": 50.0,
31
- "grad_norm": 0.009337667375802994,
32
- "learning_rate": 5.6444444444444445e-06,
33
- "loss": 0.0984,
34
- "step": 250
 
 
35
  },
36
  {
37
- "epoch": 60.0,
38
- "eval_loss": 1.348648190498352,
39
- "eval_runtime": 12.4824,
40
- "eval_samples_per_second": 2.644,
41
- "eval_steps_per_second": 0.16,
42
- "eval_wer": 0.7466307277628033,
43
  "step": 300
44
  },
45
  {
46
- "epoch": 80.0,
47
- "eval_loss": 1.371259093284607,
48
- "eval_runtime": 12.6242,
49
- "eval_samples_per_second": 2.614,
50
- "eval_steps_per_second": 0.158,
51
- "eval_wer": 0.7520215633423181,
52
  "step": 400
53
  },
54
  {
55
- "epoch": 100.0,
56
- "grad_norm": 0.006098776590079069,
57
- "learning_rate": 8.88888888888889e-08,
58
- "loss": 0.0003,
59
- "step": 500
 
 
60
  },
61
  {
62
- "epoch": 100.0,
63
- "eval_loss": 1.3785362243652344,
64
- "eval_runtime": 12.7001,
65
- "eval_samples_per_second": 2.598,
66
- "eval_steps_per_second": 0.157,
67
- "eval_wer": 0.7520215633423181,
68
  "step": 500
69
  },
70
  {
71
- "epoch": 100.0,
72
- "step": 500,
73
- "total_flos": 4.617366645252293e+18,
74
- "train_loss": 0.04933440090715885,
75
- "train_runtime": 2429.6725,
76
- "train_samples_per_second": 6.585,
77
- "train_steps_per_second": 0.206
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  }
79
  ],
80
- "logging_steps": 250,
81
- "max_steps": 500,
82
  "num_input_tokens_seen": 0,
83
- "num_train_epochs": 100,
84
  "save_steps": 500,
85
  "stateful_callbacks": {
86
  "TrainerControl": {
@@ -94,7 +150,7 @@
94
  "attributes": {}
95
  }
96
  },
97
- "total_flos": 4.617366645252293e+18,
98
  "train_batch_size": 16,
99
  "trial_name": null,
100
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.9673590504451037,
5
+ "eval_steps": 200,
6
+ "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.29673590504451036,
13
+ "grad_norm": 4.922755241394043,
14
+ "learning_rate": 9.600000000000001e-06,
15
+ "loss": 0.6132,
 
 
16
  "step": 100
17
  },
18
  {
19
+ "epoch": 0.5934718100890207,
20
+ "grad_norm": 4.277930736541748,
21
+ "learning_rate": 8.933333333333333e-06,
22
+ "loss": 0.303,
 
 
23
  "step": 200
24
  },
25
  {
26
+ "epoch": 0.5934718100890207,
27
+ "eval_loss": 0.24335336685180664,
28
+ "eval_runtime": 493.5362,
29
+ "eval_samples_per_second": 4.652,
30
+ "eval_steps_per_second": 0.146,
31
+ "eval_wer": 0.4226068014038485,
32
+ "step": 200
33
  },
34
  {
35
+ "epoch": 0.8902077151335311,
36
+ "grad_norm": 4.590033054351807,
37
+ "learning_rate": 7.822222222222224e-06,
38
+ "loss": 0.2564,
 
 
39
  "step": 300
40
  },
41
  {
42
+ "epoch": 1.1869436201780414,
43
+ "grad_norm": 3.3569984436035156,
44
+ "learning_rate": 6.711111111111111e-06,
45
+ "loss": 0.2,
 
 
46
  "step": 400
47
  },
48
  {
49
+ "epoch": 1.1869436201780414,
50
+ "eval_loss": 0.20352379977703094,
51
+ "eval_runtime": 482.7378,
52
+ "eval_samples_per_second": 4.756,
53
+ "eval_steps_per_second": 0.149,
54
+ "eval_wer": 0.39138327483964663,
55
+ "step": 400
56
  },
57
  {
58
+ "epoch": 1.4836795252225519,
59
+ "grad_norm": 3.2953569889068604,
60
+ "learning_rate": 5.600000000000001e-06,
61
+ "loss": 0.1637,
 
 
62
  "step": 500
63
  },
64
  {
65
+ "epoch": 1.7804154302670623,
66
+ "grad_norm": 3.363754987716675,
67
+ "learning_rate": 4.488888888888889e-06,
68
+ "loss": 0.1633,
69
+ "step": 600
70
+ },
71
+ {
72
+ "epoch": 1.7804154302670623,
73
+ "eval_loss": 0.18764939904212952,
74
+ "eval_runtime": 484.1747,
75
+ "eval_samples_per_second": 4.742,
76
+ "eval_steps_per_second": 0.149,
77
+ "eval_wer": 0.3469079026987777,
78
+ "step": 600
79
+ },
80
+ {
81
+ "epoch": 2.077151335311573,
82
+ "grad_norm": 2.2284867763519287,
83
+ "learning_rate": 3.377777777777778e-06,
84
+ "loss": 0.1428,
85
+ "step": 700
86
+ },
87
+ {
88
+ "epoch": 2.373887240356083,
89
+ "grad_norm": 2.0610995292663574,
90
+ "learning_rate": 2.266666666666667e-06,
91
+ "loss": 0.106,
92
+ "step": 800
93
+ },
94
+ {
95
+ "epoch": 2.373887240356083,
96
+ "eval_loss": 0.18498285114765167,
97
+ "eval_runtime": 480.7097,
98
+ "eval_samples_per_second": 4.776,
99
+ "eval_steps_per_second": 0.15,
100
+ "eval_wer": 0.3487837347210456,
101
+ "step": 800
102
+ },
103
+ {
104
+ "epoch": 2.6706231454005933,
105
+ "grad_norm": 2.554095983505249,
106
+ "learning_rate": 1.1555555555555556e-06,
107
+ "loss": 0.1029,
108
+ "step": 900
109
+ },
110
+ {
111
+ "epoch": 2.9673590504451037,
112
+ "grad_norm": 2.727163314819336,
113
+ "learning_rate": 4.444444444444445e-08,
114
+ "loss": 0.1005,
115
+ "step": 1000
116
+ },
117
+ {
118
+ "epoch": 2.9673590504451037,
119
+ "eval_loss": 0.18132926523685455,
120
+ "eval_runtime": 479.4261,
121
+ "eval_samples_per_second": 4.789,
122
+ "eval_steps_per_second": 0.15,
123
+ "eval_wer": 0.3367421033522934,
124
+ "step": 1000
125
+ },
126
+ {
127
+ "epoch": 2.9673590504451037,
128
+ "step": 1000,
129
+ "total_flos": 9.234732878187725e+18,
130
+ "train_loss": 0.21518024158477783,
131
+ "train_runtime": 7211.1645,
132
+ "train_samples_per_second": 4.438,
133
+ "train_steps_per_second": 0.139
134
  }
135
  ],
136
+ "logging_steps": 100,
137
+ "max_steps": 1000,
138
  "num_input_tokens_seen": 0,
139
+ "num_train_epochs": 3,
140
  "save_steps": 500,
141
  "stateful_callbacks": {
142
  "TrainerControl": {
 
150
  "attributes": {}
151
  }
152
  },
153
+ "total_flos": 9.234732878187725e+18,
154
  "train_batch_size": 16,
155
  "trial_name": null,
156
  "trial_params": null