Mahmoud-Nasser committed on
Commit
4805b0a
·
verified ·
1 Parent(s): 94ae1db

End of training

Browse files
Files changed (2) hide show
  1. README.md +17 -15
  2. generation_config.json +18 -24
README.md CHANGED
@@ -3,7 +3,7 @@ library_name: transformers
3
  language:
4
  - ar
5
  license: apache-2.0
6
- base_model: openai/whisper-small
7
  tags:
8
  - generated_from_trainer
9
  datasets:
@@ -11,7 +11,7 @@ datasets:
11
  metrics:
12
  - wer
13
  model-index:
14
- - name: Whisper Small Ar - Sanchit Gandhi
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
@@ -23,18 +23,18 @@ model-index:
23
  metrics:
24
  - name: Wer
25
  type: wer
26
- value: 221.36990801576871
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
- # Whisper Small Ar - Sanchit Gandhi
33
 
34
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the quranic_audio_dataset dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 2.4500
37
- - Wer: 221.3699
38
 
39
  ## Model description
40
 
@@ -59,21 +59,23 @@ The following hyperparameters were used during training:
59
  - seed: 42
60
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
61
  - lr_scheduler_type: linear
62
- - lr_scheduler_warmup_steps: 1
63
- - training_steps: 2
64
  - mixed_precision_training: Native AMP
65
 
66
  ### Training results
67
 
68
- | Training Loss | Epoch | Step | Validation Loss | Wer |
69
- |:-------------:|:------:|:----:|:---------------:|:--------:|
70
- | 2.3047 | 0.0029 | 1 | 2.4500 | 221.3699 |
71
- | 2.6272 | 0.0058 | 2 | 2.4500 | 221.3699 |
 
 
72
 
73
 
74
  ### Framework versions
75
 
76
- - Transformers 4.48.1
77
  - Pytorch 2.5.1+cu124
78
- - Datasets 3.2.0
79
  - Tokenizers 0.21.0
 
3
  language:
4
  - ar
5
  license: apache-2.0
6
+ base_model: openai/whisper-base
7
  tags:
8
  - generated_from_trainer
9
  datasets:
 
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Whisper Base Ar - GPTeam
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
 
23
  metrics:
24
  - name: Wer
25
  type: wer
26
+ value: 29.20499342969777
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
30
  should probably proofread and complete it, then remove this comment. -->
31
 
32
+ # Whisper Base Ar - GPTeam
33
 
34
+ This model is a fine-tuned version of [openai/whisper-base](https://huggingface.co/openai/whisper-base) on the quranic_audio_dataset dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.0527
37
+ - Wer: 29.2050
38
 
39
  ## Model description
40
 
 
59
  - seed: 42
60
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
61
  - lr_scheduler_type: linear
62
+ - lr_scheduler_warmup_steps: 500
63
+ - training_steps: 4000
64
  - mixed_precision_training: Native AMP
65
 
66
  ### Training results
67
 
68
+ | Training Loss | Epoch | Step | Validation Loss | Wer |
69
+ |:-------------:|:-------:|:----:|:---------------:|:-------:|
70
+ | 0.0771 | 2.9240 | 1000 | 0.0722 | 34.2806 |
71
+ | 0.0183 | 5.8480 | 2000 | 0.0553 | 30.8476 |
72
+ | 0.0062 | 8.7719 | 3000 | 0.0527 | 30.7654 |
73
+ | 0.0023 | 11.6959 | 4000 | 0.0527 | 29.2050 |
74
 
75
 
76
  ### Framework versions
77
 
78
+ - Transformers 4.49.0
79
  - Pytorch 2.5.1+cu124
80
+ - Datasets 3.3.2
81
  - Tokenizers 0.21.0
generation_config.json CHANGED
@@ -1,44 +1,36 @@
1
  {
2
  "alignment_heads": [
3
  [
4
- 5,
5
- 3
6
- ],
7
- [
8
- 5,
9
- 9
10
  ],
11
  [
12
- 8,
13
- 0
14
  ],
15
  [
16
- 8,
17
- 4
18
  ],
19
  [
20
- 8,
21
  7
22
  ],
23
  [
24
- 8,
25
- 8
26
- ],
27
- [
28
- 9,
29
- 0
30
  ],
31
  [
32
- 9,
33
- 7
34
  ],
35
  [
36
- 9,
37
- 9
38
  ],
39
  [
40
- 10,
41
- 5
42
  ]
43
  ],
44
  "begin_suppress_tokens": [
@@ -241,6 +233,8 @@
241
  49870,
242
  50254,
243
  50258,
 
 
244
  50360,
245
  50361,
246
  50362
@@ -250,5 +244,5 @@
250
  "transcribe": 50359,
251
  "translate": 50358
252
  },
253
- "transformers_version": "4.48.1"
254
  }
 
1
  {
2
  "alignment_heads": [
3
  [
4
+ 3,
5
+ 1
 
 
 
 
6
  ],
7
  [
8
+ 4,
9
+ 2
10
  ],
11
  [
12
+ 4,
13
+ 3
14
  ],
15
  [
16
+ 4,
17
  7
18
  ],
19
  [
20
+ 5,
21
+ 1
 
 
 
 
22
  ],
23
  [
24
+ 5,
25
+ 2
26
  ],
27
  [
28
+ 5,
29
+ 4
30
  ],
31
  [
32
+ 5,
33
+ 6
34
  ]
35
  ],
36
  "begin_suppress_tokens": [
 
233
  49870,
234
  50254,
235
  50258,
236
+ 50358,
237
+ 50359,
238
  50360,
239
  50361,
240
  50362
 
244
  "transcribe": 50359,
245
  "translate": 50358
246
  },
247
+ "transformers_version": "4.49.0"
248
  }