cormerod committed on
Commit
db88c26
·
verified ·
1 Parent(s): 2a9ccae

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distil-whisper/distil-large-v3",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -10,18 +10,32 @@
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
- "d_model": 1280,
14
- "decoder_attention_heads": 20,
15
- "decoder_ffn_dim": 5120,
16
  "decoder_layerdrop": 0.0,
17
- "decoder_layers": 2,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
- "encoder_attention_heads": 20,
21
- "encoder_ffn_dim": 5120,
22
  "encoder_layerdrop": 0.0,
23
- "encoder_layers": 32,
24
  "eos_token_id": 50257,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  "init_std": 0.02,
26
  "is_encoder_decoder": true,
27
  "mask_feature_length": 10,
@@ -35,13 +49,13 @@
35
  "max_target_positions": 448,
36
  "median_filter_width": 7,
37
  "model_type": "whisper",
38
- "num_hidden_layers": 32,
39
- "num_mel_bins": 128,
40
- "pad_token_id": 50256,
41
  "scale_embedding": false,
42
  "torch_dtype": "float32",
43
  "transformers_version": "4.48.0",
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
- "vocab_size": 51866
47
  }
 
1
  {
2
+ "_name_or_path": "openai/whisper-tiny",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
10
  "begin_suppress_tokens": null,
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
+ "d_model": 384,
14
+ "decoder_attention_heads": 6,
15
+ "decoder_ffn_dim": 1536,
16
  "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 4,
18
  "decoder_start_token_id": 50258,
19
  "dropout": 0.0,
20
+ "encoder_attention_heads": 6,
21
+ "encoder_ffn_dim": 1536,
22
  "encoder_layerdrop": 0.0,
23
+ "encoder_layers": 4,
24
  "eos_token_id": 50257,
25
+ "forced_decoder_ids": [
26
+ [
27
+ 1,
28
+ 50259
29
+ ],
30
+ [
31
+ 2,
32
+ 50359
33
+ ],
34
+ [
35
+ 3,
36
+ 50363
37
+ ]
38
+ ],
39
  "init_std": 0.02,
40
  "is_encoder_decoder": true,
41
  "mask_feature_length": 10,
 
49
  "max_target_positions": 448,
50
  "median_filter_width": 7,
51
  "model_type": "whisper",
52
+ "num_hidden_layers": 4,
53
+ "num_mel_bins": 80,
54
+ "pad_token_id": 50257,
55
  "scale_embedding": false,
56
  "torch_dtype": "float32",
57
  "transformers_version": "4.48.0",
58
  "use_cache": true,
59
  "use_weighted_layer_sum": false,
60
+ "vocab_size": 51865
61
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a69adb0c0abc466816efeba6d8f8e9cf86310f364aaa418ef5c5d8c64264ada
3
- size 3025686376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:412646c1aa1f8220c4c911258bc5cb7a8911b2a081b722ac2a4a5bbbfb148b86
3
+ size 151061672
preprocessor_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "chunk_length": 30,
3
  "feature_extractor_type": "WhisperFeatureExtractor",
4
- "feature_size": 128,
5
  "hop_length": 160,
6
  "n_fft": 400,
7
  "n_samples": 480000,
 
1
  {
2
  "chunk_length": 30,
3
  "feature_extractor_type": "WhisperFeatureExtractor",
4
+ "feature_size": 80,
5
  "hop_length": 160,
6
  "n_fft": 400,
7
  "n_samples": 480000,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:572ad06e90352905c554829c1a4e4ce912912ed596fe27cff1185bc17e9a1252
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02edb69986dbfaf8e07afb972b2135a2c10a9458f42fcc07ede4b26b55f9f081
3
  size 5432