Upload optimized ONNX model

#2
opened by Xenova (HF Staff)
.gitattributes CHANGED
@@ -36,3 +36,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
36
  onnx/audio_encoder.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
38
  onnx/embed_tokens.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
 
 
36
  onnx/audio_encoder.onnx_data filter=lfs diff=lfs merge=lfs -text
37
  onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
38
  onnx/embed_tokens.onnx_data filter=lfs diff=lfs merge=lfs -text
39
+ onnx/audio_encoder_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
+ onnx/decoder_model_merged_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
41
+ onnx/embed_tokens_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -82,8 +82,19 @@
82
  },
83
  "tie_word_embeddings": false,
84
  "transformers.js_config": {
85
- "use_external_data_format": true
 
 
 
 
 
 
 
 
 
 
 
86
  },
87
  "transformers_version": "5.3.0.dev0",
88
  "window_size": 3
89
- }
 
82
  },
83
  "tie_word_embeddings": false,
84
  "transformers.js_config": {
85
+ "use_external_data_format": {
86
+ "audio_encoder.onnx": 1,
87
+ "decoder_model_merged.onnx": 1,
88
+ "embed_tokens.onnx": 1,
89
+ "audio_encoder_fp16.onnx": 1,
90
+ "decoder_model_merged_fp16.onnx": 1,
91
+ "embed_tokens_fp16.onnx": 1
92
+ },
93
+ "kv_cache_dtype": {
94
+ "q4f16": "float16",
95
+ "fp16": "float16"
96
+ }
97
  },
98
  "transformers_version": "5.3.0.dev0",
99
  "window_size": 3
100
+ }
onnx/audio_encoder_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a82b08bef7d8c5b889d5a2c4d1bdd8e09c753210c12395b5c12985f5e1ab73e
3
+ size 41180
onnx/audio_encoder_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34b14dae33ad843406069e9ef058d8fe96db995f9223a526f168d7ab36920c92
3
+ size 154880
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e528e10b4e97bdc6b725d7b894e287f491928ac59b7ad2e4b31860fa7cb4f37
3
- size 20767
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc0ffbeb6b873be83661f6bed70710c3e163bf0111afe7bbd984b3cbedf429c3
3
+ size 22737
onnx/decoder_model_merged.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64eb4cd2b3a4f2f20ae8ec8d88b5d415ab2f5a76ed76c91ff51c38669f26d052
3
  size 26099968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b93639166c0d75cf64249e4de751e865bb00a1dc0244621165bf4bcf69bb0067
3
  size 26099968
onnx/decoder_model_merged_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bc35a3e58316e52cd38f1cf45b76234972f027bd56eebc525c7f8413d7a4e66
3
+ size 22412
onnx/decoder_model_merged_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32a4bb6f12e707aef2a4df8bc53203cf49c487c0229d33e9e420408df47b739d
3
+ size 13049984
onnx/embed_tokens_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3c50291ffe938492d3fceaeea5b0351882bf16ff107c0606ee21bf960340648
3
+ size 632
onnx/embed_tokens_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1f377c2543fadd03b5404117dc40ecc2159f7760a48e7e551bd45a4d43cc5c
3
+ size 12845184
processor_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "melspec_kwargs": {
5
  "hop_length": 160,
6
  "n_fft": 512,
7
- "n_mels": 8,
8
  "sample_rate": 16000,
9
  "win_length": 400
10
  },
 
4
  "melspec_kwargs": {
5
  "hop_length": 160,
6
  "n_fft": 512,
7
+ "n_mels": 80,
8
  "sample_rate": 16000,
9
  "win_length": 400
10
  },