Automatic Speech Recognition
MLX
Safetensors
English
Chinese
mega_asr
speech-to-text
asr
robust-asr
qwen3-asr
Instructions to use mlx-community/Mega-ASR-bf16 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- MLX
How to use mlx-community/Mega-ASR-bf16 with MLX:
```bash
# Download the model from the Hub
pip install "huggingface_hub[hf_xet]"
huggingface-cli download --local-dir Mega-ASR-bf16 mlx-community/Mega-ASR-bf16
```
- Notebooks
- Google Colab
- Kaggle
- Local Apps
- LM Studio
```json
{
  "model_type": "mega_asr",
  "model_repo": null,
  "audio_token_id": 151676,
  "audio_start_token_id": 151669,
  "audio_end_token_id": 151670,
  "support_languages": [
    "Chinese",
    "English",
    "Cantonese",
    "Arabic",
    "German",
    "French",
    "Spanish",
    "Portuguese",
    "Indonesian",
    "Italian",
    "Korean",
    "Russian",
    "Thai",
    "Vietnamese",
    "Japanese",
    "Turkish",
    "Hindi",
    "Malay",
    "Dutch",
    "Swedish",
    "Danish",
    "Finnish",
    "Polish",
    "Czech",
    "Filipino",
    "Persian",
    "Greek",
    "Romanian",
    "Hungarian",
    "Macedonian"
  ],
  "audio_config": {
    "num_mel_bins": 128,
    "encoder_layers": 24,
    "encoder_attention_heads": 16,
    "encoder_ffn_dim": 4096,
    "d_model": 1024,
    "dropout": 0,
    "attention_dropout": 0,
    "activation_function": "gelu",
    "activation_dropout": 0,
    "scale_embedding": false,
    "initializer_range": 0.02,
    "max_source_positions": 1500,
    "n_window": 50,
    "output_dim": 2048,
    "n_window_infer": 800,
    "conv_chunksize": 500,
    "downsample_hidden_size": 480
  },
  "text_config": {
    "model_type": "qwen3",
    "vocab_size": 151936,
    "hidden_size": 2048,
    "intermediate_size": 6144,
    "num_hidden_layers": 28,
    "num_attention_heads": 16,
    "num_key_value_heads": 8,
    "head_dim": 128,
    "hidden_act": "silu",
    "max_position_embeddings": 65536,
    "initializer_range": 0.02,
    "rms_norm_eps": 1e-06,
    "use_cache": true,
    "tie_word_embeddings": true,
    "rope_theta": 1000000,
    "rope_scaling": {
      "interleaved": true,
      "mrope_interleaved": true,
      "mrope_section": [
        24,
        20,
        20
      ],
      "rope_type": "default",
      "type": "default"
    },
    "attention_bias": false,
    "attention_dropout": 0.0
  },
  "router_config": {
    "d_model": 256,
    "nhead": 4,
    "dim_feedforward": 1024,
    "num_layers": 1,
    "n_mels": 80,
    "max_len": 850
  },
  "router_weights": "extras/router.safetensors",
  "lora_weights": "extras/lora.safetensors"
}
```