Spaces:
Running
on
Zero
Running
on
Zero
| _target_: default_model.AstralQuantizer | |
| tokenizer_name: "openai/whisper-small" | |
| ssl_model_name: "facebook/hubert-large-ll60k" | |
| ssl_output_layer: 18 | |
| encoder: | |
| _target_: modules.convnext.ConvNeXtV2Stage | |
| dim: 512 | |
| num_blocks: 12 | |
| intermediate_dim: 1536 | |
| dilation: 1 | |
| input_dim: 1024 | |
| quantizer: | |
| _target_: modules.bsq.BinarySphericalQuantize | |
| codebook_size: 32 # codebook size, must be a power of 2 | |
| dim: 512 | |
| entropy_loss_weight: 0.1 | |
| diversity_gamma: 1.0 | |
| spherical: True | |
| enable_entropy_loss: True | |
| soft_entropy_loss: True | |
| decoder: | |
| _target_: modules.convnext.ConvNeXtV2Stage | |
| dim: 512 | |
| num_blocks: 12 | |
| intermediate_dim: 1536 | |
| dilation: 1 | |
| output_dim: 1024 | |
| gin_channels: 192 | |
| asr_decoder: | |
| _target_: modules.asr_decoder.ASRDecoder | |
| hidden_dim: 768 | |
| num_heads: 12 | |
| depth: 12 | |
| block_size: 4096 | |
| in_channels: 512 | |
| n_vocab: 51866 | |
| bos_id: 50528 | |
| eos_id: 50527 | |
| dropout_rate: 0.0 | |
| attn_dropout_rate: 0.0 |