Plachta's picture
Upload 116 files
56a1295 verified
raw
history blame contribute delete
968 Bytes
_target_: default_model.AstralQuantizer
tokenizer_name: "openai/whisper-small"
ssl_model_name: "facebook/hubert-large-ll60k"
ssl_output_layer: 18
encoder:
_target_: modules.convnext.ConvNeXtV2Stage
dim: 512
num_blocks: 12
intermediate_dim: 1536
dilation: 1
input_dim: 1024
quantizer:
_target_: modules.bsq.BinarySphericalQuantize
codebook_size: 32 # codebook size, must be a power of 2
dim: 512
entropy_loss_weight: 0.1
diversity_gamma: 1.0
spherical: True
enable_entropy_loss: True
soft_entropy_loss: True
decoder:
_target_: modules.convnext.ConvNeXtV2Stage
dim: 512
num_blocks: 12
intermediate_dim: 1536
dilation: 1
output_dim: 1024
gin_channels: 192
asr_decoder:
_target_: modules.asr_decoder.ASRDecoder
hidden_dim: 768
num_heads: 12
depth: 12
block_size: 4096
in_channels: 512
n_vocab: 51866
bos_id: 50528
eos_id: 50527
dropout_rate: 0.0
attn_dropout_rate: 0.0