{ "dim": 5120, "eps": 1e-06, "ffn_dim": 13824, "freq_dim": 256, "in_dim": 36, "legacy_audio_cross_attn": true, "model_type": "a2v_af", "num_heads": 40, "num_layers": 40, "out_dim": 16, "audio_output_dim": 768, "norm_output_audio": true, "text_len": 512, "use_concat_attention": true }