aufklarer
/

PersonaPlex-7B-MLX-8bit

speech-to-speech

Model card | Files and versions

PersonaPlex-7B-MLX-8bit / config.json

aufklarer's picture

Upload PersonaPlex 7B MLX 8-bit weights

559b161 verified 3 months ago

history blame contribute delete

1.46 kB

	{
	"model_type": "personaplex",
	"version": "personaplex-7b-v1",
	"base_model": "kyutai/moshiko-pytorch-bf16",
	"temporal": {
	"dim": 4096,
	"num_layers": 32,
	"num_heads": 32,
	"hidden_scale": 4.125,
	"n_q": 8,
	"card": 2048,
	"text_card": 32000,
	"context": 3000,
	"max_period": 10000
	},
	"depformer": {
	"dim": 1024,
	"num_layers": 6,
	"num_heads": 16,
	"dim_feedforward": 2816,
	"num_steps": 16,
	"card": 2048,
	"text_card": 32000,
	"context": 8,
	"weights_per_step": true,
	"multi_linear": true
	},
	"mimi": {
	"sample_rate": 24000,
	"frame_rate": 12.5,
	"num_codebooks": 16,
	"codebook_size": 2048,
	"codebook_dim": 256,
	"dimension": 512,
	"seanet_ratios": [
	8,
	6,
	5,
	4
	],
	"transformer_layers": 8
	},
	"sampling": {
	"audio_temp": 0.8,
	"audio_top_k": 250,
	"text_temp": 0.7,
	"text_top_k": 25
	},
	"delays": [
	0,
	0,
	1,
	1,
	1,
	1,
	1,
	1,
	1,
	0,
	1,
	1,
	1,
	1,
	1,
	1,
	1
	],
	"quantization": {
	"bits": 8,
	"group_size": 64,
	"quantized_components": [
	"temporal",
	"depformer"
	]
	},
	"voices": [
	"NATF0",
	"NATF1",
	"NATF2",
	"NATF3",
	"NATM0",
	"NATM1",
	"NATM2",
	"NATM3",
	"VARF0",
	"VARF1",
	"VARF2",
	"VARF3",
	"VARF4",
	"VARM0",
	"VARM1",
	"VARM2",
	"VARM3",
	"VARM4"
	]
	}