Instructions to use aufklarer/PersonaPlex-7B-MLX-8bit with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- MLX
How to use aufklarer/PersonaPlex-7B-MLX-8bit with MLX:
```bash
# Download the model from the Hub
pip install huggingface_hub[hf_xet]
huggingface-cli download --local-dir PersonaPlex-7B-MLX-8bit aufklarer/PersonaPlex-7B-MLX-8bit
```
- Moshi
How to use aufklarer/PersonaPlex-7B-MLX-8bit with Moshi:
```bash
# pip install moshi
# Run the interactive web server
python -m moshi.server --hf-repo "aufklarer/PersonaPlex-7B-MLX-8bit"
# Then open https://localhost:8998 in your browser
```
```python
# pip install moshi
import torch
from moshi.models import loaders

# Load checkpoint info from HuggingFace
checkpoint = loaders.CheckpointInfo.from_hf_repo("aufklarer/PersonaPlex-7B-MLX-8bit")

# Load the Mimi audio codec
mimi = checkpoint.get_mimi(device="cuda")
mimi.set_num_codebooks(8)

# Encode audio (24kHz, mono)
wav = torch.randn(1, 1, 24000 * 10)  # [batch, channels, samples]
with torch.no_grad():
    codes = mimi.encode(wav.cuda())
    decoded = mimi.decode(codes)
```
- Notebooks
- Google Colab
- Kaggle
- Local Apps Settings
- LM Studio
```json
{
  "model_type": "personaplex",
  "version": "personaplex-7b-v1",
  "base_model": "kyutai/moshiko-pytorch-bf16",
  "temporal": {
    "dim": 4096,
    "num_layers": 32,
    "num_heads": 32,
    "hidden_scale": 4.125,
    "n_q": 8,
    "card": 2048,
    "text_card": 32000,
    "context": 3000,
    "max_period": 10000
  },
  "depformer": {
    "dim": 1024,
    "num_layers": 6,
    "num_heads": 16,
    "dim_feedforward": 2816,
    "num_steps": 16,
    "card": 2048,
    "text_card": 32000,
    "context": 8,
    "weights_per_step": true,
    "multi_linear": true
  },
  "mimi": {
    "sample_rate": 24000,
    "frame_rate": 12.5,
    "num_codebooks": 16,
    "codebook_size": 2048,
    "codebook_dim": 256,
    "dimension": 512,
    "seanet_ratios": [
      8,
      6,
      5,
      4
    ],
    "transformer_layers": 8
  },
  "sampling": {
    "audio_temp": 0.8,
    "audio_top_k": 250,
    "text_temp": 0.7,
    "text_top_k": 25
  },
  "delays": [
    0,
    0,
    1,
    1,
    1,
    1,
    1,
    1,
    1,
    0,
    1,
    1,
    1,
    1,
    1,
    1,
    1
  ],
  "quantization": {
    "bits": 8,
    "group_size": 64,
    "quantized_components": [
      "temporal",
      "depformer"
    ]
  },
  "voices": [
    "NATF0",
    "NATF1",
    "NATF2",
    "NATF3",
    "NATM0",
    "NATM1",
    "NATM2",
    "NATM3",
    "VARF0",
    "VARF1",
    "VARF2",
    "VARF3",
    "VARF4",
    "VARM0",
    "VARM1",
    "VARM2",
    "VARM3",
    "VARM4"
  ]
}
```