Moshi: how to use kyutai/moshika-pytorch-bf16 with the Moshi library:
# Prerequisite: pip install moshi
# Run the interactive web server, pointing it at the Hugging Face repo to load
python -m moshi.server --hf-repo "kyutai/moshika-pytorch-bf16"
# Then open https://localhost:8998 in your browser
# Python API usage (prerequisite: pip install moshi)
import torch
from moshi.models import loaders
# Load checkpoint info from HuggingFace
checkpoint = loaders.CheckpointInfo.from_hf_repo("kyutai/moshika-pytorch-bf16")

# Pick the device once so the codec and the input tensor always live on the
# same device; fall back to CPU when no CUDA device is available.
device = "cuda" if torch.cuda.is_available() else "cpu"

# Load the Mimi audio codec and configure it to use 8 codebooks
mimi = checkpoint.get_mimi(device=device)
mimi.set_num_codebooks(8)

# Encode audio (24kHz, mono). Random noise stands in for a real waveform here.
sample_rate = 24000
duration_s = 10
wav = torch.randn(1, 1, sample_rate * duration_s)  # [batch, channels, samples]

# Inference only: no gradients are needed for an encode/decode round trip.
with torch.no_grad():
    codes = mimi.encode(wav.to(device))
    decoded = mimi.decode(codes)