Files
novafarma/ai_voice_gen/install_vibevoice_rtx.sh

51 lines
1.7 KiB
Bash
Executable File

#!/bin/bash
# Install script for Microsoft VibeVoice on Nvidia RTX (Windows/Linux via WSL/Bash)
#
# What it does, in order:
#   1. Creates ./VibeVoice_RTX and enters it.
#   2. Clones the VibeVoice repository (skipped if ./VibeVoice already exists).
#   3. Creates and activates a Python virtual environment in ./venv.
#   4. Installs PyTorch from the CUDA 12.1 wheel index.
#   5. Installs Flash Attention and the remaining Python dependencies.
#   6. Downloads the VibeVoice-1.5B model into ./models.
#   7. Creates a stub custom_generate/generate.py if the model has none.
#
# Usage: run from the directory that should contain VibeVoice_RTX/.
# Requires: git, python3 (with the venv module), network access.

# Fail fast: without this a failed cd/clone/pip step was silently ignored and
# the script still printed "Setup Complete!".
set -euo pipefail

readonly WORK_DIR="VibeVoice_RTX"
readonly REPO_URL="https://github.com/vibevoice-community/VibeVoice.git"
readonly REPO_DIR="VibeVoice"
readonly MODEL_ID="microsoft/VibeVoice-1.5B"
readonly MODEL_DIR="models/VibeVoice-1.5B"
readonly STUB_DIR="${MODEL_DIR}/custom_generate"

# Print an error message to stderr and abort the installation.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

# Report where an unexpected failure happened before set -e terminates us.
trap 'printf "ERROR: setup aborted at line %s\n" "$LINENO" >&2' ERR

# Preflight: both tools are used unconditionally below.
command -v git >/dev/null 2>&1 || die "git is required but was not found in PATH"
command -v python3 >/dev/null 2>&1 || die "python3 is required but was not found in PATH"

echo "🚀 Starting VibeVoice Setup for Nvidia RTX..."

# 1. Create Directory
mkdir -p "${WORK_DIR}"
cd "${WORK_DIR}" || die "cannot enter ${WORK_DIR}"

# 2. Clone Repository
echo "📦 Cloning VibeVoice repository..."
if [[ ! -d "${REPO_DIR}" ]]; then
  git clone "${REPO_URL}"
fi
cd "${REPO_DIR}" || die "cannot enter ${REPO_DIR}"

# 3. Setup Python Environment
echo "🐍 Setting up Python environment..."
python3 -m venv venv
[[ -f venv/bin/activate ]] || die "venv/bin/activate was not created"
# Activation scripts may read unset variables; relax nounset only while sourcing.
set +u
# shellcheck disable=SC1091 — generated at runtime by 'python3 -m venv'
source venv/bin/activate
set -u

# 4. Install PyTorch with CUDA 12.1
echo "📥 Installing PyTorch with CUDA support..."
pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121

# 5. Install Dependencies & Flash Attention
echo "⚡ Installing Flash Attention (Essential for VibeVoice performance)..."
pip install packaging ninja
# --no-build-isolation lets the build see the torch installed in step 4.
pip install flash-attn --no-build-isolation

echo "📥 Installing usage dependencies..."
pip install diffusers datasets peft numba ml-collections absl-py av aiortc gradio
# The cloned repository is not guaranteed to ship a requirements.txt; skip the
# step with a warning instead of aborting the whole installation.
if [[ -f requirements.txt ]]; then
  pip install -r requirements.txt
else
  printf 'warning: requirements.txt not found in %s, skipping\n' "${REPO_DIR}" >&2
fi

# 6. Download Model
echo "💾 Downloading VibeVoice-1.5B Model..."
pip install huggingface_hub
# NOTE(review): newer huggingface_hub releases may deprecate
# --local-dir-use-symlinks; confirm against the installed version.
huggingface-cli download "${MODEL_ID}" --local-dir "${MODEL_DIR}" --local-dir-use-symlinks False

# 7. Apply Fix for "custom_generate/generate.py not found" error
echo "🔧 Applying fix for missing generation config..."
mkdir -p "${STUB_DIR}"
touch "${STUB_DIR}/__init__.py"
# Only write the no-op stub when no (non-empty) generate.py is present, so a
# real implementation delivered with the model is never overwritten.
if [[ ! -s "${STUB_DIR}/generate.py" ]]; then
  printf '%s\n' "def generate(*args, **kwargs): pass" > "${STUB_DIR}/generate.py"
fi

echo "✅ Setup Complete!"
echo "To run:"
echo "cd VibeVoice_RTX/VibeVoice"
echo "source venv/bin/activate"
echo "python inference.py --model_path models/VibeVoice-1.5B"