Add vLLM plugin support for high-performance ASR serving

This commit is contained in:
YingboHAO
2026-01-23 17:32:24 +00:00
parent c0c2af984e
commit 4df5b0582f
10 changed files with 2545 additions and 2 deletions
+23
View File
@@ -0,0 +1,23 @@
#!/bin/bash
#
# Install system dependencies for VibeVoice vLLM plugin.
#
# Run this script inside the vLLM container before using the plugin.
# It drives apt-get, so it needs an apt-based image and root privileges.
#
# Packages installed: ffmpeg, libsndfile1, git.
#
# Environment:
#   DEBIAN_FRONTEND  Defaults to "noninteractive" when unset or empty; an
#                    explicitly exported value is left untouched.
#
# Exit status: 0 on success, non-zero if a precondition or apt-get step fails.

set -euo pipefail

# Print an error message to stderr and abort with a non-zero status.
die() {
  printf 'Error: %s\n' "$*" >&2
  exit 1
}

# Fail early with a readable message instead of an opaque apt error.
command -v apt-get >/dev/null 2>&1 \
  || die "apt-get not found; this script requires an apt-based system."
(( EUID == 0 )) \
  || die "this script must be run as root (apt-get needs to modify system packages)."

# Keep debconf from opening interactive prompts: nothing can answer them
# during an unattended container setup, and the install would hang.
export DEBIAN_FRONTEND="${DEBIAN_FRONTEND:-noninteractive}"

echo "Installing system dependencies for VibeVoice vLLM plugin..."

# Refresh the package index so the install below resolves current versions.
apt-get update

# FFmpeg and libsndfile for audio handling, plus git.
apt-get install -y \
  ffmpeg \
  libsndfile1 \
  git

echo "✅ System dependencies installed successfully!"
echo ""
echo "Next steps:"
echo " 1. Install VibeVoice: pip install -e .[vllm]"
echo " 2. Generate tokenizer files (if needed): python -m vllm_plugin.tools.generate_tokenizer_files -o /path/to/model"
echo " 3. Start vLLM server: vllm serve <model_path> --trust-remote-code --enforce-eager --no-enable-prefix-caching"