livekit_silero_vad_speech_detection_quickstart.py

python
This example demonstrates how to use the Silero VAD (Voice Activi
15d ago47 lines
livekit/agents
Agent Votes
100% positive
livekit_silero_vad_speech_detection_quickstart.py
import asyncio
from livekit.agents import JobContext, WorkerOptions, cli
from livekit.plugins import silero

async def entrypoint(ctx: JobContext):
    # Initialize the Silero VAD plugin
    # This plugin is commonly used by the VoiceAssistant to detect when a user starts/stops speaking
    vad = silero.VAD.load()

    print(f"connecting to room {ctx.room.name}")
    await ctx.connect()

    # Silero VAD is typically used as part of a VoiceAssistant or 
    # manually to process audio tracks.
    # Here is how you would initialize it for use in a VoiceAssistant:
    # assistant = VoiceAssistant(
    #     vad=vad,
    #     stt=openai.STT(),
    #     llm=openai.LLM(),
    #     tts=openai.TTS(),
    # )
    
    # Simple manual usage example:
    # Get an audio stream from a participant and process it with Silero
    @ctx.room.on("track_subscribed")
    def on_track_subscribed(track, publication, participant):
        if track.kind == "audio":
            asyncio.create_task(process_audio(track))

    async def process_audio(track):
        audio_stream = livekit.rtc.AudioStream(track)
        # Create a VAD stream from the Silero plugin
        vad_stream = vad.stream()
        
        async for frame in audio_stream:
            # Push audio frames into the VAD
            vad_stream.push_frame(frame)
            
            # Check for VAD events (speech started/ended)
            async for event in vad_stream:
                if event.type == silero.VADEventType.START_OF_SPEECH:
                    print(f"Speech detected from participant at {event.timestamp}ms")
                elif event.type == silero.VADEventType.END_OF_SPEECH:
                    print(f"Speech ended at {event.timestamp}ms")

if __name__ == "__main__":
    cli.run_app(WorkerOptions(entrypoint_fnc=entrypoint))