few last imports
This commit is contained in:
parent
dfb249e13d
commit
a01e3b2fb8
2 changed files with 60 additions and 0 deletions
51
vocode/streaming/input_device/streaming/microphone_input.py
Normal file
51
vocode/streaming/input_device/streaming/microphone_input.py
Normal file
|
|
@ -0,0 +1,51 @@
|
|||
import sounddevice as sd
|
||||
import numpy as np
|
||||
from typing import Optional
|
||||
import queue
|
||||
import wave
|
||||
|
||||
from vocode.streaming.input_device.base_input_device import BaseInputDevice
|
||||
from vocode.streaming.models.audio_encoding import AudioEncoding
|
||||
|
||||
|
||||
class MicrophoneInput(BaseInputDevice):
|
||||
DEFAULT_SAMPLING_RATE = 44100
|
||||
DEFAULT_CHUNK_SIZE = 2048
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
device_info: dict,
|
||||
sampling_rate: int = None,
|
||||
chunk_size: int = DEFAULT_CHUNK_SIZE,
|
||||
microphone_gain: int = 1,
|
||||
):
|
||||
self.device_info = device_info
|
||||
sampling_rate = sampling_rate or (
|
||||
self.device_info.get("default_samplerate", self.DEFAULT_SAMPLING_RATE)
|
||||
)
|
||||
super().__init__(int(sampling_rate), AudioEncoding.LINEAR16, chunk_size)
|
||||
self.stream = sd.InputStream(
|
||||
dtype=np.int16,
|
||||
channels=1,
|
||||
samplerate=self.sampling_rate,
|
||||
blocksize=self.chunk_size,
|
||||
device=int(self.device_info["index"]),
|
||||
callback=self._stream_callback,
|
||||
)
|
||||
self.stream.start()
|
||||
self.queue = queue.Queue()
|
||||
self.microphone_gain = microphone_gain
|
||||
|
||||
def _stream_callback(self, in_data: np.ndarray[np.int16], *_args):
|
||||
if self.microphone_gain > 1:
|
||||
in_data = in_data * (2 ^ self.microphone_gain)
|
||||
else:
|
||||
in_data = in_data // (2 ^ self.microphone_gain)
|
||||
audio_bytes = in_data.tobytes()
|
||||
self.queue.put_nowait(audio_bytes)
|
||||
|
||||
def get_audio(self) -> Optional[bytes]:
|
||||
try:
|
||||
return self.queue.get_nowait()
|
||||
except queue.Empty:
|
||||
return None
|
||||
|
|
@ -0,0 +1,9 @@
|
|||
from vocode.streaming.input_device.base_input_device import BaseInputDevice
|
||||
from vocode.streaming.models.audio_encoding import AudioEncoding
|
||||
|
||||
|
||||
class TelephoneInput(BaseInputDevice):
|
||||
def __init__(self):
|
||||
super().__init__(
|
||||
sampling_rate=8000, audio_encoding=AudioEncoding.MULAW, chunk_size=160
|
||||
)
|
||||
Loading…
Add table
Add a link
Reference in a new issue