Skip to content

Commit fc0797b

Browse files
authored
Addition of Noise Suppression and Gain Control to Profiles (spokestack#37)
1 parent 3281e5f commit fc0797b

2 files changed

Lines changed: 8 additions & 0 deletions

File tree

spokestack/profile/vad_trigger_asr.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,10 @@
44
from typing import Any
55

66
from spokestack.activation_timeout import ActivationTimeout
7+
from spokestack.agc.webrtc import AutomaticGainControl
78
from spokestack.asr.spokestack.speech_recognizer import CloudSpeechRecognizer
89
from spokestack.io.pyaudio import PyAudioInput
10+
from spokestack.nsx.webrtc import AutomaticNoiseSuppression
911
from spokestack.pipeline import SpeechPipeline
1012
from spokestack.vad.webrtc import VoiceActivityDetector, VoiceActivityTrigger
1113

@@ -38,6 +40,8 @@ def create(
3840
sample_rate=sample_rate, frame_width=frame_width, **kwargs
3941
),
4042
stages=[
43+
AutomaticGainControl(sample_rate=sample_rate, frame_width=frame_width),
44+
AutomaticNoiseSuppression(sample_rate=sample_rate),
4145
VoiceActivityDetector(
4246
sample_rate=sample_rate, frame_width=frame_width, **kwargs
4347
),

spokestack/profile/wakeword_asr.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,10 @@
44
from typing import Any
55

66
from spokestack.activation_timeout import ActivationTimeout
7+
from spokestack.agc.webrtc import AutomaticGainControl
78
from spokestack.asr.spokestack.speech_recognizer import CloudSpeechRecognizer
89
from spokestack.io.pyaudio import PyAudioInput
10+
from spokestack.nsx.webrtc import AutomaticNoiseSuppression
911
from spokestack.pipeline import SpeechPipeline
1012
from spokestack.vad.webrtc import VoiceActivityDetector
1113
from spokestack.wakeword.tflite import WakewordTrigger
@@ -40,6 +42,8 @@ def create(
4042
frame_width=frame_width, sample_rate=sample_rate, **kwargs
4143
),
4244
stages=[
45+
AutomaticGainControl(sample_rate=sample_rate, frame_width=frame_width),
46+
AutomaticNoiseSuppression(sample_rate=sample_rate),
4347
VoiceActivityDetector(
4448
frame_width=frame_width,
4549
sample_rate=sample_rate,

0 commit comments

Comments
 (0)