Skip to content
This repository was archived by the owner on May 6, 2022. It is now read-only.

Commit fc0797b

Browse files
authored
Addition of Noise Suppression and Gain Control to Profiles (#37)
1 parent 3281e5f commit fc0797b

File tree

2 files changed

+8
-0
lines changed

2 files changed

+8
-0
lines changed

spokestack/profile/vad_trigger_asr.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,10 @@
44
from typing import Any
55

66
from spokestack.activation_timeout import ActivationTimeout
7+
from spokestack.agc.webrtc import AutomaticGainControl
78
from spokestack.asr.spokestack.speech_recognizer import CloudSpeechRecognizer
89
from spokestack.io.pyaudio import PyAudioInput
10+
from spokestack.nsx.webrtc import AutomaticNoiseSuppression
911
from spokestack.pipeline import SpeechPipeline
1012
from spokestack.vad.webrtc import VoiceActivityDetector, VoiceActivityTrigger
1113

@@ -38,6 +40,8 @@ def create(
3840
sample_rate=sample_rate, frame_width=frame_width, **kwargs
3941
),
4042
stages=[
43+
AutomaticGainControl(sample_rate=sample_rate, frame_width=frame_width),
44+
AutomaticNoiseSuppression(sample_rate=sample_rate),
4145
VoiceActivityDetector(
4246
sample_rate=sample_rate, frame_width=frame_width, **kwargs
4347
),

spokestack/profile/wakeword_asr.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,10 @@
44
from typing import Any
55

66
from spokestack.activation_timeout import ActivationTimeout
7+
from spokestack.agc.webrtc import AutomaticGainControl
78
from spokestack.asr.spokestack.speech_recognizer import CloudSpeechRecognizer
89
from spokestack.io.pyaudio import PyAudioInput
10+
from spokestack.nsx.webrtc import AutomaticNoiseSuppression
911
from spokestack.pipeline import SpeechPipeline
1012
from spokestack.vad.webrtc import VoiceActivityDetector
1113
from spokestack.wakeword.tflite import WakewordTrigger
@@ -40,6 +42,8 @@ def create(
4042
frame_width=frame_width, sample_rate=sample_rate, **kwargs
4143
),
4244
stages=[
45+
AutomaticGainControl(sample_rate=sample_rate, frame_width=frame_width),
46+
AutomaticNoiseSuppression(sample_rate=sample_rate),
4347
VoiceActivityDetector(
4448
frame_width=frame_width,
4549
sample_rate=sample_rate,

0 commit comments

Comments
 (0)