From af41acd1d5db1f345c7ac616b144d4ee0eba911d Mon Sep 17 00:00:00 2001 From: Fangjun Kuang Date: Sat, 30 Mar 2024 11:01:30 +0800 Subject: [PATCH] update for vad and speaker identification --- sherpa_onnx/sherpa_onnx_linux.go | 34 ++++++++++++++++++++++++++++++ sherpa_onnx/sherpa_onnx_macos.go | 34 ++++++++++++++++++++++++++++++ sherpa_onnx/sherpa_onnx_windows.go | 34 ++++++++++++++++++++++++++++++ 3 files changed, 102 insertions(+) diff --git a/sherpa_onnx/sherpa_onnx_linux.go b/sherpa_onnx/sherpa_onnx_linux.go index 627a92e..fb4864d 100644 --- a/sherpa_onnx/sherpa_onnx_linux.go +++ b/sherpa_onnx/sherpa_onnx_linux.go @@ -42,7 +42,41 @@ type OfflineTtsVitsModelConfig = sherpa.OfflineTtsVitsModelConfig type OfflineTtsModelConfig = sherpa.OfflineTtsModelConfig type OfflineTtsConfig = sherpa.OfflineTtsConfig type GeneratedAudio = sherpa.GeneratedAudio +type Wave = sherpa.Wave type OfflineTts = sherpa.OfflineTts var DeleteOfflineTts = sherpa.DeleteOfflineTts var NewOfflineTts = sherpa.NewOfflineTts + +type SileroVadModelConfig = sherpa.SileroVadModelConfig +type VadModelConfig = sherpa.VadModelConfig +type CircularBuffer = sherpa.CircularBuffer + +var DeleteCircularBuffer = sherpa.DeleteCircularBuffer +var NewCircularBuffer = sherpa.NewCircularBuffer + +type SpeechSegment = sherpa.SpeechSegment +type VoiceActivityDetector = sherpa.VoiceActivityDetector + +var NewVoiceActivityDetector = sherpa.NewVoiceActivityDetector +var DeleteVoiceActivityDetector = sherpa.DeleteVoiceActivityDetector + +type SpokenLanguageIdentificationWhisperConfig = sherpa.SpokenLanguageIdentificationWhisperConfig +type SpokenLanguageIdentificationConfig = sherpa.SpokenLanguageIdentificationConfig +type SpokenLanguageIdentification = sherpa.SpokenLanguageIdentification +type SpokenLanguageIdentificationResult = sherpa.SpokenLanguageIdentificationResult + +var NewSpokenLanguageIdentification = sherpa.NewSpokenLanguageIdentification +var DeleteSpokenLanguageIdentification = 
sherpa.DeleteSpokenLanguageIdentification + +type SpeakerEmbeddingExtractorConfig = sherpa.SpeakerEmbeddingExtractorConfig +type SpeakerEmbeddingExtractor = sherpa.SpeakerEmbeddingExtractor + +var NewSpeakerEmbeddingExtractor = sherpa.NewSpeakerEmbeddingExtractor +var DeleteSpeakerEmbeddingExtractor = sherpa.DeleteSpeakerEmbeddingExtractor + +type SpeakerEmbeddingManager = sherpa.SpeakerEmbeddingManager + +var NewSpeakerEmbeddingManager = sherpa.NewSpeakerEmbeddingManager +var DeleteSpeakerEmbeddingManager = sherpa.DeleteSpeakerEmbeddingManager +var ReadWave = sherpa.ReadWave diff --git a/sherpa_onnx/sherpa_onnx_macos.go b/sherpa_onnx/sherpa_onnx_macos.go index ff009b4..7e410d5 100644 --- a/sherpa_onnx/sherpa_onnx_macos.go +++ b/sherpa_onnx/sherpa_onnx_macos.go @@ -42,7 +42,41 @@ type OfflineTtsVitsModelConfig = sherpa.OfflineTtsVitsModelConfig type OfflineTtsModelConfig = sherpa.OfflineTtsModelConfig type OfflineTtsConfig = sherpa.OfflineTtsConfig type GeneratedAudio = sherpa.GeneratedAudio +type Wave = sherpa.Wave type OfflineTts = sherpa.OfflineTts var DeleteOfflineTts = sherpa.DeleteOfflineTts var NewOfflineTts = sherpa.NewOfflineTts + +type SileroVadModelConfig = sherpa.SileroVadModelConfig +type VadModelConfig = sherpa.VadModelConfig +type CircularBuffer = sherpa.CircularBuffer + +var DeleteCircularBuffer = sherpa.DeleteCircularBuffer +var NewCircularBuffer = sherpa.NewCircularBuffer + +type SpeechSegment = sherpa.SpeechSegment +type VoiceActivityDetector = sherpa.VoiceActivityDetector + +var NewVoiceActivityDetector = sherpa.NewVoiceActivityDetector +var DeleteVoiceActivityDetector = sherpa.DeleteVoiceActivityDetector + +type SpokenLanguageIdentificationWhisperConfig = sherpa.SpokenLanguageIdentificationWhisperConfig +type SpokenLanguageIdentificationConfig = sherpa.SpokenLanguageIdentificationConfig +type SpokenLanguageIdentification = sherpa.SpokenLanguageIdentification +type SpokenLanguageIdentificationResult = sherpa.SpokenLanguageIdentificationResult + 
+var NewSpokenLanguageIdentification = sherpa.NewSpokenLanguageIdentification +var DeleteSpokenLanguageIdentification = sherpa.DeleteSpokenLanguageIdentification + +type SpeakerEmbeddingExtractorConfig = sherpa.SpeakerEmbeddingExtractorConfig +type SpeakerEmbeddingExtractor = sherpa.SpeakerEmbeddingExtractor + +var NewSpeakerEmbeddingExtractor = sherpa.NewSpeakerEmbeddingExtractor +var DeleteSpeakerEmbeddingExtractor = sherpa.DeleteSpeakerEmbeddingExtractor + +type SpeakerEmbeddingManager = sherpa.SpeakerEmbeddingManager + +var NewSpeakerEmbeddingManager = sherpa.NewSpeakerEmbeddingManager +var DeleteSpeakerEmbeddingManager = sherpa.DeleteSpeakerEmbeddingManager +var ReadWave = sherpa.ReadWave diff --git a/sherpa_onnx/sherpa_onnx_windows.go b/sherpa_onnx/sherpa_onnx_windows.go index 3cc9399..57d2ff8 100644 --- a/sherpa_onnx/sherpa_onnx_windows.go +++ b/sherpa_onnx/sherpa_onnx_windows.go @@ -42,7 +42,41 @@ type OfflineTtsVitsModelConfig = sherpa.OfflineTtsVitsModelConfig type OfflineTtsModelConfig = sherpa.OfflineTtsModelConfig type OfflineTtsConfig = sherpa.OfflineTtsConfig type GeneratedAudio = sherpa.GeneratedAudio +type Wave = sherpa.Wave type OfflineTts = sherpa.OfflineTts var DeleteOfflineTts = sherpa.DeleteOfflineTts var NewOfflineTts = sherpa.NewOfflineTts + +type SileroVadModelConfig = sherpa.SileroVadModelConfig +type VadModelConfig = sherpa.VadModelConfig +type CircularBuffer = sherpa.CircularBuffer + +var DeleteCircularBuffer = sherpa.DeleteCircularBuffer +var NewCircularBuffer = sherpa.NewCircularBuffer + +type SpeechSegment = sherpa.SpeechSegment +type VoiceActivityDetector = sherpa.VoiceActivityDetector + +var NewVoiceActivityDetector = sherpa.NewVoiceActivityDetector +var DeleteVoiceActivityDetector = sherpa.DeleteVoiceActivityDetector + +type SpokenLanguageIdentificationWhisperConfig = sherpa.SpokenLanguageIdentificationWhisperConfig +type SpokenLanguageIdentificationConfig = sherpa.SpokenLanguageIdentificationConfig +type 
SpokenLanguageIdentification = sherpa.SpokenLanguageIdentification +type SpokenLanguageIdentificationResult = sherpa.SpokenLanguageIdentificationResult + +var NewSpokenLanguageIdentification = sherpa.NewSpokenLanguageIdentification +var DeleteSpokenLanguageIdentification = sherpa.DeleteSpokenLanguageIdentification + +type SpeakerEmbeddingExtractorConfig = sherpa.SpeakerEmbeddingExtractorConfig +type SpeakerEmbeddingExtractor = sherpa.SpeakerEmbeddingExtractor + +var NewSpeakerEmbeddingExtractor = sherpa.NewSpeakerEmbeddingExtractor +var DeleteSpeakerEmbeddingExtractor = sherpa.DeleteSpeakerEmbeddingExtractor + +type SpeakerEmbeddingManager = sherpa.SpeakerEmbeddingManager + +var NewSpeakerEmbeddingManager = sherpa.NewSpeakerEmbeddingManager +var DeleteSpeakerEmbeddingManager = sherpa.DeleteSpeakerEmbeddingManager +var ReadWave = sherpa.ReadWave