31 isVoice(isVoice), audioInterval(audioInterval) {}
35 <<
"isVoice:" << obj.
isVoice <<
", " 50 float speechLengthMs = 0.0f;
55 float backgroundLengthMs = 0.0f;
60 float totalLengthMs = 0.0f;
64 SpeechInfo(
float speechLengthMs,
float backgroundLengthMs,
float totalLengthMs) :
65 speechLengthMs(speechLengthMs),
66 backgroundLengthMs(backgroundLengthMs),
67 totalLengthMs(totalLengthMs)
104 speechEvents(speechEvents),
105 speechInfo(speechInfo)
109 os <<
"SpeechSummary[" 110 <<
"speechEvents.size():" << obj.
speechEvents.size() <<
", " 129 using Ptr = std::shared_ptr<SpeechSummaryStream>;
134 virtual void reset() = 0;
140 virtual void finalize() = 0;
146 virtual bool hasSpeechEvents()
const = 0;
166 virtual SpeechInfo getTotalSpeechInfo()
const = 0;
173 virtual float getCurrentBackgroundLength()
const = 0;
181 virtual void addSamples(
182 const uint8_t *bytes,
183 size_t bytesNum) = 0;
191 virtual void addSamples(
192 const int16_t *pcm16Samples,
193 size_t samplesNum) = 0;
201 virtual void addSamples(
202 const float *floatSamples,
203 size_t samplesNum) = 0;
220 using Ptr = std::shared_ptr<SpeechSummaryStreamOpus>;
235 virtual void reset() = 0;
241 virtual void finalize() = 0;
247 virtual bool hasSpeechEvents()
const = 0;
267 virtual SpeechInfo getTotalSpeechInfo()
const = 0;
274 virtual float getCurrentBackgroundLength()
const = 0;
283 virtual void addPacket(
284 const uint8_t* bytes,
285 size_t bytesNum) = 0;
301 using Ptr = std::shared_ptr<SpeechSummaryEngine>;
323 const uint8_t *bytes,
325 size_t sampleRate) = 0;
336 const int16_t *pcm16Samples,
338 size_t sampleRate) = 0;
349 const float *floatSamples,
351 size_t sampleRate) = 0;
360 const std::string& audioFile) = 0;
bool isVoice
Whether the interval contains speech or not.
Definition: speech_summary.h:21
std::shared_ptr< SpeechSummaryStream > Ptr
Definition: speech_summary.h:129
std::vector< SpeechEvent > speechEvents
Contains audio intervals marked as speech or non-speech.
Definition: speech_summary.h:94
SpeechInfo speechInfo
Contains speech statistics.
Definition: speech_summary.h:99
bool operator==(const SpeechSummary &other) const
Definition: speech_summary.h:115
SpeechInfo(float speechLengthMs, float backgroundLengthMs, float totalLengthMs)
Definition: speech_summary.h:64
Structure representing interval of audio data.
Definition: intervals.h:57
Definition: speech_summary.h:46
float totalLengthMs
Processed audio total length (totalLengthMs = speechLengthMs + backgroundLengthMs) in milliseconds...
Definition: speech_summary.h:60
Definition: intervals.h:8
friend std::ostream & operator<<(std::ostream &os, const SpeechInfo &obj)
Definition: speech_summary.h:70
SpeechSummary(const std::vector< SpeechEvent > &speechEvents, const SpeechInfo &speechInfo)
Definition: speech_summary.h:103
#define VOICE_SDK_API
Definition: config.h:21
float backgroundLengthMs
Non-speech signal length in milliseconds.
Definition: speech_summary.h:55
std::shared_ptr< SpeechSummaryEngine > Ptr
Definition: speech_summary.h:301
Definition: speech_summary.h:17
Speech summary engine class (interface), intended to calculate SpeechSummary with given audio samples...
Definition: speech_summary.h:298
SpeechEvent(bool isVoice, const AudioInterval &audioInterval)
Definition: speech_summary.h:30
bool operator==(const SpeechInfo &other) const
Definition: speech_summary.h:78
Class for online Opus audio stream processing (voice activity detection and speech statistics computation)...
Definition: speech_summary.h:217
friend std::ostream & operator<<(std::ostream &os, const SpeechEvent &obj)
Definition: speech_summary.h:33
bool operator==(const SpeechEvent &other) const
Definition: speech_summary.h:40
float speechLengthMs
Speech signal length in milliseconds.
Definition: speech_summary.h:50
AudioInterval audioInterval
Speech event audio interval.
Definition: speech_summary.h:26
Class for online audio stream processing (voice activity detection and speech statistics computation)...
Definition: speech_summary.h:126
std::shared_ptr< SpeechSummaryStreamOpus > Ptr
Definition: speech_summary.h:220
Structure containing speech statistics and audio intervals marked as speech or non-speech.
Definition: speech_summary.h:90
friend std::ostream & operator<<(std::ostream &os, const SpeechSummary &obj)
Definition: speech_summary.h:108