Go to the documentation of this file.
   35                << 
"isVoice:" << obj.
isVoice << 
", " 
  109             os << 
"SpeechSummary[" 
  110                << 
"speechEvents.size():" << obj.
speechEvents.size() << 
", " 
  129         using Ptr = std::shared_ptr<SpeechSummaryStream>;
 
  134         virtual void reset() = 0;
 
  140         virtual void finalize() = 0;
 
  146         virtual bool hasSpeechEvents() 
const = 0;
 
  166         virtual SpeechInfo getTotalSpeechInfo() 
const = 0;
 
  173         virtual float getCurrentBackgroundLength() 
const = 0;
 
  181         virtual void addSamples(
 
  182             const uint8_t *bytes,
 
  183             size_t bytesNum) = 0;
 
  191         virtual void addSamples(
 
  192             const int16_t *pcm16Samples,
 
  193             size_t samplesNum) = 0;
 
  201         virtual void addSamples(
 
  202             const float *floatSamples,
 
  203             size_t samplesNum) = 0;
 
  220         using Ptr = std::shared_ptr<SpeechSummaryStreamOpus>;
 
  235         virtual void reset() = 0;
 
  241         virtual void finalize() = 0;
 
  247         virtual bool hasSpeechEvents() 
const = 0;
 
  267         virtual SpeechInfo getTotalSpeechInfo() 
const = 0;
 
  274         virtual float getCurrentBackgroundLength() 
const = 0;
 
  283         virtual void addPacket(
 
  284                 const uint8_t* bytes,
 
  285                 size_t bytesNum) = 0;
 
  301         using Ptr = std::shared_ptr<SpeechSummaryEngine>;
 
  323             const uint8_t *bytes,
 
  325             size_t sampleRate) = 0;
 
  336             const int16_t *pcm16Samples,
 
  338             size_t sampleRate) = 0;
 
  349             const float *floatSamples,
 
  351             size_t sampleRate) = 0;
 
  360             const std::string& audioFile) = 0;
 
  
Class for online audio stream processing (voice activity detection and speech statistics computation)
Definition: speech_summary.h:126
 
std::shared_ptr< SpeechSummaryStream > Ptr
Definition: speech_summary.h:129
 
bool isVoice
Whether the interval contains speech or not.
Definition: speech_summary.h:21
 
AudioInterval audioInterval
Speech event audio interval.
Definition: speech_summary.h:26
 
std::shared_ptr< SpeechSummaryEngine > Ptr
Definition: speech_summary.h:301
 
SpeechInfo(float speechLengthMs, float backgroundLengthMs, float totalLengthMs)
Definition: speech_summary.h:64
 
Speech summary engine class (interface), intended to calculate SpeechSummary with given audio samples...
Definition: speech_summary.h:298
 
friend std::ostream & operator<<(std::ostream &os, const SpeechInfo &obj)
Definition: speech_summary.h:70
 
#define VOICE_SDK_API
Definition: config.h:21
 
Definition: speech_summary.h:17
 
friend std::ostream & operator<<(std::ostream &os, const SpeechEvent &obj)
Definition: speech_summary.h:33
 
Structure containing speech statistics and audio intervals marked as speech or non-speech.
Definition: speech_summary.h:90
 
SpeechSummary(const std::vector< SpeechEvent > &speechEvents, const SpeechInfo &speechInfo)
Definition: speech_summary.h:103
 
friend std::ostream & operator<<(std::ostream &os, const SpeechSummary &obj)
Definition: speech_summary.h:108
 
float totalLengthMs
Total length of the processed audio in milliseconds (totalLengthMs = speechLengthMs + backgroundLengthMs).
Definition: speech_summary.h:60
 
bool operator==(const SpeechSummary &other) const
Definition: speech_summary.h:115
 
float backgroundLengthMs
Non-speech signal length in milliseconds.
Definition: speech_summary.h:55
 
bool operator==(const SpeechEvent &other) const
Definition: speech_summary.h:40
 
bool operator==(const SpeechInfo &other) const
Definition: speech_summary.h:78
 
Structure representing interval of audio data.
Definition: intervals.h:57
 
float speechLengthMs
Speech signal length in milliseconds.
Definition: speech_summary.h:50
 
Definition: speech_summary.h:46
 
Definition: intervals.h:8
 
SpeechEvent(bool isVoice, const AudioInterval &audioInterval)
Definition: speech_summary.h:30
 
std::shared_ptr< SpeechSummaryStreamOpus > Ptr
Definition: speech_summary.h:220
 
SpeechInfo speechInfo
Contains speech statistics.
Definition: speech_summary.h:99
 
std::vector< SpeechEvent > speechEvents
Contains audio intervals marked as speech or non-speech.
Definition: speech_summary.h:94
 
Class for online Opus audio stream processing (voice activity detection and speech statistics computation)
Definition: speech_summary.h:217