Class for online audio stream processing (voice activity detection and speech statistics computation)
More...
#include <voicesdk/media/speech_summary.h>
|
|
virtual void | reset ()=0 |
| | Resets stream state: clears buffer, resets speech summary.
|
| |
|
virtual void | finalize ()=0 |
| | Finalizes the input audio stream: processes the remaining audio samples and produces a result if possible.
|
| |
| virtual bool | hasSpeechEvents () const =0 |
| | Checks whether any speech events are available in the output queue. More...
|
| |
| virtual SpeechEvent | getSpeechEvent ()=0 |
| | Retrieves a single speech event from the output FIFO queue. Use hasSpeechEvents() to check whether a speech event is available. More...
|
| |
| virtual SpeechSummary | getTotalSpeechSummary () const =0 |
| | Retrieves total accumulated speech summary. More...
|
| |
| virtual SpeechInfo | getTotalSpeechInfo () const =0 |
| | Retrieves total accumulated speech info. More...
|
| |
| virtual float | getCurrentBackgroundLength () const =0 |
| | Retrieves the current background length (the length of the continuous non-speech segment starting at the last detected speech frame). More...
|
| |
| virtual void | addSamples (const uint8_t *bytes, size_t bytesNum)=0 |
| | Adds PCM16 audio samples, passed as a raw byte array, to process. More...
|
| |
| virtual void | addSamples (const int16_t *pcm16Samples, size_t samplesNum)=0 |
| | Adds PCM16 audio samples to process. More...
|
| |
| virtual void | addSamples (const float *floatSamples, size_t samplesNum)=0 |
| | Adds float audio samples (in [-1; 1] range) to process. More...
|
| |
|
virtual bool | compare (const SpeechSummaryStream::Ptr &other) const =0 |
| | Checks whether the resulting states of this stream and another stream are equal.
|
| |
Class for online audio stream processing (voice activity detection and speech statistics computation)
- See also
- SpeechSummaryEngine to create a SpeechSummaryStream instance
◆ addSamples() [1/3]
| virtual void voicesdk::SpeechSummaryStream::addSamples |
( |
const float * |
floatSamples, |
|
|
size_t |
samplesNum |
|
) |
| |
|
pure virtual |
Adds float audio samples (in [-1; 1] range) to process.
- Parameters
-
| floatSamples | pointer to the array of float samples |
| samplesNum | number of samples in the array |
- Exceptions
-
| std::runtime_error | if a runtime error occurs |
◆ addSamples() [2/3]
| virtual void voicesdk::SpeechSummaryStream::addSamples |
( |
const int16_t * |
pcm16Samples, |
|
|
size_t |
samplesNum |
|
) |
| |
|
pure virtual |
Adds PCM16 audio samples to process.
- Parameters
-
| pcm16Samples | pointer to the array of PCM16 samples |
| samplesNum | number of samples in the array |
- Exceptions
-
| std::runtime_error | if a runtime error occurs |
◆ addSamples() [3/3]
| virtual void voicesdk::SpeechSummaryStream::addSamples |
( |
const uint8_t * |
bytes, |
|
|
size_t |
bytesNum |
|
) |
| |
|
pure virtual |
Adds PCM16 audio samples, passed as a raw byte array, to process.
- Parameters
-
| bytes | pointer to the byte array containing the PCM16 samples |
| bytesNum | size of the array in bytes |
- Exceptions
-
| std::runtime_error | if a runtime error occurs |
◆ getCurrentBackgroundLength()
| virtual float voicesdk::SpeechSummaryStream::getCurrentBackgroundLength |
( |
| ) |
const |
|
pure virtual |
Retrieves the current background length (the length of the continuous non-speech segment starting at the last detected speech frame).
- Returns
- current background length in milliseconds
◆ getSpeechEvent()
| virtual SpeechEvent voicesdk::SpeechSummaryStream::getSpeechEvent |
( |
| ) |
|
|
pure virtual |
Retrieves a single speech event from the output FIFO queue. Use hasSpeechEvents() to check whether a speech event is available.
- Returns
- A single speech event
- Exceptions
-
| std::runtime_error | if a runtime error occurs |
◆ getTotalSpeechInfo()
| virtual SpeechInfo voicesdk::SpeechSummaryStream::getTotalSpeechInfo |
( |
| ) |
const |
|
pure virtual |
Retrieves total accumulated speech info.
- Returns
- speech info
◆ getTotalSpeechSummary()
| virtual SpeechSummary voicesdk::SpeechSummaryStream::getTotalSpeechSummary |
( |
| ) |
const |
|
pure virtual |
Retrieves total accumulated speech summary.
- Returns
- speech summary
◆ hasSpeechEvents()
| virtual bool voicesdk::SpeechSummaryStream::hasSpeechEvents |
( |
| ) |
const |
|
pure virtual |
Checks whether any speech events are available in the output queue.
- Returns
- true if a speech event is available, false otherwise