6#ifndef WHISPERSPEECHTRANSCRIPTION_H
7#define WHISPERSPEECHTRANSCRIPTION_H
// Boolean option, initialised to true.
// NOTE(review): presumably enables verbose output from the transcription backend — confirm in the implementation.
36 bool m_verbose =
true;
// Boolean option, initialised to true.
// NOTE(review): presumably suppresses non-speech symbols in the transcribed text — TODO confirm.
37 bool m_no_symbols =
true;
// Language setting stored as a string; initialised to "auto".
// NOTE(review): presumably the value exchanged through setLanguage()/getLanguage() — confirm.
38 std::string m_language=
"auto";
// Buffer of float samples.
// NOTE(review): looks like the mono PCM input buffer, by analogy with whisper.cpp naming — confirm.
40 std::vector<float> m_pcmf32;
// Buffer of float sample vectors.
// NOTE(review): presumably one inner vector per audio channel — confirm.
41 std::vector<std::vector<float>> m_pcmf32s;
// Close the DeviceDriver (override of the device-driver interface).
// Returns a bool; NOTE(review): presumably true on success — confirm in the implementation.
57 bool close()
override;
// Sets the language for speech transcription.
// `language` is the requested language, passed by const reference.
// Returns a bool; NOTE(review): presumably true on success — confirm.
60 virtual bool setLanguage(
const std::string& language)
override;
// Gets the current language set for speech transcription.
// `language` is an output parameter that receives the current language.
// Returns a bool; NOTE(review): presumably true on success — confirm.
61 virtual bool getLanguage(std::string& language)
override;
WhisperSpeechTranscription: A YARP device which performs audio-to-text transcription using OpenAI Whisper.
WhisperSpeechTranscription(const WhisperSpeechTranscription &)=delete
WhisperSpeechTranscription & operator=(const WhisperSpeechTranscription &)=delete
virtual ~WhisperSpeechTranscription()
virtual bool setLanguage(const std::string &language) override
Sets the language for speech transcription.
WhisperSpeechTranscription()
bool open(yarp::os::Searchable &config) override
Open the DeviceDriver.
bool close() override
Close the DeviceDriver.
WhisperSpeechTranscription & operator=(WhisperSpeechTranscription &&)=delete
virtual bool transcribe(const yarp::sig::Sound &sound, std::string &transcription, double &score) override
Performs the speech transcription.
WhisperSpeechTranscription(WhisperSpeechTranscription &&)=delete
virtual bool getLanguage(std::string &language) override
Gets the current language set for speech transcription.
Interface implemented by all device drivers.
A generic interface for speech transcription.
A mini-server for performing network communication in the background.
A base class for nested structures that can be searched.
Class for storing sounds. See "Audio in YARP" for additional documentation on YARP audio.
An interface to the operating system, including Port based communication.