AutomaticSpeechRecognition.py 775 Bytes
Newer Older
1
2
3
4
import torch
from transformers import pipeline
# Run inference on the GPU when CUDA is available, otherwise on the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

Carl De Sousa Trias's avatar
Carl De Sousa Trias committed
5
class AutomaticSpeechRecognition:
    """Transcribe speech audio to text with the ``openai/whisper-base`` model.

    Usage: assign the audio to ``QuestionAudio``, call :meth:`run`, then read
    the transcription from ``QuestionText``.
    """

    # Audio to transcribe; handed unchanged to the speech-recognition pipeline.
    QuestionAudio = None
    # Transcription produced by run(); remains None until run() succeeds.
    QuestionText = None
    # Pipeline built on first use and reused afterwards, so the model is
    # loaded once per instance instead of once per call.
    _speech_reco = None

    def funcAutomaticSpeechRecognition(self, input):
        """Return the text recognised in ``input``.

        Args:
            input: Audio passed as-is to the "automatic-speech-recognition"
                pipeline.

        Returns:
            The ``"text"`` entry of the pipeline result.
        """
        if self._speech_reco is None:
            self._speech_reco = pipeline(
                "automatic-speech-recognition",
                model="openai/whisper-base",
                device=device,
            )
        res = self._speech_reco(input)
        return res["text"]

    def run(self):
        """Transcribe ``QuestionAudio`` and store the result in ``QuestionText``.

        Raises:
            ValueError: If ``QuestionAudio`` has not been set.
        """
        # Fail early with a clear message rather than loading the model and
        # handing it None.
        if self.QuestionAudio is None:
            raise ValueError("QuestionAudio must be set before calling run()")
        self.QuestionText = self.funcAutomaticSpeechRecognition(self.QuestionAudio)
22
23

if __name__ == "__main__":
    # Example run: transcribe one audio file and print the recognised text.
    asr = AutomaticSpeechRecognition()
    asr.QuestionAudio = "path/to/audiofile"
    asr.run()
    print(asr.QuestionText)