main_oo.py

import whisper
from deep_translator import GoogleTranslator
import pyttsx3
from langdetect import detect, DetectorFactory
import arabic_reshaper
import bidi.algorithm
import pyaudio
import wave
import tempfile
import os

class RT_Translator:
    def __init__(self):
        self.model = whisper.load_model("base")
        DetectorFactory.seed = 0

    def record_audio(self, record_seconds=5):
        p = pyaudio.PyAudio()
        stream = p.open(format=pyaudio.paInt16, channels=1, rate=44100, input=True, frames_per_buffer=1024)
        frames = []
        print("Record started")
        try:
            for _ in range(0, int(44100 / 1024 * record_seconds)):
                data = stream.read(1024)
                frames.append(data)
        except KeyboardInterrupt:
            pass
        print("Record stopped")
        stream.stop_stream()
        stream.close()
        p.terminate()
        
        # Save the recorded audio to a temporary file
        temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
        wf = wave.open(temp_file.name, 'wb')
        wf.setnchannels(1)
        wf.setsampwidth(p.get_sample_size(pyaudio.paInt16))
        wf.setframerate(44100)
        wf.writeframes(b''.join(frames))
        wf.close()

        return temp_file.name

    def transcribe_audio(self, file_path):
        try:
            result = self.model.transcribe(file_path)
            return result["text"]
        except Exception as e:
            print(f"Error in transcription: {e}")
            return 'An error occured in transcription'

    def translate_text(self, text, target_language="en"):
        try:
            # If the target language is the same as the original language, no need to translate
            if detect(text) == target_language:
                return text
            else:
                translator = GoogleTranslator(source='auto', target=target_language)
                return translator.translate(text)
        except Exception as e:
            print(f"Error in translation: {e}")
            return text

    def text_to_speech(self, text, lang='en'):
        try:
            engine = pyttsx3.init()
            voices = engine.getProperty('voices')

            # Manual mapping of voice names to languages
            voice_map = {
                'en': 'english',
                'fr': 'french',
                'ru': 'russian',
                'uk': 'russian',
                'de': 'german',
                'ar': 'arabic'
            }

            lang = voice_map.get(lang)
            for voice in voices:
                if lang in voice.name.lower():
                    engine.setProperty('voice', voice.id)
                    selected_voice = voice.name
                    break
            else:
                # If no matching voice is found, fall back to the first voice (default)
                print("No matching voice found, using default voice.")
                engine.setProperty('voice', voices[0].id)
                selected_voice = voices[0].name

            print(f"*Using voice: {selected_voice}")
            engine.say(text)
            engine.runAndWait()
        except Exception as e:
            print(f"Error in text to speech: {e}")

    def delete_temp_file(self, file_path):
        try:
            os.remove(file_path)
            print(f"Temporary file {file_path} deleted successfully.")
        except Exception as e:
            print(f"Error deleting temporary file {file_path}: {e}")

    def speech_to_speech(self, path):
        # Choose the target language
        lang = ('fr', 'en', 'ru', 'de', 'ar')
        while True:
            try:
                choice = int(input("Choose a language to translate the speech: \n1. French \n2. English \n3. Russian \n4. German \n5. Arabic \n"))
                if 0 < choice <= len(lang):
                    target_lang = lang[choice - 1]
                    break
                else:
                    print("Invalid number! Please choose between 1 and 5.\n")
            except ValueError:
                print("Invalid input! Please choose a number (1, 2, 3, 4 or 5).\n")

        # Transcribe audio
        transcribed_text = self.transcribe_audio(path)
        if detect(transcribed_text) == 'ar':
            transcribed_text_ar = arabic_reshaper.reshape(transcribed_text)
            transcribed_text_ar = bidi.algorithm.get_display(transcribed_text_ar)
            print(f"Transcribed Text: \n\n{transcribed_text_ar}\n")
        else:
            print(f"Transcribed Text: \n\n{transcribed_text}\n")

        # Play the transcribed text
        self.text_to_speech(transcribed_text, lang=detect(transcribed_text))
        print("**Transcribed text played.")

        # Translate text
        translated_text = self.translate_text(transcribed_text, target_language=target_lang)
        if target_lang == 'ar':
            translated_text_ar = arabic_reshaper.reshape(translated_text)
            translated_text_ar = bidi.algorithm.get_display(translated_text_ar)
            print(f"-----------------------\nTranslated Text: \n\n{translated_text_ar}\n")
        else:
            print(f"-----------------------\nTranslated Text: \n\n{translated_text}\n")

        # Convert translated text to speech and play it
        self.text_to_speech(translated_text, lang=target_lang)
        print("**Translated text played.")

def main():
    translator = RT_Translator()
    while True:
        try:
            x = int(input('Choose an option: \n1. Translate an audio file \n2. Record an audio to translate \n'))
            if 0 < x <= 2:
                break
            else:
                print('Invalid number! Please choose between 1 or 2.')
        except ValueError:
            print('Invalid input! Please enter a number (1 or 2)')

    if x == 1:
        path = input('Provide the path to the audio file: \n')
    else:
        while True:
            try:
                y = int(input('How many seconds will the program record? : \n'))
                break
            except ValueError:
                print('Invalid input! Please enter a valid number of seconds.')
        path = translator.record_audio(record_seconds=y)

    translator.speech_to_speech(path)
    if x == 2:
        translator.delete_temp_file(path)

if __name__ == "__main__":
    try:
        main()
    except Exception as e:
        print("An error occurred:", e)