SpeechToTextConvertor/main.py at main · Klipar/SpeechToTextConvertor · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
from pydub import AudioSegment
import speech_recognition as sr
import sys
import os
import textwrap
from Easy.massage import *

def SetLanguage():
    """Show the banner and language menu, then return the chosen language code.

    The user picks a menu entry by number. Entries 1-3 map to a predefined
    language code; entry 4 prompts for a free-form code typed by the user.

    Returns:
        The language code string (for example ``'en-US'``), or whatever the
        user typed when entry 4 was selected.

    Raises:
        SystemExit: if the entered value is not one of the menu entries.
    """
    print (colors.VIOLET + """
.▄▄ ·       ▄• ▄▌ ▐ ▄ ·▄▄▄▄      ▄▄▄▄▄          ▄▄▄▄▄▄▄▄ .▐▄• ▄ ▄▄▄▄▄
▐█ ▀. ▪     █▪██▌•█▌▐███▪ ██     •██  ▪         •██  ▀▄.▀· █▌█▌▪•██
▄▀▀▀█▄ ▄█▀▄ █▌▐█▌▐█▐▐▌▐█· ▐█▌     ▐█.▪ ▄█▀▄      ▐█.▪▐▀▀▪▄ ·██·  ▐█.▪
▐█▄▪▐█▐█▌.▐▌▐█▄█▌██▐█▌██. ██      ▐█▌·▐█▌.▐▌     ▐█▌·▐█▄▄▌▪▐█·█▌ ▐█▌·
 ▀▀▀▀  ▀█▄▀▪ ▀▀▀ ▀▀ █▪▀▀▀▀▀•      ▀▀▀  ▀█▄▀▪     ▀▀▀  ▀▀▀ •▀▀ ▀▀ ▀▀▀
            ▄▄·        ▐ ▄  ▌ ▐·▄▄▄ .▄▄▄  ▄▄▄▄▄▄▄▄ .▄▄▄
            ▐█ ▌▪▪     •█▌▐█▪█·█▌▀▄.▀·▀▄ █·•██  ▀▄.▀·▀▄ █·
            ██ ▄▄ ▄█▀▄ ▐█▐▐▌▐█▐█•▐▀▀▪▄▐▀▀▄  ▐█.▪▐▀▀▪▄▐▀▀▄
            ▐███▌▐█▌.▐▌██▐█▌ ███ ▐█▄▄▌▐█•█▌ ▐█▌·▐█▄▄▌▐█•█▌
            ·▀▀▀  ▀█▄▀▪▀▀ █▪. ▀   ▀▀▀ .▀  ▀ ▀▀▀  ▀▀▀ .▀  ▀

"""+ colors.END)


    print(colors.GREEN + """
                    Availble Languages

                [1] English         [2] Ukrainian
                [3] Slovak          [4] Other
        """ + colors.END)
    templates = {
    '1': 'en-US',
    '2': 'uk-UA',
    '3': 'sk-SK',
    '4': 'Other',
    }

    # Surrounding whitespace is stripped so that e.g. "1 " is still accepted.
    number = input(colors.YELLOW + "[" + colors.END + "?" + colors.YELLOW + "]" + colors.END + "> ").strip()

    if number == "4":
        # "Other": the user supplies the language code directly.
        choice = input("Write the name of your language model, like (en-US or uk-UA): ")

    elif number in templates:
        # Membership test instead of int(): non-numeric input and values
        # such as "01" are rejected cleanly rather than raising
        # ValueError / KeyError.
        choice = templates[number]

    else:
        failed ("Choise if out of range  :(")
        # Must be *called*; a bare `sys.exit` is a no-op expression and
        # would fall through to use the unassigned `choice`.
        sys.exit(1)

    print(f"Loading {choice}....")
    return choice

def replace_nth_space_with_newline(text, n=10):
    """Break a string into lines by turning every n-th space into a newline.

    Spaces are counted from the start of ``text``; the n-th, 2n-th, 3n-th ...
    space is replaced by ``'\\n'`` and every other character is kept as is.
    """
    # Splitting on a single space yields one more chunk than there are
    # spaces, so separator number k sits right before chunks[k].
    chunks = text.split(' ')
    pieces = [chunks[0]]

    for space_index, chunk in enumerate(chunks[1:], start=1):
        separator = '\n' if space_index % n == 0 else ' '
        pieces.append(separator)
        pieces.append(chunk)

    return ''.join(pieces)

def format_text_without_punctuation(text, line_width=80, words_per_sentence=15):
    """Group unpunctuated text into pseudo-sentences separated by blank lines.

    The text is split on whitespace. Every ``words_per_sentence`` words are
    joined with single spaces, terminated with a full stop, wrapped to
    ``line_width`` columns and followed by an empty line. Any leftover words
    at the end form a final, shorter sentence.
    """
    def render(group):
        # One finished paragraph: "<words>." wrapped, plus a blank line.
        return textwrap.fill(' '.join(group) + '.', width=line_width) + "\n\n"

    paragraphs = []
    pending = []

    for position, token in enumerate(text.split(), start=1):
        pending.append(token)
        if position % words_per_sentence != 0:
            continue
        paragraphs.append(render(pending))
        pending = []

    # Flush the trailing words that did not fill a whole sentence.
    if pending:
        paragraphs.append(render(pending))

    return ''.join(paragraphs)


def main(language_model):
    """Transcribe an audio file to text and save it next to the input file.

    The input path is taken from ``sys.argv[1]`` or, when absent, asked for
    interactively. The audio is converted to WAV with pydub, read with
    ``speech_recognition`` and sent to ``recognize_google``. The user is then
    asked whether to insert line breaks, and the result is written to
    ``<input basename>.txt`` as UTF-8.

    Args:
        language_model: language code passed as ``language=`` to
            ``recognize_google`` (for example ``'en-US'``).

    Raises:
        SystemExit: if the file cannot be converted or read, or the
            recognizer cannot be created.
    """
    # Function-scope import: only this function needs it.
    import tempfile

    if len(sys.argv) < 2:
        file_path = input("Enter the input file: ")
    else:
        file_path = sys.argv[1]

    file_name, file_extension = os.path.splitext(file_path)
    file_extension = file_extension.lstrip('.')
    output_file_path = file_name + '.txt'

    # The intermediate WAV goes to a private temporary file. Writing it to
    # "<basename>.wav" and deleting it afterwards would overwrite and then
    # remove the user's own file whenever the input is already a .wav.
    wav_fd, wav_path = tempfile.mkstemp(suffix=".wav")
    os.close(wav_fd)

    try:
        try:
            inform (f"Working on file: {file_path}")
            audio = AudioSegment.from_file(file_path, format=file_extension)
            audio.export(wav_path, format="wav")

        except Exception as e:
            failed (f"File Error   :(\n {e}")
            # sys.exit must be called; a bare `sys.exit` does nothing and
            # execution would continue with undefined variables.
            sys.exit(1)

        try:
            recognizer = sr.Recognizer()

        except Exception as e:
            failed (f"Recognition error   :(\n {e}")
            sys.exit(1)

        try:
            with sr.AudioFile(wav_path) as source:
                audio = recognizer.record(source)

        except Exception as e:
            failed (f"File Error   :(\n {e}")
            sys.exit(1)

    finally:
        # Best-effort cleanup of the temporary WAV on every path, including
        # the SystemExit raised above.
        try:
            os.remove(wav_path)
        except OSError:
            pass

    try:
        # The recognition language can be changed via `language_model`.
        text = str(recognizer.recognize_google(audio, language=language_model))

    except sr.UnknownValueError:
        failed("Google Web Speech API can't recognised your file     :(")
        # Nothing was recognised, so nothing is written and no success
        # message is shown.
        return

    except sr.RequestError as e:
        failed(f"Failed to get results from their api                :({e}")
        return

    # NOTE(review): `en=""` presumably suppresses the trailing newline so the
    # answer is typed on the same line - confirm against Easy.massage.
    success ("The text is recognized, do you want to improve its readability? (Yes/No): ", en = "")
    answer = input().lower()

    if answer in ("yes", "y"):
        text = replace_nth_space_with_newline (text)
        success ("The readability of the text is improved!")

    else:
        inform("Text improvement omitted.")

    with open(output_file_path, 'w', encoding='utf-8') as file:
        file.write(text + "\n")

    # Reported only after the file has actually been written.
    success (f"Your content saved in file: {file_name}.txt")

# Script entry point: ask for the recognition language first, then run the
# transcription with the chosen language code.
if __name__ == "__main__":
    language_model = SetLanguage()
    main(language_model)