File size: 2,750 Bytes
05b5e18
 
 
 
 
529dc53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
05b5e18
529dc53
 
 
 
 
05b5e18
529dc53
 
 
 
 
05b5e18
529dc53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
05b5e18
529dc53
 
 
 
05b5e18
529dc53
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
import os

# Environment setup: point the Hugging Face cache at a writable directory.
# The assignment sits before the `transformers` import that follows, presumably
# so the library sees the value when it is imported — TODO confirm.
# NOTE(review): the path looks like a placeholder that has to be replaced with
# a real writable location before running.
os.environ['TRANSFORMERS_CACHE'] = '/path/to/writable/directory'

from transformers import pipeline
import speech_recognition as sr
from gtts import gTTS
import os
import io
from google.oauth2.credentials import Credentials
from googleapiclient.discovery import build
from googleapiclient.http import MediaIoBaseDownload

# Model and tokenizer initialisation.
# The checkpoint is a T5 (encoder-decoder) model, so it is served through the
# "text2text-generation" pipeline; the "text-generation" pipeline targets
# causal (decoder-only) language models and does not list T5 as supported.
# Each result of this pipeline is still a dict with a 'generated_text' key.
# NOTE(review): the model card describes task prefixes for this multitask
# checkpoint — confirm whether user input should be prefixed before generation.
model_name = "cointegrated/rut5-base-multitask"
chatbot = pipeline("text2text-generation", model=model_name)

# Speech recognition
def recognize_speech():
    """Record one phrase from the microphone and transcribe it as Russian.

    The captured audio is passed to ``recognize_google`` with
    ``language="ru-RU"``. Progress and error messages are printed to stdout.

    Returns:
        The recognised text, or an empty string when the speech could not be
        understood or the recognition request failed.
    """
    listener = sr.Recognizer()
    with sr.Microphone() as mic:
        print("Скажите что-нибудь...")
        captured = listener.listen(mic)

    try:
        transcript = listener.recognize_google(captured, language="ru-RU")
    except sr.UnknownValueError:
        # The recogniser could not make sense of the audio.
        print("Не удалось распознавать речь")
        return ""
    except sr.RequestError as err:
        # The recognition service itself could not be reached or failed.
        print(f"Ошибка сервиса распознавания речи; {err}")
        return ""

    print("Вы сказали: " + transcript)
    return transcript

# Speech synthesis
def synthesize_speech(text):
    """Speak *text* aloud in Russian.

    The text is rendered to ``response.mp3`` with gTTS and then played with
    the external ``mpg321`` player.

    Args:
        text: Text to speak. Empty or whitespace-only text is skipped, since
            there is nothing to synthesize.

    Returns:
        None.
    """
    # Function-scope import so this block does not depend on a file-level one.
    import subprocess

    if not text or not text.strip():
        return

    tts = gTTS(text=text, lang="ru")
    tts.save("response.mp3")
    try:
        # Argument list instead of a shell string: no shell is involved.
        # check=False keeps playback best-effort, as it was with os.system.
        subprocess.run(["mpg321", "response.mp3"], check=False)
    except FileNotFoundError:
        # The player is not installed; report it rather than crash the caller.
        print("Проигрыватель mpg321 не найден; ответ сохранён в response.mp3")

# Loading documents from Google Drive
def load_documents_from_drive():
    """Download every non-trashed PDF from Google Drive into the current directory.

    Credentials are read from ``token.json`` with the read-only Drive scope.
    Download progress is printed to stdout.

    Returns:
        The local file names that were written, in download order.
    """
    creds = Credentials.from_authorized_user_file(
        'token.json', ['https://www.googleapis.com/auth/drive.readonly']
    )
    service = build('drive', 'v3', credentials=creds)

    # files.list is paginated: follow nextPageToken so that files beyond the
    # first page are not silently dropped.
    items = []
    page_token = None
    while True:
        results = service.files().list(
            q="mimeType='application/pdf' and trashed=false",
            fields="nextPageToken, files(id, name)",
            pageToken=page_token,
        ).execute()
        items.extend(results.get('files', []))
        page_token = results.get('nextPageToken')
        if not page_token:
            break

    documents = []
    for item in items:
        file_id = item['id']
        # The Drive name is remote-supplied text; keep only its last path
        # component so the file always lands in the current directory.
        local_name = os.path.basename(item['name'])
        if local_name in ('', '.', '..'):
            local_name = f"{file_id}.pdf"
        # NOTE(review): two Drive files with the same name still overwrite
        # each other locally, as before.
        request = service.files().get_media(fileId=file_id)
        # `with` closes the handle even if a chunk download raises.
        with io.FileIO(local_name, 'wb') as fh:
            downloader = MediaIoBaseDownload(fh, request)
            done = False
            while not done:
                status, done = downloader.next_chunk()
                print(f"Скачивание файла {item['name']}... {int(status.progress() * 100)}% завершено")
        documents.append(local_name)
    return documents

# Main chatbot loop
def main():
    """Run the voice chat loop: listen, generate a reply, print it and speak it.

    The loop never terminates on its own. Iterations in which no speech was
    recognised (empty string) are skipped.
    """
    while True:
        user_input = recognize_speech()
        if not user_input:
            continue

        # `num_return_sequences` is the actual name of the generation option;
        # the earlier spelling `numreturn_sequences` was a typo.
        response = chatbot(user_input, max_length=100, num_return_sequences=1)[0]['generated_text']
        print("Чатбот: " + response)

        # Only speak when the model produced some text; an empty reply gives
        # the synthesizer nothing to say.
        if response.strip():
            synthesize_speech(response)


if __name__ == "__main__":
    main()