File size: 1,898 Bytes
1d6b3e5
 
9845260
07cadae
 
 
8df9053
 
 
9845260
6fe217e
07cadae
6b035eb
239228e
 
 
8df9053
9845260
99330d0
239228e
 
 
 
 
1d6b3e5
 
 
 
 
 
 
 
 
654a25e
1d6b3e5
 
0fe8fdc
 
 
1d6b3e5
6b035eb
239228e
 
 
 
 
 
 
 
f465e5e
 
 
 
 
99330d0
 
1d6b3e5
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
import random 
import numpy as np 
from elevenlabs import voices, generate, set_api_key, UnauthenticatedRateLimitError, save
import huggingface_hub
from huggingface_hub import Repository
import os
from huggingface_hub import HfApi
import gradio as gr


DATASET_REPO_URL = "https://huggingface.co/datasets/laxsvips/audiofiles"
DATA_FILENAME = "audio.mp4"
DATA_FILE = os.path.join("data", DATA_FILENAME)
# DATASET_REPO_ID = "audiofiles/audio.mp4"


api = HfApi()

HF_TOKEN = os.environ.get("HF_TOKEN")
repo = Repository(
    local_dir="data",
    clone_from=DATASET_REPO_URL,
    use_auth_token=HF_TOKEN
)

def pad_buffer(audio):
    # Pad buffer to multiple of 2 bytes
    buffer_size = len(audio)
    element_size = np.dtype(np.int16).itemsize
    if buffer_size % element_size != 0:
        audio = audio + b'\0' * (element_size - (buffer_size % element_size))
    return audio 

def generate_voice(text):
    try:
        audio = generate(
            text, 
            voice="Arnold", 
            model="eleven_monolingual_v1"
        )
        save(audio,'data/audio.mp4')   
        save(audio,'audio.mp4') 
        commit_url = repo.push_to_hub()
        # commit_url = api.upload_file(
        #                 DATA_FILE,
        #                 path_in_repo=DATA_FILENAME,
        #                 repo_id=DATASET_REPO_ID,
        #                 repo_type="dataset"
        #             )
        # api.upload_file(
        #     folder_path="./data",
        #     repo_id=DATASET_REPO_ID,
        #     repo_type="dataset",
        # )
        return (commit_url)
        # return (44100, np.frombuffer(pad_buffer(audio), dtype=np.int16))
    except UnauthenticatedRateLimitError as e:
        raise gr.Error("Thanks for trying out ElevenLabs TTS! You've reached the free tier limit. Please provide an API key to continue.") 
    except Exception as e:
        raise gr.Error(e)