// (Web-page scrape residue, not part of the script: "Spaces: Running Running")
// Page elements used by this script, looked up once by their element IDs.
const generateBtn = document.getElementById('generateBtn');
const hint = document.getElementById('hint');
const speakerIdLabel = document.getElementById('speakerIdLabel');
const speakerIdInput = document.getElementById('speakerId');
const speedInput = document.getElementById('speed');
const speedValue = document.getElementById('speedValue');
const textArea = document.getElementById('text');
const soundClips = document.getElementById('sound-clips');

// Show the initial speed next to the speed input. The value is plain text,
// so it is assigned via textContent rather than parsed as HTML.
speedValue.textContent = speedInput.value;

// Running counter used as a prefix for the names of generated clips.
let index = 0;
// TTS engine instance; assigned in Module.onRuntimeInitialized.
let tts = null;
// AudioContext used for playback; created lazily on the first generation.
let audioCtx = null;
// Assigned without a declaration on purpose, so that `Module` becomes a
// property of the global object.
// NOTE(review): presumably consumed by a separately loaded runtime script;
// this assignment throws in strict mode / ES modules -- confirm how this file
// is loaded before changing it.
Module = {};

/**
 * Callback invoked through `Module.onRuntimeInitialized`.
 *
 * Creates the TTS engine, shows the valid speaker-ID range when the model has
 * more than one speaker, updates the hint text and enables the Generate
 * button.
 */
Module.onRuntimeInitialized = function() {
  console.log('Model files downloaded!');

  console.log('Initializing tts ......');
  tts = createOfflineTts(Module);

  if (tts.numSpeakers > 1) {
    speakerIdLabel.textContent = `Speaker ID (0 - ${tts.numSpeakers - 1}):`;
  }

  hint.innerText =
      'Initialized! Please enter text and click the Generate button.';

  generateBtn.disabled = false;
};
// Keep the displayed speed in sync with the speed input while it changes.
// `this` is the input element the handler is attached to.
speedInput.oninput = function() {
  speedValue.textContent = this.value;
};
/**
 * Click handler of the Generate button.
 *
 * Validates the speaker ID and the text, runs the TTS engine, plays the
 * result through the Web Audio API and appends a clip entry to the page via
 * createAudioTag(). Invalid input is reported with alert() and aborts the
 * handler.
 */
generateBtn.onclick = function() {
  // Trim once so that surrounding whitespace does not make an otherwise valid
  // ID fail the digits-only check below.
  const speakerIdText = speakerIdInput.value.trim();
  if (speakerIdText.length === 0) {
    alert('Please input a speakerId');
    return;
  }

  const maxSpeakerId = tts.numSpeakers - 1;

  if (!/^\d+$/.test(speakerIdText)) {
    alert(`Input speakerID ${
        speakerIdText} is not a number.\nPlease enter a number between 0 and ${
        maxSpeakerId}`);
    return;
  }

  // The digits-only check above already rules out negative values.
  const speakerId = Number.parseInt(speakerIdText, 10);
  if (speakerId > maxSpeakerId) {
    alert(`Please enter a number between 0 and ${maxSpeakerId}`);
    return;
  }

  const text = textArea.value.trim();
  if (text.length === 0) {
    alert('Please input a non-blank text');
    return;
  }

  // Input values are strings; hand the engine a real number.
  const speed = Number.parseFloat(speedInput.value);

  console.log('speakerId', speakerId);
  console.log('speed', speed);
  console.log('text', text);

  const audio = tts.generate({text: text, sid: speakerId, speed: speed});

  console.log(audio.samples.length, audio.sampleRate);

  // Create the context on first use and reuse it for later generations.
  if (!audioCtx) {
    audioCtx = new AudioContext({sampleRate: tts.sampleRate});
  }

  // One-channel buffer holding the generated samples.
  const buffer =
      audioCtx.createBuffer(1, audio.samples.length, tts.sampleRate);
  buffer.getChannelData(0).set(audio.samples);

  const source = audioCtx.createBufferSource();
  source.buffer = buffer;
  source.connect(audioCtx.destination);
  source.start();

  createAudioTag(audio);
};
/**
 * Append a clip entry for generated audio to the `soundClips` element.
 *
 * The entry consists of an <audio> player backed by a WAV blob, a label that
 * can be renamed by clicking it, and a Delete button that removes the entry.
 * The label is built from the running clip index and the first 100 characters
 * of the current text-area content.
 *
 * @param {{samples: ArrayLike<number>, sampleRate: number}} generateAudio
 *     Generated audio; both fields are forwarded to toWav().
 */
function createAudioTag(generateAudio) {
  const blob = toWav(generateAudio.samples, generateAudio.sampleRate);

  const text = textArea.value.trim().substring(0, 100);
  const clipName = `${index} ${text} ...`;
  index += 1;

  const clipContainer = document.createElement('article');
  const clipLabel = document.createElement('p');
  const audio = document.createElement('audio');
  const deleteButton = document.createElement('button');

  clipContainer.classList.add('clip');
  audio.controls = true;
  deleteButton.textContent = 'Delete';
  deleteButton.className = 'delete';
  clipLabel.textContent = clipName;

  clipContainer.appendChild(audio);
  clipContainer.appendChild(clipLabel);
  clipContainer.appendChild(deleteButton);
  soundClips.appendChild(clipContainer);

  const audioURL = window.URL.createObjectURL(blob);
  audio.src = audioURL;

  deleteButton.onclick = function() {
    clipContainer.remove();
    // The object URL keeps the WAV blob alive until it is revoked; release it
    // together with the entry.
    window.URL.revokeObjectURL(audioURL);
  };

  clipLabel.onclick = function() {
    const newClipName = prompt('Enter a new name for your sound clip?');
    // Cancel (null) keeps the current name. Blank input is treated the same
    // way so the label never becomes empty and impossible to click again.
    if (newClipName !== null && newClipName.trim().length > 0) {
      clipLabel.textContent = newClipName;
    }
  };
}
// This function is copied/modified from
// https://gist.github.com/meziantou/edb7217fddfbb70e899e
/**
 * Encode single-channel floating-point audio as a 16-bit PCM WAV file.
 *
 * Each sample is clamped to [-1, 1] and scaled by 32767 before being stored
 * as a little-endian signed 16-bit integer.
 *
 * @param {ArrayLike<number>} floatSamples Samples to encode.
 * @param {number} sampleRate Sample rate in Hz, written into the header.
 * @returns {Blob} Blob of type 'audio/wav': a 44-byte header followed by
 *     two bytes per sample.
 */
function toWav(floatSamples, sampleRate) {
  const headerSize = 44;
  const bytesPerSample = 2;
  const numSamples = floatSamples.length;
  const dataSize = numSamples * bytesPerSample;

  const view = new DataView(new ArrayBuffer(headerSize + dataSize));

  // Header layout: http://soundfile.sapp.org/doc/WaveFormat/
  // The four-character tags are written as little-endian 32-bit integers, so
  // the hex constants hold the characters in reverse order.
  view.setUint32(0, 0x46464952, true);      // chunkID "RIFF"
  view.setUint32(4, 36 + dataSize, true);   // chunkSize
  view.setUint32(8, 0x45564157, true);      // format "WAVE"

  view.setUint32(12, 0x20746d66, true);     // subchunk1ID "fmt "
  view.setUint32(16, 16, true);             // subchunk1Size, 16 for PCM
  // audioFormat is a 16-bit field; a 32-bit write here would spill into
  // numChannels.
  view.setUint16(20, 1, true);              // audioFormat, 1 for PCM
  view.setUint16(22, 1, true);              // numChannels: 1 channel
  view.setUint32(24, sampleRate, true);     // sampleRate
  view.setUint32(28, sampleRate * bytesPerSample, true);  // byteRate
  view.setUint16(32, bytesPerSample, true); // blockAlign
  view.setUint16(34, 16, true);             // bitsPerSample

  view.setUint32(36, 0x61746164, true);     // subchunk2ID "data"
  view.setUint32(40, dataSize, true);       // subchunk2Size

  for (let i = 0; i < numSamples; ++i) {
    const clamped = Math.max(-1, Math.min(1, floatSamples[i]));
    // setInt16 drops the fractional part, like storing into an Int16Array.
    view.setInt16(headerSize + i * bytesPerSample, clamped * 32767, true);
  }

  return new Blob([view], {type: 'audio/wav'});
}