// Page elements this script reads from and writes to.
const generateBtn = document.getElementById('generateBtn');
const hint = document.getElementById('hint');
const speakerIdLabel = document.getElementById('speakerIdLabel');
const speakerIdInput = document.getElementById('speakerId');
const speedInput = document.getElementById('speed');
const speedValue = document.getElementById('speedValue');
const textArea = document.getElementById('text');
const soundClips = document.getElementById('sound-clips');

// Show the speed control's initial value. The value is plain text, so
// textContent is used rather than innerHTML.
speedValue.textContent = speedInput.value;

// Counter used by createAudioTag() to number the generated clips.
let index = 0;

// Text-to-speech engine; assigned in Module.onRuntimeInitialized.
let tts = null;

// AudioContext used for playback; created lazily on the first Generate click.
let audioCtx = null;

// Global module object. It is deliberately assigned without a declaration so
// that it lives on the global object.
// NOTE(review): presumably picked up by a WebAssembly loader script that is
// loaded after this file - confirm against the hosting page.
Module = {};

// Runs once the runtime reports it is initialized: creates the tts engine,
// updates the UI text and enables the Generate button.
Module.onRuntimeInitialized = function() {
  console.log('Model files downloaded!');

  console.log('Initializing tts ......');
  // createOfflineTts is not defined in this part of the file; it is expected
  // to be provided by another script.
  tts = createOfflineTts(Module);

  // Only advertise a speaker-id range when there is more than one speaker.
  if (tts.numSpeakers > 1) {
    speakerIdLabel.textContent = `Speaker ID (0 - ${tts.numSpeakers - 1}):`;
  }

  hint.innerText =
      'Initialized! Please enter text and click the Generate button.';

  generateBtn.disabled = false;
};

// Mirror the speed control's current value into its label as the user
// changes it.
speedInput.oninput = function() {
  speedValue.textContent = this.value;
};

// Handles a click on the Generate button: validates the speaker id and the
// text, synthesizes audio with the tts engine, plays it through the Web Audio
// API and adds a clip entry to the page via createAudioTag().
generateBtn.onclick = function() {
  const rawSpeakerId = speakerIdInput.value.trim();
  if (rawSpeakerId.length === 0) {
    alert('Please input a speakerId');
    return;
  }

  const maxSpeakerId = tts.numSpeakers - 1;

  // Only plain non-negative decimal integers are accepted.
  if (!/^\d+$/.test(rawSpeakerId)) {
    alert(`Input speakerID ${
        rawSpeakerId} is not a number.\nPlease enter a number between 0 and ${
        maxSpeakerId}`);
    return;
  }

  const speakerId = Number.parseInt(rawSpeakerId, 10);
  if (speakerId > maxSpeakerId) {
    alert(`Please enter a number between 0 and ${maxSpeakerId}`);
    return;
  }

  const text = textArea.value.trim();
  if (text.length === 0) {
    alert('Please input a non-blank text');
    return;
  }

  // The input element yields a string; hand the engine a real number.
  const speed = Number.parseFloat(speedInput.value);

  console.log('speakerId', speakerId);
  console.log('speed', speed);
  console.log('text', text);

  const audio = tts.generate({text: text, sid: speakerId, speed: speed});

  console.log(audio.samples.length, audio.sampleRate);

  // createBuffer() rejects a zero-length buffer, so stop before playback and
  // before adding an empty clip to the page.
  if (audio.samples.length === 0) {
    console.warn('No audio samples were generated');
    return;
  }

  if (!audioCtx) {
    audioCtx = new AudioContext({sampleRate: tts.sampleRate});
  }

  // Describe the buffer with the sample rate reported alongside the samples,
  // which is also the rate createAudioTag() writes into the WAV file.
  const buffer =
      audioCtx.createBuffer(1, audio.samples.length, audio.sampleRate);
  buffer.getChannelData(0).set(audio.samples);

  const source = audioCtx.createBufferSource();
  source.buffer = buffer;
  source.connect(audioCtx.destination);
  source.start();

  createAudioTag(audio);
};

/**
 * Appends a playable clip entry (audio player, label and Delete button) to
 * the sound-clips container.
 *
 * The label is built from the running clip index and the first 100 characters
 * of the trimmed text area content. Clicking the label prompts for a new name.
 *
 * @param {{samples: ArrayLike<number>, sampleRate: number}} generateAudio
 *     Audio to encode as WAV and attach to the new audio element.
 */
function createAudioTag(generateAudio) {
  const blob = toWav(generateAudio.samples, generateAudio.sampleRate);
  const audioURL = window.URL.createObjectURL(blob);

  const text = textArea.value.trim().substring(0, 100);
  const clipName = `${index} ${text} ...`;
  index += 1;

  const clipContainer = document.createElement('article');
  clipContainer.classList.add('clip');

  const audio = document.createElement('audio');
  audio.controls = true;
  audio.src = audioURL;

  const clipLabel = document.createElement('p');
  clipLabel.textContent = clipName;

  const deleteButton = document.createElement('button');
  deleteButton.textContent = 'Delete';
  deleteButton.className = 'delete';

  clipContainer.appendChild(audio);
  clipContainer.appendChild(clipLabel);
  clipContainer.appendChild(deleteButton);
  soundClips.appendChild(clipContainer);

  deleteButton.onclick = function() {
    clipContainer.remove();
    // Release the blob backing this clip; otherwise it stays alive for the
    // lifetime of the page.
    window.URL.revokeObjectURL(audioURL);
  };

  clipLabel.onclick = function() {
    const newClipName = prompt('Enter a new name for your sound clip?');
    // prompt() returns null when the dialog is cancelled; keep the old name.
    if (newClipName !== null) {
      clipLabel.textContent = newClipName;
    }
  };
}

/**
 * Encodes floating-point samples as a mono, 16-bit PCM WAV file.
 *
 * Each sample is clamped to [-1, 1] and scaled by 32767; the fractional part
 * is dropped by the 16-bit integer conversion.
 *
 * @param {ArrayLike<number>} floatSamples Audio samples to encode.
 * @param {number} sampleRate Sample rate in Hz written into the header.
 * @returns {Blob} Blob of type 'audio/wav' holding the 44-byte header
 *     followed by the little-endian sample data.
 */
function toWav(floatSamples, sampleRate) {
  const HEADER_BYTES = 44;
  const BYTES_PER_SAMPLE = 2;
  const dataBytes = floatSamples.length * BYTES_PER_SAMPLE;

  const view = new DataView(new ArrayBuffer(HEADER_BYTES + dataBytes));

  // Writes a four-character ASCII chunk tag at the given byte offset.
  const writeTag = (offset, tag) => {
    for (let i = 0; i < tag.length; ++i) {
      view.setUint8(offset + i, tag.charCodeAt(i));
    }
  };

  // RIFF container header.
  writeTag(0, 'RIFF');
  view.setUint32(4, 36 + dataBytes, true);  // bytes following this field
  writeTag(8, 'WAVE');

  // Format chunk.
  writeTag(12, 'fmt ');
  view.setUint32(16, 16, true);  // format chunk size
  view.setUint16(20, 1, true);   // audio format: 1 = PCM
  view.setUint16(22, 1, true);   // number of channels
  view.setUint32(24, sampleRate, true);
  view.setUint32(28, sampleRate * BYTES_PER_SAMPLE, true);  // byte rate
  view.setUint16(32, BYTES_PER_SAMPLE, true);               // block align
  view.setUint16(34, 16, true);                             // bits per sample

  // Data chunk.
  writeTag(36, 'data');
  view.setUint32(40, dataBytes, true);

  let offset = HEADER_BYTES;
  for (let i = 0; i < floatSamples.length; ++i) {
    let s = floatSamples[i];
    if (s >= 1) {
      s = 1;
    } else if (s <= -1) {
      s = -1;
    }

    view.setInt16(offset, s * 32767, true);
    offset += BYTES_PER_SAMPLE;
  }

  return new Blob([view], {type: 'audio/wav'});
}
