{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Text-to-Speech web inference using Gradio" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "TTS Mel synthesis + Vocoder" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "
\n", "|  | Size (MB) | Quantized Size (MB) | Understand punctuation | Is lowercase |\n",
"|---|---|---|---|---|\n",
"| male | 119 | 27.6 | True | True |\n",
"| female | 119 | 27.6 | True | True |\n",
"| haqkiem | 119 | 27.6 | True | True |\n",
"| female-singlish | 119 | 27.6 | True | True |\n",
"| yasmin | 119 | 27.6 | True | False |\n",
"| osman | 119 | 27.6 | True | False |\n",
"| multispeaker | 404 | 79.9 | True | True |\n", "