diff --git a/.gitignore b/.gitignore index 4128677..c5e29b6 100644 --- a/.gitignore +++ b/.gitignore @@ -1,2 +1,3 @@ BERT_sentiment_classifier/data/* BERT_sentiment_classifier/emotion/* +_site/ \ No newline at end of file diff --git a/_site/Gemfile b/_site/Gemfile deleted file mode 100644 index d74d7c0..0000000 --- a/_site/Gemfile +++ /dev/null @@ -1,3 +0,0 @@ -source 'https://rubygems.org' -gem 'github-pages', group: :jekyll_plugins -gem 'webrick', '~> 1.7' diff --git a/_site/Gemfile.lock b/_site/Gemfile.lock deleted file mode 100644 index ace7546..0000000 --- a/_site/Gemfile.lock +++ /dev/null @@ -1,276 +0,0 @@ -GEM - remote: https://rubygems.org/ - specs: - activesupport (7.1.3.4) - base64 - bigdecimal - concurrent-ruby (~> 1.0, >= 1.0.2) - connection_pool (>= 2.2.5) - drb - i18n (>= 1.6, < 2) - minitest (>= 5.1) - mutex_m - tzinfo (~> 2.0) - addressable (2.8.7) - public_suffix (>= 2.0.2, < 7.0) - base64 (0.2.0) - bigdecimal (3.1.8) - coffee-script (2.4.1) - coffee-script-source - execjs - coffee-script-source (1.12.2) - colorator (1.1.0) - commonmarker (0.23.10) - concurrent-ruby (1.3.3) - connection_pool (2.4.1) - dnsruby (1.72.2) - simpleidn (~> 0.2.1) - drb (2.2.1) - em-websocket (0.5.3) - eventmachine (>= 0.12.9) - http_parser.rb (~> 0) - ethon (0.16.0) - ffi (>= 1.15.0) - eventmachine (1.2.7) - execjs (2.9.1) - faraday (2.10.0) - faraday-net_http (>= 2.0, < 3.2) - logger - faraday-net_http (3.1.0) - net-http - ffi (1.17.0-arm64-darwin) - ffi (1.17.0-x86_64-darwin) - forwardable-extended (2.6.0) - gemoji (4.1.0) - github-pages (231) - github-pages-health-check (= 1.18.2) - jekyll (= 3.9.5) - jekyll-avatar (= 0.8.0) - jekyll-coffeescript (= 1.2.2) - jekyll-commonmark-ghpages (= 0.4.0) - jekyll-default-layout (= 0.1.5) - jekyll-feed (= 0.17.0) - jekyll-gist (= 1.5.0) - jekyll-github-metadata (= 2.16.1) - jekyll-include-cache (= 0.2.1) - jekyll-mentions (= 1.6.0) - jekyll-optional-front-matter (= 0.3.2) - jekyll-paginate (= 1.1.0) - jekyll-readme-index (= 
0.3.0) - jekyll-redirect-from (= 0.16.0) - jekyll-relative-links (= 0.6.1) - jekyll-remote-theme (= 0.4.3) - jekyll-sass-converter (= 1.5.2) - jekyll-seo-tag (= 2.8.0) - jekyll-sitemap (= 1.4.0) - jekyll-swiss (= 1.0.0) - jekyll-theme-architect (= 0.2.0) - jekyll-theme-cayman (= 0.2.0) - jekyll-theme-dinky (= 0.2.0) - jekyll-theme-hacker (= 0.2.0) - jekyll-theme-leap-day (= 0.2.0) - jekyll-theme-merlot (= 0.2.0) - jekyll-theme-midnight (= 0.2.0) - jekyll-theme-minimal (= 0.2.0) - jekyll-theme-modernist (= 0.2.0) - jekyll-theme-primer (= 0.6.0) - jekyll-theme-slate (= 0.2.0) - jekyll-theme-tactile (= 0.2.0) - jekyll-theme-time-machine (= 0.2.0) - jekyll-titles-from-headings (= 0.5.3) - jemoji (= 0.13.0) - kramdown (= 2.4.0) - kramdown-parser-gfm (= 1.1.0) - liquid (= 4.0.4) - mercenary (~> 0.3) - minima (= 2.5.1) - nokogiri (>= 1.13.6, < 2.0) - rouge (= 3.30.0) - terminal-table (~> 1.4) - github-pages-health-check (1.18.2) - addressable (~> 2.3) - dnsruby (~> 1.60) - octokit (>= 4, < 8) - public_suffix (>= 3.0, < 6.0) - typhoeus (~> 1.3) - html-pipeline (2.14.3) - activesupport (>= 2) - nokogiri (>= 1.4) - http_parser.rb (0.8.0) - i18n (1.14.5) - concurrent-ruby (~> 1.0) - jekyll (3.9.5) - addressable (~> 2.4) - colorator (~> 1.0) - em-websocket (~> 0.5) - i18n (>= 0.7, < 2) - jekyll-sass-converter (~> 1.0) - jekyll-watch (~> 2.0) - kramdown (>= 1.17, < 3) - liquid (~> 4.0) - mercenary (~> 0.3.3) - pathutil (~> 0.9) - rouge (>= 1.7, < 4) - safe_yaml (~> 1.0) - jekyll-avatar (0.8.0) - jekyll (>= 3.0, < 5.0) - jekyll-coffeescript (1.2.2) - coffee-script (~> 2.2) - coffee-script-source (~> 1.12) - jekyll-commonmark (1.4.0) - commonmarker (~> 0.22) - jekyll-commonmark-ghpages (0.4.0) - commonmarker (~> 0.23.7) - jekyll (~> 3.9.0) - jekyll-commonmark (~> 1.4.0) - rouge (>= 2.0, < 5.0) - jekyll-default-layout (0.1.5) - jekyll (>= 3.0, < 5.0) - jekyll-feed (0.17.0) - jekyll (>= 3.7, < 5.0) - jekyll-gist (1.5.0) - octokit (~> 4.2) - jekyll-github-metadata (2.16.1) - jekyll 
(>= 3.4, < 5.0) - octokit (>= 4, < 7, != 4.4.0) - jekyll-include-cache (0.2.1) - jekyll (>= 3.7, < 5.0) - jekyll-mentions (1.6.0) - html-pipeline (~> 2.3) - jekyll (>= 3.7, < 5.0) - jekyll-optional-front-matter (0.3.2) - jekyll (>= 3.0, < 5.0) - jekyll-paginate (1.1.0) - jekyll-readme-index (0.3.0) - jekyll (>= 3.0, < 5.0) - jekyll-redirect-from (0.16.0) - jekyll (>= 3.3, < 5.0) - jekyll-relative-links (0.6.1) - jekyll (>= 3.3, < 5.0) - jekyll-remote-theme (0.4.3) - addressable (~> 2.0) - jekyll (>= 3.5, < 5.0) - jekyll-sass-converter (>= 1.0, <= 3.0.0, != 2.0.0) - rubyzip (>= 1.3.0, < 3.0) - jekyll-sass-converter (1.5.2) - sass (~> 3.4) - jekyll-seo-tag (2.8.0) - jekyll (>= 3.8, < 5.0) - jekyll-sitemap (1.4.0) - jekyll (>= 3.7, < 5.0) - jekyll-swiss (1.0.0) - jekyll-theme-architect (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-cayman (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-dinky (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-hacker (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-leap-day (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-merlot (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-midnight (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-minimal (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-modernist (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-primer (0.6.0) - jekyll (> 3.5, < 5.0) - jekyll-github-metadata (~> 2.9) - jekyll-seo-tag (~> 2.0) - jekyll-theme-slate (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-tactile (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-theme-time-machine (0.2.0) - jekyll (> 3.5, < 5.0) - jekyll-seo-tag (~> 2.0) - jekyll-titles-from-headings (0.5.3) - jekyll (>= 3.3, < 5.0) - jekyll-watch (2.2.1) - listen (~> 3.0) - jemoji (0.13.0) - gemoji (>= 3, < 
5) - html-pipeline (~> 2.2) - jekyll (>= 3.0, < 5.0) - kramdown (2.4.0) - rexml - kramdown-parser-gfm (1.1.0) - kramdown (~> 2.0) - liquid (4.0.4) - listen (3.9.0) - rb-fsevent (~> 0.10, >= 0.10.3) - rb-inotify (~> 0.9, >= 0.9.10) - logger (1.6.0) - mercenary (0.3.6) - minima (2.5.1) - jekyll (>= 3.5, < 5.0) - jekyll-feed (~> 0.9) - jekyll-seo-tag (~> 2.1) - minitest (5.24.1) - mutex_m (0.2.0) - net-http (0.4.1) - uri - nokogiri (1.16.6-arm64-darwin) - racc (~> 1.4) - nokogiri (1.16.6-x86_64-darwin) - racc (~> 1.4) - octokit (4.25.1) - faraday (>= 1, < 3) - sawyer (~> 0.9) - pathutil (0.16.2) - forwardable-extended (~> 2.6) - public_suffix (5.1.1) - racc (1.8.0) - rb-fsevent (0.11.2) - rb-inotify (0.11.1) - ffi (~> 1.0) - rexml (3.3.1) - strscan - rouge (3.30.0) - rubyzip (2.3.2) - safe_yaml (1.0.5) - sass (3.7.4) - sass-listen (~> 4.0.0) - sass-listen (4.0.0) - rb-fsevent (~> 0.9, >= 0.9.4) - rb-inotify (~> 0.9, >= 0.9.7) - sawyer (0.9.2) - addressable (>= 2.3.5) - faraday (>= 0.17.3, < 3) - simpleidn (0.2.3) - strscan (3.1.0) - terminal-table (1.8.0) - unicode-display_width (~> 1.1, >= 1.1.1) - typhoeus (1.4.1) - ethon (>= 0.9.0) - tzinfo (2.0.6) - concurrent-ruby (~> 1.0) - unicode-display_width (1.8.0) - uri (0.13.0) - webrick (1.8.1) - -PLATFORMS - arm64-darwin - x86_64-darwin - -DEPENDENCIES - github-pages - webrick (~> 1.7) - -BUNDLED WITH - 2.5.15 diff --git a/_site/LICENSE b/_site/LICENSE deleted file mode 100644 index cc6d670..0000000 --- a/_site/LICENSE +++ /dev/null @@ -1,21 +0,0 @@ -MIT License - -Copyright (c) 2022 Ionut Bostan - -Permission is hereby granted, free of charge, to any person obtaining a copy -of this software and associated documentation files (the "Software"), to deal -in the Software without restriction, including without limitation the rights -to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -copies of the Software, and to permit persons to whom the Software is -furnished to do so, subject to the following 
conditions: - -The above copyright notice and this permission notice shall be included in all -copies or substantial portions of the Software. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -SOFTWARE. diff --git a/_site/README.md b/_site/README.md deleted file mode 100644 index c163079..0000000 --- a/_site/README.md +++ /dev/null @@ -1,40 +0,0 @@ -# Emotion-Aware Speech Generation with Integrated Text Analysis - -This repository contains the code and experiments for the final year project in Computer Science, focusing on Emotion-Aware Speech Generation with Integrated Text Analysis using emotion embeddings from a RoBERTa model. It includes various Natural Language Processing (NLP) experiments performed during an NLP course, as well as a modified version of an existing text-to-speech synthesis codebase. - -## Samples - -Please visit the [GitHub page](https://ionut-cmd.github.io/Emotion-Aware-TTS/) to view comparative samples. - -Or generate new ones on HuggingFace - - - HuggingFace - - -## Project Overview - -The project aims to generate emotion-aware speech using a modified text-to-speech synthesis system. By integrating emotion embeddings from a RoBERTa model, the generated speech output exhibits the desired emotions as specified by the input text. - -## Repository Structure - -- `FYP_Notebooks/`: Contains various notebooks for different experiments and data processing methods -- `FastSpeech2_Text_Aware_Emotion_TTS/`: Contains the modified text-to-speech synthesis codebase for emotion-aware speech generation. 
-- `Transformers_for_NLP/`: Contains various NLP experiments conducted during the Data Science: Transformers for Natural Language Processing course. -- `Utils/`: Contains the code for processing and preparing the data for training and evaluation. - -## Getting Started - -To run the experiments and use the Emotion-Aware Speech Generation system, follow these steps: - -1. Clone this repository: `git clone https://github.com/ionut-cmd/FYP.git` -2. Navigate to the `FastSpeech2_Text_Aware_Emotion_TTS/` directory. -3. Follow the installation and usage instructions provided in the `FastSpeech2_Text_Aware_Emotion_TTS/README.md` file. - -## Acknowledgements - -This project is based on the [ming024/FastSpeech2](https://github.com/ming024/FastSpeech2.git) for text-to-speech synthesis. I would like to thank the original author for their work, which served as a starting point for this project. - -## License - -This project is licensed under the [MIT License](LICENSE). diff --git a/_site/assets/main.css b/_site/assets/main.css deleted file mode 100644 index 83b9124..0000000 --- a/_site/assets/main.css +++ /dev/null @@ -1,196 +0,0 @@ -/** Reset some basic elements */ -body, h1, h2, h3, h4, h5, h6, p, blockquote, pre, hr, dl, dd, ol, ul, figure { margin: 0; padding: 0; } - -/** Basic styling */ -body { font: 400 16px/1.5 -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Helvetica, Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol"; color: #111; background-color: #fdfdfd; -webkit-text-size-adjust: 100%; -webkit-font-feature-settings: "kern" 1; -moz-font-feature-settings: "kern" 1; -o-font-feature-settings: "kern" 1; font-feature-settings: "kern" 1; font-kerning: normal; display: flex; min-height: 100vh; flex-direction: column; } - -/** Set `margin-bottom` to maintain vertical rhythm */ -h1, h2, h3, h4, h5, h6, p, blockquote, pre, ul, ol, dl, figure, .highlight { margin-bottom: 15px; } - -/** `main` element */ -main { display: block; /* Default value of 
`display` of `main` element is 'inline' in IE 11. */ } - -/** Images */ -img { max-width: 100%; vertical-align: middle; } - -/** Figures */ -figure > img { display: block; } - -figcaption { font-size: 14px; } - -/** Lists */ -ul, ol { margin-left: 30px; } - -li > ul, li > ol { margin-bottom: 0; } - -/** Headings */ -h1, h2, h3, h4, h5, h6 { font-weight: 400; } - -/** Links */ -a { color: #2a7ae2; text-decoration: none; } -a:visited { color: #1756a9; } -a:hover { color: #111; text-decoration: underline; } -.social-media-list a:hover { text-decoration: none; } -.social-media-list a:hover .username { text-decoration: underline; } - -/** Blockquotes */ -blockquote { color: #828282; border-left: 4px solid #e8e8e8; padding-left: 15px; font-size: 18px; letter-spacing: -1px; font-style: italic; } -blockquote > :last-child { margin-bottom: 0; } - -/** Code formatting */ -pre, code { font-size: 15px; border: 1px solid #e8e8e8; border-radius: 3px; background-color: #eef; } - -code { padding: 1px 5px; } - -pre { padding: 8px 12px; overflow-x: auto; } -pre > code { border: 0; padding-right: 0; padding-left: 0; } - -/** Wrapper */ -.wrapper { max-width: -webkit-calc(800px - (30px * 2)); max-width: calc(800px - (30px * 2)); margin-right: auto; margin-left: auto; padding-right: 30px; padding-left: 30px; } -@media screen and (max-width: 800px) { .wrapper { max-width: -webkit-calc(800px - (30px)); max-width: calc(800px - (30px)); padding-right: 15px; padding-left: 15px; } } - -/** Clearfix */ -.wrapper:after, .footer-col-wrapper:after { content: ""; display: table; clear: both; } - -/** Icons */ -.svg-icon { width: 16px; height: 16px; display: inline-block; fill: #828282; padding-right: 5px; vertical-align: text-top; } - -.social-media-list li + li { padding-top: 5px; } - -/** Tables */ -table { margin-bottom: 30px; width: 100%; text-align: left; color: #3f3f3f; border-collapse: collapse; border: 1px solid #e8e8e8; } -table tr:nth-child(even) { background-color: #f7f7f7; } -table 
th, table td { padding: 10px 15px; } -table th { background-color: #f0f0f0; border: 1px solid #dedede; border-bottom-color: #c9c9c9; } -table td { border: 1px solid #e8e8e8; } - -/** Site header */ -.site-header { border-top: 5px solid #424242; border-bottom: 1px solid #e8e8e8; min-height: 55.95px; position: relative; } - -.site-title { font-size: 26px; font-weight: 300; line-height: 54px; letter-spacing: -1px; margin-bottom: 0; float: left; } -.site-title, .site-title:visited { color: #424242; } - -.site-nav { float: right; line-height: 54px; } -.site-nav .nav-trigger { display: none; } -.site-nav .menu-icon { display: none; } -.site-nav .page-link { color: #111; line-height: 1.5; } -.site-nav .page-link:not(:last-child) { margin-right: 20px; } -@media screen and (max-width: 600px) { .site-nav { position: absolute; top: 9px; right: 15px; background-color: #fdfdfd; border: 1px solid #e8e8e8; border-radius: 5px; text-align: right; } - .site-nav label[for="nav-trigger"] { display: block; float: right; width: 36px; height: 36px; z-index: 2; cursor: pointer; } - .site-nav .menu-icon { display: block; float: right; width: 36px; height: 26px; line-height: 0; padding-top: 10px; text-align: center; } - .site-nav .menu-icon > svg { fill: #424242; } - .site-nav input ~ .trigger { clear: both; display: none; } - .site-nav input:checked ~ .trigger { display: block; padding-bottom: 5px; } - .site-nav .page-link { display: block; padding: 5px 10px; margin-left: 20px; } - .site-nav .page-link:not(:last-child) { margin-right: 0; } } - -/** Site footer */ -.site-footer { border-top: 1px solid #e8e8e8; padding: 30px 0; } - -.footer-heading { font-size: 18px; margin-bottom: 15px; } - -.contact-list, .social-media-list { list-style: none; margin-left: 0; } - -.footer-col-wrapper { font-size: 15px; color: #828282; margin-left: -15px; } - -.footer-col { float: left; margin-bottom: 15px; padding-left: 15px; } - -.footer-col-1 { width: -webkit-calc(35% - (30px / 2)); width: calc(35% - 
(30px / 2)); } - -.footer-col-2 { width: -webkit-calc(20% - (30px / 2)); width: calc(20% - (30px / 2)); } - -.footer-col-3 { width: -webkit-calc(45% - (30px / 2)); width: calc(45% - (30px / 2)); } - -@media screen and (max-width: 800px) { .footer-col-1, .footer-col-2 { width: -webkit-calc(50% - (30px / 2)); width: calc(50% - (30px / 2)); } - .footer-col-3 { width: -webkit-calc(100% - (30px / 2)); width: calc(100% - (30px / 2)); } } -@media screen and (max-width: 600px) { .footer-col { float: none; width: -webkit-calc(100% - (30px / 2)); width: calc(100% - (30px / 2)); } } -/** Page content */ -.page-content { padding: 30px 0; flex: 1; } - -.page-heading { font-size: 32px; } - -.post-list-heading { font-size: 28px; } - -.post-list { margin-left: 0; list-style: none; } -.post-list > li { margin-bottom: 30px; } - -.post-meta { font-size: 14px; color: #828282; } - -.post-link { display: block; font-size: 24px; } - -/** Posts */ -.post-header { margin-bottom: 30px; } - -.post-title { font-size: 42px; letter-spacing: -1px; line-height: 1; } -@media screen and (max-width: 800px) { .post-title { font-size: 36px; } } - -.post-content { margin-bottom: 30px; } -.post-content h2 { font-size: 32px; } -@media screen and (max-width: 800px) { .post-content h2 { font-size: 28px; } } -.post-content h3 { font-size: 26px; } -@media screen and (max-width: 800px) { .post-content h3 { font-size: 22px; } } -.post-content h4 { font-size: 20px; } -@media screen and (max-width: 800px) { .post-content h4 { font-size: 18px; } } - -/** Syntax highlighting styles */ -.highlight { background: #fff; } -.highlighter-rouge .highlight { background: #eef; } -.highlight .c { color: #998; font-style: italic; } -.highlight .err { color: #a61717; background-color: #e3d2d2; } -.highlight .k { font-weight: bold; } -.highlight .o { font-weight: bold; } -.highlight .cm { color: #998; font-style: italic; } -.highlight .cp { color: #999; font-weight: bold; } -.highlight .c1 { color: #998; font-style: italic; } 
-.highlight .cs { color: #999; font-weight: bold; font-style: italic; } -.highlight .gd { color: #000; background-color: #fdd; } -.highlight .gd .x { color: #000; background-color: #faa; } -.highlight .ge { font-style: italic; } -.highlight .gr { color: #a00; } -.highlight .gh { color: #999; } -.highlight .gi { color: #000; background-color: #dfd; } -.highlight .gi .x { color: #000; background-color: #afa; } -.highlight .go { color: #888; } -.highlight .gp { color: #555; } -.highlight .gs { font-weight: bold; } -.highlight .gu { color: #aaa; } -.highlight .gt { color: #a00; } -.highlight .kc { font-weight: bold; } -.highlight .kd { font-weight: bold; } -.highlight .kp { font-weight: bold; } -.highlight .kr { font-weight: bold; } -.highlight .kt { color: #458; font-weight: bold; } -.highlight .m { color: #099; } -.highlight .s { color: #d14; } -.highlight .na { color: #008080; } -.highlight .nb { color: #0086B3; } -.highlight .nc { color: #458; font-weight: bold; } -.highlight .no { color: #008080; } -.highlight .ni { color: #800080; } -.highlight .ne { color: #900; font-weight: bold; } -.highlight .nf { color: #900; font-weight: bold; } -.highlight .nn { color: #555; } -.highlight .nt { color: #000080; } -.highlight .nv { color: #008080; } -.highlight .ow { font-weight: bold; } -.highlight .w { color: #bbb; } -.highlight .mf { color: #099; } -.highlight .mh { color: #099; } -.highlight .mi { color: #099; } -.highlight .mo { color: #099; } -.highlight .sb { color: #d14; } -.highlight .sc { color: #d14; } -.highlight .sd { color: #d14; } -.highlight .s2 { color: #d14; } -.highlight .se { color: #d14; } -.highlight .sh { color: #d14; } -.highlight .si { color: #d14; } -.highlight .sx { color: #d14; } -.highlight .sr { color: #009926; } -.highlight .s1 { color: #d14; } -.highlight .ss { color: #990073; } -.highlight .bp { color: #999; } -.highlight .vc { color: #008080; } -.highlight .vg { color: #008080; } -.highlight .vi { color: #008080; } -.highlight .il { color: 
#099; } diff --git a/_site/assets/minima-social-icons.svg b/_site/assets/minima-social-icons.svg deleted file mode 100644 index fa7399f..0000000 --- a/_site/assets/minima-social-icons.svg +++ /dev/null @@ -1,33 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - diff --git a/_site/feed.xml b/_site/feed.xml deleted file mode 100644 index d41539b..0000000 --- a/_site/feed.xml +++ /dev/null @@ -1,2 +0,0 @@ -Jekyll2024-07-20T11:29:54+01:00http://localhost:4000/feed.xmlMaking Social Platforms Accessible: -Emotion-Aware Speech Generation with Integrated TextEmotion-Aware TTS \ No newline at end of file diff --git a/_site/index.html b/_site/index.html deleted file mode 100644 index 5ac9a0b..0000000 --- a/_site/index.html +++ /dev/null @@ -1,280 +0,0 @@ - - - - - -Emotion-Aware TTS | Making Social Platforms Accessible: Emotion-Aware Speech Generation with Integrated Text - - - - - - - - - - - - - - - -
-
-

Authors

- -

Suparna De
-Email: s.de@surrey.ac.uk

- -

Ionut Bostan
-Email: ionut@nquiringminds.com

- -

Nishanth Sastry
-Email: n.sastry@surrey.ac.uk

- -
- -

Abstract

- -

Recent studies have outlined the accessibility challenges that blind and visually impaired people face in interacting -with social networks, with monotone text-to-speech (TTS) screen -readers and audio narration of visual elements such as emojis. -Emotional speech generation traditionally relies on human input -of the expected emotion together with the text to synthesise, -with additional challenges around data simplification (causing -information loss) and duration inaccuracy, leading to lack of -expressive emotional rendering. In real-life communications, the -duration of phonemes can vary since the same sentence might -be spoken in a variety of ways depending on the speakers’ -emotional states or accents (referred to as the one-to-many -problem of text to speech generation). As a result, an advanced -voice synthesis system is required to account for this unpredictability. We propose an end-to-end context-aware Text-toSpeech (TTS) synthesis system that derives the conveyed emotion -from text input and synthesises audio that focuses on emotions -and speaker features for natural and expressive speech, integrating advanced natural language processing (NLP) and speech -synthesis techniques for real-time applications. The proposed -system has two core components: an emotion classifier and a -speech synthesiser. The emotion classifier utilises a classification -model to extract sentiment information from the input text. -Leveraging a non-autoregressive neural TTS model, the speech -synthesiser generates Mel-spectrograms by incorporating speaker -and emotion embeddings derived from the classifier’s output. We -employ a Generative Adversarial Network (GAN)-based vocoder -to convert the Mel-spectrograms into audible waveforms. One of -the key contributions lies in effectively incorporating emotional -characteristics into TTS synthesis. 
Our system also showcases -competitive inference time performance when benchmarked -against the state-of-the-art TTS models, making it suitable for -real-time accessibility applications.

- -
- -

Demo

- -

Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Below, you can listen to audio samples from different TTS models.

- - - - - - - - - - - - - - - - - - - - - - - - - - -
DescriptionFastSpeech 2[1]TEMOTTS[2]Our Model
Bikes are fun to ride - - - - - -
Dreams can come true - - - - - -
Friends make life more fun - - - - - -
- -

Emotion Aware Samples

- - - - - - - - - - - - - - - - - - - - - - - - - - -
DescriptionFastSpeech 2[1]TEMOTTS[2]Our Model
Blowing out birthday candles makes me feel special! - - - - - -
Her heart felt heavy with sorrow - - - - - -
I am feeling sad - - - - - -
- -

References

- -
- -
    -
  1. Yi Ren, Chenxu Hu, Xu Tan, Tao Qin, Sheng Zhao, Zhou Zhao, and Tie-Yan Liu, “Fastspeech 2: Fast and high-quality end-to-end text to speech,” in International Conference on Learning Representations, 2021.
  2. -
  3. Shreeram Suresh Chandra, Zongyang Du, Berrak Sisman, “TEMOTTS: Text-aware Emotional Text-to-Speech with no labels”, Speech & Machine Learning Lab, The University of Texas at Dallas, TX, USA, 2024.
  4. -
- -
-
- - - diff --git a/_site/samples/fastspeech/Bikes_are_fun_to_ride__gen.wav b/_site/samples/fastspeech/Bikes_are_fun_to_ride__gen.wav deleted file mode 100644 index 940f640..0000000 Binary files a/_site/samples/fastspeech/Bikes_are_fun_to_ride__gen.wav and /dev/null differ diff --git a/_site/samples/fastspeech/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav b/_site/samples/fastspeech/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav deleted file mode 100644 index 5ec1998..0000000 Binary files a/_site/samples/fastspeech/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav and /dev/null differ diff --git a/_site/samples/fastspeech/Dreams_can_come_true__gen.wav b/_site/samples/fastspeech/Dreams_can_come_true__gen.wav deleted file mode 100644 index 260efb7..0000000 Binary files a/_site/samples/fastspeech/Dreams_can_come_true__gen.wav and /dev/null differ diff --git a/_site/samples/fastspeech/Friends_make_life_more_fun__gen.wav b/_site/samples/fastspeech/Friends_make_life_more_fun__gen.wav deleted file mode 100644 index d2cb8c3..0000000 Binary files a/_site/samples/fastspeech/Friends_make_life_more_fun__gen.wav and /dev/null differ diff --git a/_site/samples/fastspeech/Her_heart_felt_heavy_with_sorrow__gen.wav b/_site/samples/fastspeech/Her_heart_felt_heavy_with_sorrow__gen.wav deleted file mode 100644 index 2a0692b..0000000 Binary files a/_site/samples/fastspeech/Her_heart_felt_heavy_with_sorrow__gen.wav and /dev/null differ diff --git a/_site/samples/fastspeech/I_am_feeling_sad__gen.wav b/_site/samples/fastspeech/I_am_feeling_sad__gen.wav deleted file mode 100644 index f11eac3..0000000 Binary files a/_site/samples/fastspeech/I_am_feeling_sad__gen.wav and /dev/null differ diff --git a/_site/samples/ours/Bikes are fun to ride..wav b/_site/samples/ours/Bikes are fun to ride..wav deleted file mode 100644 index a9dce57..0000000 Binary files a/_site/samples/ours/Bikes are fun to ride..wav and /dev/null differ diff --git 
a/_site/samples/ours/Blowing out birthday candles makes me feel special!.wav b/_site/samples/ours/Blowing out birthday candles makes me feel special!.wav deleted file mode 100644 index 4082a88..0000000 Binary files a/_site/samples/ours/Blowing out birthday candles makes me feel special!.wav and /dev/null differ diff --git a/_site/samples/ours/Dreams can come true.wav b/_site/samples/ours/Dreams can come true.wav deleted file mode 100644 index 7a663c5..0000000 Binary files a/_site/samples/ours/Dreams can come true.wav and /dev/null differ diff --git a/_site/samples/ours/Friends make life more fun.wav b/_site/samples/ours/Friends make life more fun.wav deleted file mode 100644 index fdb08a1..0000000 Binary files a/_site/samples/ours/Friends make life more fun.wav and /dev/null differ diff --git a/_site/samples/ours/Her heart felt heavy with sorrow.wav b/_site/samples/ours/Her heart felt heavy with sorrow.wav deleted file mode 100644 index 87fb160..0000000 Binary files a/_site/samples/ours/Her heart felt heavy with sorrow.wav and /dev/null differ diff --git a/_site/samples/ours/I am feeling sad.wav b/_site/samples/ours/I am feeling sad.wav deleted file mode 100644 index a96f004..0000000 Binary files a/_site/samples/ours/I am feeling sad.wav and /dev/null differ diff --git a/_site/samples/temotts/Bikes_are_fun_to_ride__gen.wav b/_site/samples/temotts/Bikes_are_fun_to_ride__gen.wav deleted file mode 100644 index 02793e4..0000000 Binary files a/_site/samples/temotts/Bikes_are_fun_to_ride__gen.wav and /dev/null differ diff --git a/_site/samples/temotts/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav b/_site/samples/temotts/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav deleted file mode 100644 index b38d953..0000000 Binary files a/_site/samples/temotts/Blowing_out_birthday_candles_makes_me_feel_special__gen.wav and /dev/null differ diff --git a/_site/samples/temotts/Dreams_can_come_true__gen.wav 
b/_site/samples/temotts/Dreams_can_come_true__gen.wav deleted file mode 100644 index 7105f42..0000000 Binary files a/_site/samples/temotts/Dreams_can_come_true__gen.wav and /dev/null differ diff --git a/_site/samples/temotts/Friends_make_life_more_fun__gen.wav b/_site/samples/temotts/Friends_make_life_more_fun__gen.wav deleted file mode 100644 index 2128eca..0000000 Binary files a/_site/samples/temotts/Friends_make_life_more_fun__gen.wav and /dev/null differ diff --git a/_site/samples/temotts/Her_heart_felt_heavy_with_sorrow__gen.wav b/_site/samples/temotts/Her_heart_felt_heavy_with_sorrow__gen.wav deleted file mode 100644 index 6d49a61..0000000 Binary files a/_site/samples/temotts/Her_heart_felt_heavy_with_sorrow__gen.wav and /dev/null differ diff --git a/_site/samples/temotts/I_am_feeling_sad__gen.wav b/_site/samples/temotts/I_am_feeling_sad__gen.wav deleted file mode 100644 index c9b7aec..0000000 Binary files a/_site/samples/temotts/I_am_feeling_sad__gen.wav and /dev/null differ diff --git a/index.md b/index.md index 356fd40..4b786a3 100644 --- a/index.md +++ b/index.md @@ -52,7 +52,7 @@ real-time accessibility applications. ## Demo -Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Below, you can listen to audiohttps://github.com/ionut-cmd/Emotion-Aware-TTS/tree/main/FastSpeech2_Text_Aware_Emotion_TTS samples from different TTS models. +Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Below, you can listen to audio samples from different TTS models. @@ -65,19 +65,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Be @@ -86,19 +86,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Be @@ -107,19 +107,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. 
Be @@ -139,19 +139,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Be @@ -160,19 +160,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Be @@ -181,19 +181,19 @@ Welcome to the demonstration page of our Emotion-Aware Text-to-Speech Models. Be
Bikes are fun to ride Dreams can come true Friends make life more fun Blowing out birthday candles makes me feel special! Her heart felt heavy with sorrow I am feeling sad