diff options
author | Martin Czygan <martin.czygan@gmail.com> | 2020-11-24 23:51:40 +0100 |
---|---|---|
committer | Martin Czygan <martin.czygan@gmail.com> | 2020-11-24 23:51:40 +0100 |
commit | 268e7948e6fa2ee9871430104f60bdab3212464c (patch) | |
tree | b25b96f17767a4f9fdd72e73ccbb5d7b41050314 /tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy | |
parent | 48d9265ce97e032e4f5fd2aaa3bde7fb8f49d6c5 (diff) | |
download | fuzzycat-268e7948e6fa2ee9871430104f60bdab3212464c.tar.gz fuzzycat-268e7948e6fa2ee9871430104f60bdab3212464c.zip |
move towards data subdir
Diffstat (limited to 'tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy')
-rw-r--r-- | tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy | 49 |
1 files changed, 49 insertions, 0 deletions
diff --git a/tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy b/tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy new file mode 100644 index 0000000..a14a775 --- /dev/null +++ b/tests/data/release/efumvvpw6jbb7ehp2qfdatgxzy @@ -0,0 +1,49 @@ +{ + "abstracts": [ + { + "content": "This paper introduces Taco-VC, a novel architecture for voice conversion\nbased on Tacotron synthesizer, which is a sequence-to-sequence with attention\nmodel. The training of multi-speaker voice conversion systems requires a large\nnumber of resources, both in training and corpus size. Taco-VC is implemented\nusing a single speaker Tacotron synthesizer based on Phonetic PosteriorGrams\n(PPGs) and a single speaker WaveNet vocoder conditioned on mel spectrograms. To\nenhance the converted speech quality, and to overcome over-smoothing, the\noutputs of Tacotron are passed through a novel speechenhancement network, which\nis composed of a combination of the phoneme recognition and Tacotron networks.\nOur system is trained just with a single speaker corpus and adapts to new\nspeakers using only a few minutes of training data. Using mid-size public\ndatasets, our method outperforms the baseline in the VCC 2018 SPOKE\nnon-parallel voice conversion task and achieves competitive results compared to\nmulti-speaker networks trained on large private datasets.", + "lang": "en", + "mimetype": "text/plain", + "sha1": "3d39e2b0529feac401b47d8f5c048e27be0e9b60" + } + ], + "contribs": [ + { + "index": 0, + "raw_name": "Roee Levy Leshem", + "role": "author" + }, + { + "index": 1, + "raw_name": "Raja Giryes", + "role": "author" + } + ], + "ext_ids": { + "arxiv": "1904.03522v4" + }, + "extra": { + "arxiv": { + "base_id": "1904.03522", + "categories": [ + "cs.SD", + "cs.LG", + "eess.AS" + ], + "comments": "Accepted to EUSIPCO 2020" + } + }, + "ident": "efumvvpw6jbb7ehp2qfdatgxzy", + "language": "en", + "license_slug": "ARXIV-1.0", + "refs": [], + "release_date": "2020-06-19", + "release_stage": "submitted", + "release_type": "article", + "release_year": 2020, + "revision": "32b1f508-d004-47dc-bc1a-2a65feb3a1a7", + "state": "active", + "title": "Taco-VC: A Single Speaker Tacotron based Voice Conversion with Limited Data", + "version": "v4", + "work_id": "bqizapjfrfbbhnele4mba3e5ay" +} |