aboutsummaryrefslogtreecommitdiffstats
path: root/tests/data/release/funn7cwjbrgefji27tzpl4avuu
diff options
context:
space:
mode:
authorMartin Czygan <martin.czygan@gmail.com>2020-11-24 23:51:40 +0100
committerMartin Czygan <martin.czygan@gmail.com>2020-11-24 23:51:40 +0100
commit268e7948e6fa2ee9871430104f60bdab3212464c (patch)
treeb25b96f17767a4f9fdd72e73ccbb5d7b41050314 /tests/data/release/funn7cwjbrgefji27tzpl4avuu
parent48d9265ce97e032e4f5fd2aaa3bde7fb8f49d6c5 (diff)
downloadfuzzycat-268e7948e6fa2ee9871430104f60bdab3212464c.tar.gz
fuzzycat-268e7948e6fa2ee9871430104f60bdab3212464c.zip
move towards data subdir
Diffstat (limited to 'tests/data/release/funn7cwjbrgefji27tzpl4avuu')
-rw-r--r--tests/data/release/funn7cwjbrgefji27tzpl4avuu50
1 files changed, 50 insertions, 0 deletions
diff --git a/tests/data/release/funn7cwjbrgefji27tzpl4avuu b/tests/data/release/funn7cwjbrgefji27tzpl4avuu
new file mode 100644
index 0000000..8be0a7b
--- /dev/null
+++ b/tests/data/release/funn7cwjbrgefji27tzpl4avuu
@@ -0,0 +1,50 @@
+{
+ "abstracts": [
+ {
+ "content": "This paper introduces Taco-VC, a novel architecture for voice conversion (VC)\nbased on the Tacotron synthesizer, which is a sequence-to-sequence with\nattention model. Most current prosody preserving VC systems suffer from target\nsimilarity and quality issues in the converted speech. To address these\nproblems, we first recover initial prosody preserving speech using a Phonetic\nPosteriorgrams (PPGs) based Tacotron synthesizer. Then, we enhance the quality\nof the converted speech using a novel speech-enhancement network, which is\nbased on a combination of phoneme recognition and Tacotron networks. The final\nconverted speech is generated by a Wavenet vocoder conditioned on Mel\nSpectrograms. Given the advantages of a single speaker Tacotron and Wavenet, we\nshow how to adapt them to other speakers with limited training data. We\nevaluate our solution on the VCC 2018 SPOKE task. Using public mid-size\ndatasets, our method outperforms the baseline and achieves competitive results",
+ "lang": "en",
+ "mimetype": "text/plain",
+ "sha1": "6b3ec27cabf8042bb5dd6278b9aa0cee71d92789"
+ }
+ ],
+ "contribs": [
+ {
+ "index": 0,
+ "raw_name": "Roee Levy Leshem",
+ "role": "author"
+ },
+ {
+ "index": 1,
+ "raw_name": "Raja Giryes",
+ "role": "author"
+ }
+ ],
+ "ext_ids": {
+ "arxiv": "1904.03522v1"
+ },
+ "extra": {
+ "arxiv": {
+ "base_id": "1904.03522",
+ "categories": [
+ "cs.SD",
+ "cs.LG",
+ "eess.AS"
+ ],
+ "comments": "Submitted to Interspeech 2019"
+ },
+ "superceded": true
+ },
+ "ident": "funn7cwjbrgefji27tzpl4avuu",
+ "language": "en",
+ "license_slug": "ARXIV-1.0",
+ "refs": [],
+ "release_date": "2019-04-06",
+ "release_stage": "submitted",
+ "release_type": "article",
+ "release_year": 2019,
+ "revision": "8dd55bc1-c846-48f9-bcc6-96069460b8d8",
+ "state": "active",
+ "title": "Taco-VC: A Single Speaker Tacotron based Voice Conversion with Limited\n Data",
+ "version": "v1",
+ "work_id": "bqizapjfrfbbhnele4mba3e5ay"
+}