{"data":{"id":"10.48550/arxiv.1809.10460","type":"dois","attributes":{"doi":"10.48550/arxiv.1809.10460","prefix":"10.48550","suffix":"arxiv.1809.10460","identifiers":[{"identifier":"1809.10460","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"1809.10460"}],"creators":[{"name":"Chen, Yutian","nameType":"Personal","givenName":"Yutian","familyName":"Chen","affiliation":[],"nameIdentifiers":[]},{"name":"Assael, Yannis","nameType":"Personal","givenName":"Yannis","familyName":"Assael","affiliation":[],"nameIdentifiers":[]},{"name":"Shillingford, Brendan","nameType":"Personal","givenName":"Brendan","familyName":"Shillingford","affiliation":[],"nameIdentifiers":[]},{"name":"Budden, David","nameType":"Personal","givenName":"David","familyName":"Budden","affiliation":[],"nameIdentifiers":[]},{"name":"Reed, Scott","nameType":"Personal","givenName":"Scott","familyName":"Reed","affiliation":[],"nameIdentifiers":[]},{"name":"Zen, Heiga","nameType":"Personal","givenName":"Heiga","familyName":"Zen","affiliation":[],"nameIdentifiers":[]},{"name":"Wang, Quan","nameType":"Personal","givenName":"Quan","familyName":"Wang","affiliation":[],"nameIdentifiers":[]},{"name":"Cobo, Luis C.","nameType":"Personal","givenName":"Luis C.","familyName":"Cobo","affiliation":[],"nameIdentifiers":[]},{"name":"Trask, Andrew","nameType":"Personal","givenName":"Andrew","familyName":"Trask","affiliation":[],"nameIdentifiers":[]},{"name":"Laurie, Ben","nameType":"Personal","givenName":"Ben","familyName":"Laurie","affiliation":[],"nameIdentifiers":[]},{"name":"Gulcehre, Caglar","nameType":"Personal","givenName":"Caglar","familyName":"Gulcehre","affiliation":[],"nameIdentifiers":[]},{"name":"Oord, Aäron van den","nameType":"Personal","givenName":"Aäron van den","familyName":"Oord","affiliation":[],"nameIdentifiers":[]},{"name":"Vinyals, Oriol","nameType":"Personal","givenName":"Oriol","familyName":"Vinyals","affiliation":[],"nameIdentifiers":[]},{"name":"de Freitas, Nando","nameType":"Personal","givenName":"Nando","familyName":"de Freitas","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"Sample Efficient Adaptive Text-to-Speech"}],"publisher":"arXiv","container":{},"publicationYear":2018,"subjects":[{"lang":"en","subject":"Machine Learning (cs.LG)","subjectScheme":"arXiv"},{"lang":"en","subject":"Sound (cs.SD)","subjectScheme":"arXiv"},{"lang":"en","subject":"Machine Learning (stat.ML)","subjectScheme":"arXiv"},{"subject":"FOS: Computer and information sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"}],"contributors":[],"dates":[{"date":"2018-09-27T11:31:19Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2018-09-28T00:09:50Z","dateType":"Updated","dateInformation":"v1"},{"date":"2018-12-21T15:23:54Z","dateType":"Submitted","dateInformation":"v2"},{"date":"2018-12-24T01:15:49Z","dateType":"Updated","dateInformation":"v2"},{"date":"2019-01-16T22:30:22Z","dateType":"Submitted","dateInformation":"v3"},{"date":"2019-01-18T01:03:17Z","dateType":"Updated","dateInformation":"v3"},{"date":"2018-09","dateType":"Available","dateInformation":"v1"},{"date":"2018","dateType":"Issued"}],"language":null,"types":{"ris":"GEN","bibtex":"misc","citeproc":"article","schemaOrg":"CreativeWork","resourceType":"Article","resourceTypeGeneral":"Preprint"},"relatedIdentifiers":[],"relatedItems":[],"sizes":[],"formats":[],"version":"3","rightsList":[{"rights":"arXiv.org perpetual, non-exclusive license","rightsUri":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/"}],"descriptions":[{"description":"We present a meta-learning approach for adaptive text-to-speech (TTS) with few data. During training, we learn a multi-speaker model using a shared conditional WaveNet core and independent learned embeddings for each speaker. The aim of training is not to produce a neural network with fixed weights, which is then deployed as a TTS system. Instead, the aim is to produce a network that requires few data at deployment time to rapidly adapt to new speakers. We introduce and benchmark three strategies: (i) learning the speaker embedding while keeping the WaveNet core fixed, (ii) fine-tuning the entire architecture with stochastic gradient descent, and (iii) predicting the speaker embedding with a trained neural network encoder. The experiments show that these approaches are successful at adapting the multi-speaker neural network to new speakers, obtaining state-of-the-art results in both sample naturalness and voice similarity with merely a few minutes of audio data from new speakers.","descriptionType":"Abstract"},{"description":"Accepted by ICLR 2019","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi4xODA5LjEwNDYwPC9pZGVudGlmaWVyPgogIDxhbHRlcm5hdGVJZGVudGlmaWVycz4KICAgIDxhbHRlcm5hdGVJZGVudGlmaWVyIGFsdGVybmF0ZUlkZW50aWZpZXJUeXBlPSJhclhpdiI+MTgwOS4xMDQ2MDwvYWx0ZXJuYXRlSWRlbnRpZmllcj4KICA8L2FsdGVybmF0ZUlkZW50aWZpZXJzPgogIDxjcmVhdG9ycz4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5DaGVuLCBZdXRpYW48L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPll1dGlhbjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5DaGVuPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPkFzc2FlbCwgWWFubmlzPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5ZYW5uaXM8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+QXNzYWVsPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlNoaWxsaW5nZm9yZCwgQnJlbmRhbjwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+QnJlbmRhbjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5TaGlsbGluZ2ZvcmQ8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+QnVkZGVuLCBEYXZpZDwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+RGF2aWQ8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+QnVkZGVuPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlJlZWQsIFNjb3R0PC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5TY290dDwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5SZWVkPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlplbiwgSGVpZ2E8L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkhlaWdhPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPlplbjwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5XYW5nLCBRdWFuPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5RdWFuPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPldhbmc8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+Q29ibywgTHVpcyBDLjwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+THVpcyBDLjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5Db2JvPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlRyYXNrLCBBbmRyZXc8L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkFuZHJldzwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5UcmFzazwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5MYXVyaWUsIEJlbjwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+QmVuPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPkxhdXJpZTwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5HdWxjZWhyZSwgQ2FnbGFyPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5DYWdsYXI8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+R3VsY2VocmU8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+T29yZCwgQcOkcm9uIHZhbiBkZW48L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkHDpHJvbiB2YW4gZGVuPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPk9vcmQ8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+VmlueWFscywgT3Jpb2w8L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPk9yaW9sPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPlZpbnlhbHM8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+ZGUgRnJlaXRhcywgTmFuZG88L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPk5hbmRvPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPmRlIEZyZWl0YXM8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgPC9jcmVhdG9ycz4KICA8dGl0bGVzPgogICAgPHRpdGxlPlNhbXBsZSBFZmZpY2llbnQgQWRhcHRpdmUgVGV4dC10by1TcGVlY2g8L3RpdGxlPgogIDwvdGl0bGVzPgogIDxwdWJsaXNoZXI+YXJYaXY8L3B1Ymxpc2hlcj4KICA8cHVibGljYXRpb25ZZWFyPjIwMTg8L3B1YmxpY2F0aW9uWWVhcj4KICA8c3ViamVjdHM+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9ImFyWGl2Ij5NYWNoaW5lIExlYXJuaW5nIChjcy5MRyk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9ImFyWGl2Ij5Tb3VuZCAoY3MuU0QpPC9zdWJqZWN0PgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJhclhpdiI+TWFjaGluZSBMZWFybmluZyAoc3RhdC5NTCk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCBzdWJqZWN0U2NoZW1lPSJGaWVsZHMgb2YgU2NpZW5jZSBhbmQgVGVjaG5vbG9neSAoRk9TKSI+Rk9TOiBDb21wdXRlciBhbmQgaW5mb3JtYXRpb24gc2NpZW5jZXM8L3N1YmplY3Q+CiAgPC9zdWJqZWN0cz4KICA8ZGF0ZXM+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDE4LTA5LTI3VDExOjMxOjE5WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDE4LTA5LTI4VDAwOjA5OjUwWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJTdWJtaXR0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjIiPjIwMTgtMTItMjFUMTU6MjM6NTRaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IlVwZGF0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjIiPjIwMTgtMTItMjRUMDE6MTU6NDlaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IlN1Ym1pdHRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MyI+MjAxOS0wMS0xNlQyMjozMDoyMlo8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iVXBkYXRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MyI+MjAxOS0wMS0xOFQwMTowMzoxN1o8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iQXZhaWxhYmxlIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDE4LTA5PC9kYXRlPgogIDwvZGF0ZXM+CiAgPHJlc291cmNlVHlwZSByZXNvdXJjZVR5cGVHZW5lcmFsPSJQcmVwcmludCI+QXJ0aWNsZTwvcmVzb3VyY2VUeXBlPgogIDx2ZXJzaW9uPjM8L3ZlcnNpb24+CiAgPHJpZ2h0c0xpc3Q+CiAgICA8cmlnaHRzIHJpZ2h0c1VSST0iaHR0cDovL2FyeGl2Lm9yZy9saWNlbnNlcy9ub25leGNsdXNpdmUtZGlzdHJpYi8xLjAvIj5hclhpdi5vcmcgcGVycGV0dWFsLCBub24tZXhjbHVzaXZlIGxpY2Vuc2U8L3JpZ2h0cz4KICA8L3JpZ2h0c0xpc3Q+CiAgPGRlc2NyaXB0aW9ucz4KICAgIDxkZXNjcmlwdGlvbiBkZXNjcmlwdGlvblR5cGU9IkFic3RyYWN0Ij5XZSBwcmVzZW50IGEgbWV0YS1sZWFybmluZyBhcHByb2FjaCBmb3IgYWRhcHRpdmUgdGV4dC10by1zcGVlY2ggKFRUUykgd2l0aCBmZXcgZGF0YS4gRHVyaW5nIHRyYWluaW5nLCB3ZSBsZWFybiBhIG11bHRpLXNwZWFrZXIgbW9kZWwgdXNpbmcgYSBzaGFyZWQgY29uZGl0aW9uYWwgV2F2ZU5ldCBjb3JlIGFuZCBpbmRlcGVuZGVudCBsZWFybmVkIGVtYmVkZGluZ3MgZm9yIGVhY2ggc3BlYWtlci4gVGhlIGFpbSBvZiB0cmFpbmluZyBpcyBub3QgdG8gcHJvZHVjZSBhIG5ldXJhbCBuZXR3b3JrIHdpdGggZml4ZWQgd2VpZ2h0cywgd2hpY2ggaXMgdGhlbiBkZXBsb3llZCBhcyBhIFRUUyBzeXN0ZW0uIEluc3RlYWQsIHRoZSBhaW0gaXMgdG8gcHJvZHVjZSBhIG5ldHdvcmsgdGhhdCByZXF1aXJlcyBmZXcgZGF0YSBhdCBkZXBsb3ltZW50IHRpbWUgdG8gcmFwaWRseSBhZGFwdCB0byBuZXcgc3BlYWtlcnMuIFdlIGludHJvZHVjZSBhbmQgYmVuY2htYXJrIHRocmVlIHN0cmF0ZWdpZXM6IChpKSBsZWFybmluZyB0aGUgc3BlYWtlciBlbWJlZGRpbmcgd2hpbGUga2VlcGluZyB0aGUgV2F2ZU5ldCBjb3JlIGZpeGVkLCAoaWkpIGZpbmUtdHVuaW5nIHRoZSBlbnRpcmUgYXJjaGl0ZWN0dXJlIHdpdGggc3RvY2hhc3RpYyBncmFkaWVudCBkZXNjZW50LCBhbmQgKGlpaSkgcHJlZGljdGluZyB0aGUgc3BlYWtlciBlbWJlZGRpbmcgd2l0aCBhIHRyYWluZWQgbmV1cmFsIG5ldHdvcmsgZW5jb2Rlci4gVGhlIGV4cGVyaW1lbnRzIHNob3cgdGhhdCB0aGVzZSBhcHByb2FjaGVzIGFyZSBzdWNjZXNzZnVsIGF0IGFkYXB0aW5nIHRoZSBtdWx0aS1zcGVha2VyIG5ldXJhbCBuZXR3b3JrIHRvIG5ldyBzcGVha2Vycywgb2J0YWluaW5nIHN0YXRlLW9mLXRoZS1hcnQgcmVzdWx0cyBpbiBib3RoIHNhbXBsZSBuYXR1cmFsbmVzcyBhbmQgdm9pY2Ugc2ltaWxhcml0eSB3aXRoIG1lcmVseSBhIGZldyBtaW51dGVzIG9mIGF1ZGlvIGRhdGEgZnJvbSBuZXcgc3BlYWtlcnMuPC9kZXNjcmlwdGlvbj4KICAgIDxkZXNjcmlwdGlvbiBkZXNjcmlwdGlvblR5cGU9Ik90aGVyIj5BY2NlcHRlZCBieSBJQ0xSIDIwMTk8L2Rlc2NyaXB0aW9uPgogIDwvZGVzY3JpcHRpb25zPgo8L3Jlc291cmNlPg==","url":"https://arxiv.org/abs/1809.10460","contentUrl":null,"metadataVersion":0,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-03-02T15:02:30.000Z","registered":"2022-03-02T15:02:31.000Z","published":"2018","updated":"2022-03-02T15:02:31.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.1809.10460","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}