{"data":{"id":"10.48550/arxiv.1609.03193","type":"dois","attributes":{"doi":"10.48550/arxiv.1609.03193","prefix":"10.48550","suffix":"arxiv.1609.03193","identifiers":[{"identifier":"1609.03193","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"1609.03193"}],"creators":[{"name":"Collobert, Ronan","nameType":"Personal","givenName":"Ronan","familyName":"Collobert","affiliation":[],"nameIdentifiers":[]},{"name":"Puhrsch, Christian","nameType":"Personal","givenName":"Christian","familyName":"Puhrsch","affiliation":[],"nameIdentifiers":[]},{"name":"Synnaeve, Gabriel","nameType":"Personal","givenName":"Gabriel","familyName":"Synnaeve","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"Wav2Letter: an End-to-End ConvNet-based Speech Recognition System"}],"publisher":"arXiv","container":{},"publicationYear":2016,"subjects":[{"lang":"en","subject":"Machine Learning (cs.LG)","subjectScheme":"arXiv"},{"lang":"en","subject":"Artificial Intelligence (cs.AI)","subjectScheme":"arXiv"},{"lang":"en","subject":"Computation and Language (cs.CL)","subjectScheme":"arXiv"},{"subject":"FOS: Computer and information sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"},{"lang":"en","subject":"I.2.6; I.2.7","subjectScheme":"ACM"}],"contributors":[],"dates":[{"date":"2016-09-11T18:56:53Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2016-09-13T00:05:06Z","dateType":"Updated","dateInformation":"v1"},{"date":"2016-09-13T02:49:05Z","dateType":"Submitted","dateInformation":"v2"},{"date":"2016-09-14T00:02:02Z","dateType":"Updated","dateInformation":"v2"},{"date":"2016-09","dateType":"Available","dateInformation":"v1"},{"date":"2016","dateType":"Issued"}],"language":null,"types":{"ris":"GEN","bibtex":"misc","citeproc":"article","schemaOrg":"CreativeWork","resourceType":"Article","resourceTypeGeneral":"Preprint"},"relatedIdentifiers":[],"relatedItems":[],"sizes":[],"formats":[],"version":"2","rightsList":[{"rights":"arXiv.org perpetual, non-exclusive license","rightsUri":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/"}],"descriptions":[{"description":"This paper presents a simple end-to-end model for speech recognition, combining a convolutional network based acoustic model and a graph decoding. It is trained to output letters, with transcribed speech, without the need for force alignment of phonemes. We introduce an automatic segmentation criterion for training from sequence annotation without alignment that is on par with CTC while being simpler. We show competitive results in word error rate on the Librispeech corpus with MFCC features, and promising results from raw waveform.","descriptionType":"Abstract"},{"description":"8 pages, 4 figures (7 plots/schemas), 2 tables (4 tabulars)","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi4xNjA5LjAzMTkzPC9pZGVudGlmaWVyPgogIDxhbHRlcm5hdGVJZGVudGlmaWVycz4KICAgIDxhbHRlcm5hdGVJZGVudGlmaWVyIGFsdGVybmF0ZUlkZW50aWZpZXJUeXBlPSJhclhpdiI+MTYwOS4wMzE5MzwvYWx0ZXJuYXRlSWRlbnRpZmllcj4KICA8L2FsdGVybmF0ZUlkZW50aWZpZXJzPgogIDxjcmVhdG9ycz4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5Db2xsb2JlcnQsIFJvbmFuPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5Sb25hbjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5Db2xsb2JlcnQ8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+UHVocnNjaCwgQ2hyaXN0aWFuPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5DaHJpc3RpYW48L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+UHVocnNjaDwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5TeW5uYWV2ZSwgR2FicmllbDwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+R2FicmllbDwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5TeW5uYWV2ZTwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+V2F2MkxldHRlcjogYW4gRW5kLXRvLUVuZCBDb252TmV0LWJhc2VkIFNwZWVjaCBSZWNvZ25pdGlvbiBTeXN0ZW08L3RpdGxlPgogIDwvdGl0bGVzPgogIDxwdWJsaXNoZXI+YXJYaXY8L3B1Ymxpc2hlcj4KICA8cHVibGljYXRpb25ZZWFyPjIwMTY8L3B1YmxpY2F0aW9uWWVhcj4KICA8c3ViamVjdHM+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9ImFyWGl2Ij5NYWNoaW5lIExlYXJuaW5nIChjcy5MRyk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9ImFyWGl2Ij5BcnRpZmljaWFsIEludGVsbGlnZW5jZSAoY3MuQUkpPC9zdWJqZWN0PgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJhclhpdiI+Q29tcHV0YXRpb24gYW5kIExhbmd1YWdlIChjcy5DTCk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCBzdWJqZWN0U2NoZW1lPSJGaWVsZHMgb2YgU2NpZW5jZSBhbmQgVGVjaG5vbG9neSAoRk9TKSI+Rk9TOiBDb21wdXRlciBhbmQgaW5mb3JtYXRpb24gc2NpZW5jZXM8L3N1YmplY3Q+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9IkFDTSI+SS4yLjY7IEkuMi43PC9zdWJqZWN0PgogIDwvc3ViamVjdHM+CiAgPGRhdGVzPgogICAgPGRhdGUgZGF0ZVR5cGU9IlN1Ym1pdHRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAxNi0wOS0xMVQxODo1Njo1M1o8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iVXBkYXRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAxNi0wOS0xM1QwMDowNTowNlo8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYyIj4yMDE2LTA5LTEzVDAyOjQ5OjA1WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYyIj4yMDE2LTA5LTE0VDAwOjAyOjAyWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJBdmFpbGFibGUiIGRhdGVJbmZvcm1hdGlvbj0idjEiPjIwMTYtMDk8L2RhdGU+CiAgPC9kYXRlcz4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IlByZXByaW50Ij5BcnRpY2xlPC9yZXNvdXJjZVR5cGU+CiAgPHZlcnNpb24+MjwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwOi8vYXJ4aXYub3JnL2xpY2Vuc2VzL25vbmV4Y2x1c2l2ZS1kaXN0cmliLzEuMC8iPmFyWGl2Lm9yZyBwZXJwZXR1YWwsIG5vbi1leGNsdXNpdmUgbGljZW5zZTwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPlRoaXMgcGFwZXIgcHJlc2VudHMgYSBzaW1wbGUgZW5kLXRvLWVuZCBtb2RlbCBmb3Igc3BlZWNoIHJlY29nbml0aW9uLCBjb21iaW5pbmcgYSBjb252b2x1dGlvbmFsIG5ldHdvcmsgYmFzZWQgYWNvdXN0aWMgbW9kZWwgYW5kIGEgZ3JhcGggZGVjb2RpbmcuIEl0IGlzIHRyYWluZWQgdG8gb3V0cHV0IGxldHRlcnMsIHdpdGggdHJhbnNjcmliZWQgc3BlZWNoLCB3aXRob3V0IHRoZSBuZWVkIGZvciBmb3JjZSBhbGlnbm1lbnQgb2YgcGhvbmVtZXMuIFdlIGludHJvZHVjZSBhbiBhdXRvbWF0aWMgc2VnbWVudGF0aW9uIGNyaXRlcmlvbiBmb3IgdHJhaW5pbmcgZnJvbSBzZXF1ZW5jZSBhbm5vdGF0aW9uIHdpdGhvdXQgYWxpZ25tZW50IHRoYXQgaXMgb24gcGFyIHdpdGggQ1RDIHdoaWxlIGJlaW5nIHNpbXBsZXIuIFdlIHNob3cgY29tcGV0aXRpdmUgcmVzdWx0cyBpbiB3b3JkIGVycm9yIHJhdGUgb24gdGhlIExpYnJpc3BlZWNoIGNvcnB1cyB3aXRoIE1GQ0MgZmVhdHVyZXMsIGFuZCBwcm9taXNpbmcgcmVzdWx0cyBmcm9tIHJhdyB3YXZlZm9ybS48L2Rlc2NyaXB0aW9uPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iT3RoZXIiPjggcGFnZXMsIDQgZmlndXJlcyAoNyBwbG90cy9zY2hlbWFzKSwgMiB0YWJsZXMgKDQgdGFidWxhcnMpPC9kZXNjcmlwdGlvbj4KICA8L2Rlc2NyaXB0aW9ucz4KPC9yZXNvdXJjZT4=","url":"https://arxiv.org/abs/1609.03193","contentUrl":null,"metadataVersion":0,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-03-05T19:43:15.000Z","registered":"2022-03-05T19:43:16.000Z","published":"2016","updated":"2022-03-05T19:43:16.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.1609.03193","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}