{"data":{"id":"10.48550/arxiv.2204.05999","type":"dois","attributes":{"doi":"10.48550/arxiv.2204.05999","prefix":"10.48550","suffix":"arxiv.2204.05999","identifiers":[{"identifier":"2204.05999","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"2204.05999"}],"creators":[{"name":"Fried, Daniel","nameType":"Personal","givenName":"Daniel","familyName":"Fried","affiliation":[],"nameIdentifiers":[]},{"name":"Aghajanyan, Armen","nameType":"Personal","givenName":"Armen","familyName":"Aghajanyan","affiliation":[],"nameIdentifiers":[]},{"name":"Lin, Jessy","nameType":"Personal","givenName":"Jessy","familyName":"Lin","affiliation":[],"nameIdentifiers":[]},{"name":"Wang, Sida","nameType":"Personal","givenName":"Sida","familyName":"Wang","affiliation":[],"nameIdentifiers":[]},{"name":"Wallace, Eric","nameType":"Personal","givenName":"Eric","familyName":"Wallace","affiliation":[],"nameIdentifiers":[]},{"name":"Shi, Freda","nameType":"Personal","givenName":"Freda","familyName":"Shi","affiliation":[],"nameIdentifiers":[]},{"name":"Zhong, Ruiqi","nameType":"Personal","givenName":"Ruiqi","familyName":"Zhong","affiliation":[],"nameIdentifiers":[]},{"name":"Yih, Wen-tau","nameType":"Personal","givenName":"Wen-tau","familyName":"Yih","affiliation":[],"nameIdentifiers":[]},{"name":"Zettlemoyer, Luke","nameType":"Personal","givenName":"Luke","familyName":"Zettlemoyer","affiliation":[],"nameIdentifiers":[]},{"name":"Lewis, Mike","nameType":"Personal","givenName":"Mike","familyName":"Lewis","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"InCoder: A Generative Model for Code Infilling and Synthesis"}],"publisher":"arXiv","container":{},"publicationYear":2022,"subjects":[{"lang":"en","subject":"Software Engineering (cs.SE)","subjectScheme":"arXiv"},{"lang":"en","subject":"Computation and Language (cs.CL)","subjectScheme":"arXiv"},{"lang":"en","subject":"Machine Learning (cs.LG)","subjectScheme":"arXiv"},{"subject":"FOS: Computer and information sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"}],"contributors":[],"dates":[{"date":"2022-04-12T16:25:26Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2022-04-14T00:00:09Z","dateType":"Updated","dateInformation":"v1"},{"date":"2022-04-17T17:30:27Z","dateType":"Submitted","dateInformation":"v2"},{"date":"2022-04-19T00:31:28Z","dateType":"Updated","dateInformation":"v2"},{"date":"2023-04-09T14:31:40Z","dateType":"Submitted","dateInformation":"v3"},{"date":"2023-04-11T00:14:38Z","dateType":"Updated","dateInformation":"v3"},{"date":"2022-04","dateType":"Available","dateInformation":"v1"},{"date":"2022","dateType":"Issued"}],"language":null,"types":{"ris":"GEN","bibtex":"misc","citeproc":"article","schemaOrg":"CreativeWork","resourceType":"Article","resourceTypeGeneral":"Preprint"},"relatedIdentifiers":[],"relatedItems":[],"sizes":[],"formats":[],"version":"3","rightsList":[{"rights":"Creative Commons Attribution Non Commercial Share Alike 4.0 International","rightsUri":"https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode","schemeUri":"https://spdx.org/licenses/","rightsIdentifier":"cc-by-nc-sa-4.0","rightsIdentifierScheme":"SPDX"}],"descriptions":[{"description":"Code is seldom written in a single left-to-right pass and is instead repeatedly edited and refined. We introduce InCoder, a unified generative model that can perform program synthesis (via left-to-right generation) as well as editing (via infilling). InCoder is trained to generate code files from a large corpus of permissively licensed code, where regions of code have been randomly masked and moved to the end of each file, allowing code infilling with bidirectional context. Our model is the first generative model that is able to directly perform zero-shot code infilling, which we evaluate on challenging tasks such as type inference, comment generation, and variable re-naming. We find that the ability to condition on bidirectional context substantially improves performance on these tasks, while still performing comparably on standard program synthesis benchmarks in comparison to left-to-right only models pretrained at similar scale. The InCoder models and code are publicly released. https://sites.google.com/view/incoder-code-models","descriptionType":"Abstract"},{"description":"ICLR 2023. v3: camera-ready that includes PLBART and OpenAI baselines","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi4yMjA0LjA1OTk5PC9pZGVudGlmaWVyPgogIDxhbHRlcm5hdGVJZGVudGlmaWVycz4KICAgIDxhbHRlcm5hdGVJZGVudGlmaWVyIGFsdGVybmF0ZUlkZW50aWZpZXJUeXBlPSJhclhpdiI+MjIwNC4wNTk5OTwvYWx0ZXJuYXRlSWRlbnRpZmllcj4KICA8L2FsdGVybmF0ZUlkZW50aWZpZXJzPgogIDxjcmVhdG9ycz4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5GcmllZCwgRGFuaWVsPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5EYW5pZWw8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+RnJpZWQ8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+QWdoYWphbnlhbiwgQXJtZW48L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkFybWVuPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPkFnaGFqYW55YW48L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+TGluLCBKZXNzeTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+SmVzc3k8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+TGluPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPldhbmcsIFNpZGE8L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPlNpZGE8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+V2FuZzwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5XYWxsYWNlLCBFcmljPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5FcmljPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPldhbGxhY2U8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+U2hpLCBGcmVkYTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+RnJlZGE8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+U2hpPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlpob25nLCBSdWlxaTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+UnVpcWk8L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+Wmhvbmc8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+WWloLCBXZW4tdGF1PC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5XZW4tdGF1PC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPllpaDwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5aZXR0bGVtb3llciwgTHVrZTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+THVrZTwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5aZXR0bGVtb3llcjwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5MZXdpcywgTWlrZTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+TWlrZTwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5MZXdpczwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICA8L2NyZWF0b3JzPgogIDx0aXRsZXM+CiAgICA8dGl0bGU+SW5Db2RlcjogQSBHZW5lcmF0aXZlIE1vZGVsIGZvciBDb2RlIEluZmlsbGluZyBhbmQgU3ludGhlc2lzPC90aXRsZT4KICA8L3RpdGxlcz4KICA8cHVibGlzaGVyPmFyWGl2PC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDIyPC9wdWJsaWNhdGlvblllYXI+CiAgPHN1YmplY3RzPgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJhclhpdiI+U29mdHdhcmUgRW5naW5lZXJpbmcgKGNzLlNFKTwvc3ViamVjdD4KICAgIDxzdWJqZWN0IHhtbDpsYW5nPSJlbiIgc3ViamVjdFNjaGVtZT0iYXJYaXYiPkNvbXB1dGF0aW9uIGFuZCBMYW5ndWFnZSAoY3MuQ0wpPC9zdWJqZWN0PgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJhclhpdiI+TWFjaGluZSBMZWFybmluZyAoY3MuTEcpPC9zdWJqZWN0PgogICAgPHN1YmplY3Qgc3ViamVjdFNjaGVtZT0iRmllbGRzIG9mIFNjaWVuY2UgYW5kIFRlY2hub2xvZ3kgKEZPUykiPkZPUzogQ29tcHV0ZXIgYW5kIGluZm9ybWF0aW9uIHNjaWVuY2VzPC9zdWJqZWN0PgogIDwvc3ViamVjdHM+CiAgPGRhdGVzPgogICAgPGRhdGUgZGF0ZVR5cGU9IlN1Ym1pdHRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAyMi0wNC0xMlQxNjoyNToyNlo8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iVXBkYXRlZCIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAyMi0wNC0xNFQwMDowMDowOVo8L2RhdGU+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYyIj4yMDIyLTA0LTE3VDE3OjMwOjI3WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYyIj4yMDIyLTA0LTE5VDAwOjMxOjI4WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJTdWJtaXR0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjMiPjIwMjMtMDQtMDlUMTQ6MzE6NDBaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IlVwZGF0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjMiPjIwMjMtMDQtMTFUMDA6MTQ6MzhaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IkF2YWlsYWJsZSIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAyMi0wNDwvZGF0ZT4KICA8L2RhdGVzPgogIDxyZXNvdXJjZVR5cGUgcmVzb3VyY2VUeXBlR2VuZXJhbD0iUHJlcHJpbnQiPkFydGljbGU8L3Jlc291cmNlVHlwZT4KICA8dmVyc2lvbj4zPC92ZXJzaW9uPgogIDxyaWdodHNMaXN0PgogICAgPHJpZ2h0cyByaWdodHNVUkk9Imh0dHA6Ly9jcmVhdGl2ZWNvbW1vbnMub3JnL2xpY2Vuc2VzL2J5LW5jLXNhLzQuMC8iIHJpZ2h0c0lkZW50aWZpZXJTY2hlbWU9IlNQRFgiIHJpZ2h0c0lkZW50aWZpZXI9IkNDLUJZLU5DLVNBLTQuMCI+Q3JlYXRpdmUgQ29tbW9ucyBBdHRyaWJ1dGlvbiBOb24gQ29tbWVyY2lhbCBTaGFyZSBBbGlrZSA0LjAgSW50ZXJuYXRpb25hbDwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPkNvZGUgaXMgc2VsZG9tIHdyaXR0ZW4gaW4gYSBzaW5nbGUgbGVmdC10by1yaWdodCBwYXNzIGFuZCBpcyBpbnN0ZWFkIHJlcGVhdGVkbHkgZWRpdGVkIGFuZCByZWZpbmVkLiBXZSBpbnRyb2R1Y2UgSW5Db2RlciwgYSB1bmlmaWVkIGdlbmVyYXRpdmUgbW9kZWwgdGhhdCBjYW4gcGVyZm9ybSBwcm9ncmFtIHN5bnRoZXNpcyAodmlhIGxlZnQtdG8tcmlnaHQgZ2VuZXJhdGlvbikgYXMgd2VsbCBhcyBlZGl0aW5nICh2aWEgaW5maWxsaW5nKS4gSW5Db2RlciBpcyB0cmFpbmVkIHRvIGdlbmVyYXRlIGNvZGUgZmlsZXMgZnJvbSBhIGxhcmdlIGNvcnB1cyBvZiBwZXJtaXNzaXZlbHkgbGljZW5zZWQgY29kZSwgd2hlcmUgcmVnaW9ucyBvZiBjb2RlIGhhdmUgYmVlbiByYW5kb21seSBtYXNrZWQgYW5kIG1vdmVkIHRvIHRoZSBlbmQgb2YgZWFjaCBmaWxlLCBhbGxvd2luZyBjb2RlIGluZmlsbGluZyB3aXRoIGJpZGlyZWN0aW9uYWwgY29udGV4dC4gT3VyIG1vZGVsIGlzIHRoZSBmaXJzdCBnZW5lcmF0aXZlIG1vZGVsIHRoYXQgaXMgYWJsZSB0byBkaXJlY3RseSBwZXJmb3JtIHplcm8tc2hvdCBjb2RlIGluZmlsbGluZywgd2hpY2ggd2UgZXZhbHVhdGUgb24gY2hhbGxlbmdpbmcgdGFza3Mgc3VjaCBhcyB0eXBlIGluZmVyZW5jZSwgY29tbWVudCBnZW5lcmF0aW9uLCBhbmQgdmFyaWFibGUgcmUtbmFtaW5nLiBXZSBmaW5kIHRoYXQgdGhlIGFiaWxpdHkgdG8gY29uZGl0aW9uIG9uIGJpZGlyZWN0aW9uYWwgY29udGV4dCBzdWJzdGFudGlhbGx5IGltcHJvdmVzIHBlcmZvcm1hbmNlIG9uIHRoZXNlIHRhc2tzLCB3aGlsZSBzdGlsbCBwZXJmb3JtaW5nIGNvbXBhcmFibHkgb24gc3RhbmRhcmQgcHJvZ3JhbSBzeW50aGVzaXMgYmVuY2htYXJrcyBpbiBjb21wYXJpc29uIHRvIGxlZnQtdG8tcmlnaHQgb25seSBtb2RlbHMgcHJldHJhaW5lZCBhdCBzaW1pbGFyIHNjYWxlLiBUaGUgSW5Db2RlciBtb2RlbHMgYW5kIGNvZGUgYXJlIHB1YmxpY2x5IHJlbGVhc2VkLiBodHRwczovL3NpdGVzLmdvb2dsZS5jb20vdmlldy9pbmNvZGVyLWNvZGUtbW9kZWxzPC9kZXNjcmlwdGlvbj4KICAgIDxkZXNjcmlwdGlvbiBkZXNjcmlwdGlvblR5cGU9Ik90aGVyIj5JQ0xSIDIwMjMuIHYzOiBjYW1lcmEtcmVhZHkgdGhhdCBpbmNsdWRlcyBQTEJBUlQgYW5kIE9wZW5BSSBiYXNlbGluZXM8L2Rlc2NyaXB0aW9uPgogIDwvZGVzY3JpcHRpb25zPgo8L3Jlc291cmNlPg==","url":"https://arxiv.org/abs/2204.05999","contentUrl":null,"metadataVersion":2,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-04-14T00:56:07.000Z","registered":"2022-04-14T00:56:08.000Z","published":"2022","updated":"2023-04-11T03:39:41.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.2204.05999","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}