{"data":{"id":"10.48550/arxiv.1410.4803","type":"dois","attributes":{"doi":"10.48550/arxiv.1410.4803","prefix":"10.48550","suffix":"arxiv.1410.4803","identifiers":[{"identifier":"1410.4803","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"1410.4803"}],"creators":[{"name":"Chang, Christopher C.","nameType":"Personal","givenName":"Christopher C.","familyName":"Chang","affiliation":[],"nameIdentifiers":[]},{"name":"Chow, Carson C.","nameType":"Personal","givenName":"Carson C.","familyName":"Chow","affiliation":[],"nameIdentifiers":[]},{"name":"Tellier, Laurent C. A. M.","nameType":"Personal","givenName":"Laurent C. A. M.","familyName":"Tellier","affiliation":[],"nameIdentifiers":[]},{"name":"Vattikuti, Shashaank","nameType":"Personal","givenName":"Shashaank","familyName":"Vattikuti","affiliation":[],"nameIdentifiers":[]},{"name":"Purcell, Shaun M.","nameType":"Personal","givenName":"Shaun M.","familyName":"Purcell","affiliation":[],"nameIdentifiers":[]},{"name":"Lee, James J.","nameType":"Personal","givenName":"James J.","familyName":"Lee","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"Second-generation PLINK: rising to the challenge of larger and richer datasets"}],"publisher":"arXiv","container":{},"publicationYear":2014,"subjects":[{"lang":"en","subject":"Genomics (q-bio.GN)","subjectScheme":"arXiv"},{"lang":"en","subject":"Computation (stat.CO)","subjectScheme":"arXiv"},{"subject":"FOS: Biological sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Biological sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"},{"lang":"en","subject":"G.3; G.4; J.3","subjectScheme":"ACM"},{"lang":"en","subject":"62-04","subjectScheme":"MSC"}],"contributors":[],"dates":[{"date":"2014-10-17T17:37:02Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2015-03-03T01:06:41Z","dateType":"Updated","dateInformation":"v1"},{"date":"2014-10","dateType":"Available","dateInformation":"v1"},{"date":"2014","dateType":"Issued"}],"language":null,"types":{"ris":"RPRT","bibtex":"article","citeproc":"article-journal","schemaOrg":"ScholarlyArticle","resourceType":"Article","resourceTypeGeneral":"Text"},"relatedIdentifiers":[{"relationType":"IsVersionOf","relatedIdentifier":"10.1186/s13742-015-0047-8","relatedIdentifierType":"DOI"}],"relatedItems":[],"sizes":[],"formats":[],"version":"1","rightsList":[{"rights":"arXiv.org perpetual, non-exclusive license","rightsUri":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/"}],"descriptions":[{"description":"PLINK 1 is a widely used open-source C/C++ toolset for genome-wide association studies (GWAS) and research in population genetics. However, the steady accumulation of data from imputation and whole-genome sequencing studies has exposed a strong need for even faster and more scalable implementations of key functions. In addition, GWAS and population-genetic data now frequently contain probabilistic calls, phase information, and/or multiallelic variants, none of which can be represented by PLINK 1's primary data format. To address these issues, we are developing a second-generation codebase for PLINK. The first major release from this codebase, PLINK 1.9, introduces extensive use of bit-level parallelism, O(sqrt(n))-time/constant-space Hardy-Weinberg equilibrium and Fisher's exact tests, and many other algorithmic improvements. In combination, these changes accelerate most operations by 1-4 orders of magnitude, and allow the program to handle datasets too large to fit in RAM. This will be followed by PLINK 2.0, which will introduce (a) a new data format capable of efficiently representing probabilities, phase, and multiallelic variants, and (b) extensions of many functions to account for the new types of information. The second-generation versions of PLINK will offer dramatic improvements in performance and compatibility. For the first time, users without access to high-end computing resources can perform several essential analyses of the feature-rich and very large genetic datasets coming into use.","descriptionType":"Abstract"},{"description":"2 figures, 1 additional file","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi4xNDEwLjQ4MDM8L2lkZW50aWZpZXI+CiAgPGFsdGVybmF0ZUlkZW50aWZpZXJzPgogICAgPGFsdGVybmF0ZUlkZW50aWZpZXIgYWx0ZXJuYXRlSWRlbnRpZmllclR5cGU9ImFyWGl2Ij4xNDEwLjQ4MDM8L2FsdGVybmF0ZUlkZW50aWZpZXI+CiAgPC9hbHRlcm5hdGVJZGVudGlmaWVycz4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+Q2hhbmcsIENocmlzdG9waGVyIEMuPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5DaHJpc3RvcGhlciBDLjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5DaGFuZzwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5DaG93LCBDYXJzb24gQy48L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkNhcnNvbiBDLjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5DaG93PC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPlRlbGxpZXIsIExhdXJlbnQgQy4gQS4gTS48L2NyZWF0b3JOYW1lPgogICAgICA8Z2l2ZW5OYW1lPkxhdXJlbnQgQy4gQS4gTS48L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+VGVsbGllcjwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5WYXR0aWt1dGksIFNoYXNoYWFuazwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+U2hhc2hhYW5rPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPlZhdHRpa3V0aTwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5QdXJjZWxsLCBTaGF1biBNLjwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+U2hhdW4gTS48L2dpdmVuTmFtZT4KICAgICAgPGZhbWlseU5hbWU+UHVyY2VsbDwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5MZWUsIEphbWVzIEouPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5KYW1lcyBKLjwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5MZWU8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgPC9jcmVhdG9ycz4KICA8dGl0bGVzPgogICAgPHRpdGxlPlNlY29uZC1nZW5lcmF0aW9uIFBMSU5LOiByaXNpbmcgdG8gdGhlIGNoYWxsZW5nZSBvZiBsYXJnZXIgYW5kIHJpY2hlciBkYXRhc2V0czwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5hclhpdjwvcHVibGlzaGVyPgogIDxwdWJsaWNhdGlvblllYXI+MjAxNDwvcHVibGljYXRpb25ZZWFyPgogIDxzdWJqZWN0cz4KICAgIDxzdWJqZWN0IHhtbDpsYW5nPSJlbiIgc3ViamVjdFNjaGVtZT0iYXJYaXYiPkdlbm9taWNzIChxLWJpby5HTik8L3N1YmplY3Q+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9ImFyWGl2Ij5Db21wdXRhdGlvbiAoc3RhdC5DTyk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCBzdWJqZWN0U2NoZW1lPSJGaWVsZHMgb2YgU2NpZW5jZSBhbmQgVGVjaG5vbG9neSAoRk9TKSI+Rk9TOiBCaW9sb2dpY2FsIHNjaWVuY2VzPC9zdWJqZWN0PgogICAgPHN1YmplY3Qgc3ViamVjdFNjaGVtZT0iRmllbGRzIG9mIFNjaWVuY2UgYW5kIFRlY2hub2xvZ3kgKEZPUykiPkZPUzogQ29tcHV0ZXIgYW5kIGluZm9ybWF0aW9uIHNjaWVuY2VzPC9zdWJqZWN0PgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJBQ00iPkcuMzsgRy40OyBKLjM8L3N1YmplY3Q+CiAgICA8c3ViamVjdCB4bWw6bGFuZz0iZW4iIHN1YmplY3RTY2hlbWU9Ik1TQyI+NjItMDQ8L3N1YmplY3Q+CiAgPC9zdWJqZWN0cz4KICA8ZGF0ZXM+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDE0LTEwLTE3VDE3OjM3OjAyWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDE1LTAzLTAzVDAxOjA2OjQxWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJBdmFpbGFibGUiIGRhdGVJbmZvcm1hdGlvbj0idjEiPjIwMTQtMTA8L2RhdGU+CiAgPC9kYXRlcz4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IlRleHQiPkFydGljbGU8L3Jlc291cmNlVHlwZT4KICA8cmVsYXRlZElkZW50aWZpZXJzPgogICAgPHJlbGF0ZWRJZGVudGlmaWVyIHJlbGF0ZWRJZGVudGlmaWVyVHlwZT0iRE9JIiByZWxhdGlvblR5cGU9IklzVmVyc2lvbk9mIj4xMC4xMTg2L3MxMzc0Mi0wMTUtMDA0Ny04PC9yZWxhdGVkSWRlbnRpZmllcj4KICA8L3JlbGF0ZWRJZGVudGlmaWVycz4KICA8dmVyc2lvbj4xPC92ZXJzaW9uPgogIDxyaWdodHNMaXN0PgogICAgPHJpZ2h0cyByaWdodHNVUkk9Imh0dHA6Ly9hcnhpdi5vcmcvbGljZW5zZXMvbm9uZXhjbHVzaXZlLWRpc3RyaWIvMS4wLyI+YXJYaXYub3JnIHBlcnBldHVhbCwgbm9uLWV4Y2x1c2l2ZSBsaWNlbnNlPC9yaWdodHM+CiAgPC9yaWdodHNMaXN0PgogIDxkZXNjcmlwdGlvbnM+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJBYnN0cmFjdCI+UExJTksgMSBpcyBhIHdpZGVseSB1c2VkIG9wZW4tc291cmNlIEMvQysrIHRvb2xzZXQgZm9yIGdlbm9tZS13aWRlIGFzc29jaWF0aW9uIHN0dWRpZXMgKEdXQVMpIGFuZCByZXNlYXJjaCBpbiBwb3B1bGF0aW9uIGdlbmV0aWNzLiBIb3dldmVyLCB0aGUgc3RlYWR5IGFjY3VtdWxhdGlvbiBvZiBkYXRhIGZyb20gaW1wdXRhdGlvbiBhbmQgd2hvbGUtZ2Vub21lIHNlcXVlbmNpbmcgc3R1ZGllcyBoYXMgZXhwb3NlZCBhIHN0cm9uZyBuZWVkIGZvciBldmVuIGZhc3RlciBhbmQgbW9yZSBzY2FsYWJsZSBpbXBsZW1lbnRhdGlvbnMgb2Yga2V5IGZ1bmN0aW9ucy4gSW4gYWRkaXRpb24sIEdXQVMgYW5kIHBvcHVsYXRpb24tZ2VuZXRpYyBkYXRhIG5vdyBmcmVxdWVudGx5IGNvbnRhaW4gcHJvYmFiaWxpc3RpYyBjYWxscywgcGhhc2UgaW5mb3JtYXRpb24sIGFuZC9vciBtdWx0aWFsbGVsaWMgdmFyaWFudHMsIG5vbmUgb2Ygd2hpY2ggY2FuIGJlIHJlcHJlc2VudGVkIGJ5IFBMSU5LIDEncyBwcmltYXJ5IGRhdGEgZm9ybWF0LgogIFRvIGFkZHJlc3MgdGhlc2UgaXNzdWVzLCB3ZSBhcmUgZGV2ZWxvcGluZyBhIHNlY29uZC1nZW5lcmF0aW9uIGNvZGViYXNlIGZvciBQTElOSy4gVGhlIGZpcnN0IG1ham9yIHJlbGVhc2UgZnJvbSB0aGlzIGNvZGViYXNlLCBQTElOSyAxLjksIGludHJvZHVjZXMgZXh0ZW5zaXZlIHVzZSBvZiBiaXQtbGV2ZWwgcGFyYWxsZWxpc20sIE8oc3FydChuKSktdGltZS9jb25zdGFudC1zcGFjZSBIYXJkeS1XZWluYmVyZyBlcXVpbGlicml1bSBhbmQgRmlzaGVyJ3MgZXhhY3QgdGVzdHMsIGFuZCBtYW55IG90aGVyIGFsZ29yaXRobWljIGltcHJvdmVtZW50cy4gSW4gY29tYmluYXRpb24sIHRoZXNlIGNoYW5nZXMgYWNjZWxlcmF0ZSBtb3N0IG9wZXJhdGlvbnMgYnkgMS00IG9yZGVycyBvZiBtYWduaXR1ZGUsIGFuZCBhbGxvdyB0aGUgcHJvZ3JhbSB0byBoYW5kbGUgZGF0YXNldHMgdG9vIGxhcmdlIHRvIGZpdCBpbiBSQU0uIFRoaXMgd2lsbCBiZSBmb2xsb3dlZCBieSBQTElOSyAyLjAsIHdoaWNoIHdpbGwgaW50cm9kdWNlIChhKSBhIG5ldyBkYXRhIGZvcm1hdCBjYXBhYmxlIG9mIGVmZmljaWVudGx5IHJlcHJlc2VudGluZyBwcm9iYWJpbGl0aWVzLCBwaGFzZSwgYW5kIG11bHRpYWxsZWxpYyB2YXJpYW50cywgYW5kIChiKSBleHRlbnNpb25zIG9mIG1hbnkgZnVuY3Rpb25zIHRvIGFjY291bnQgZm9yIHRoZSBuZXcgdHlwZXMgb2YgaW5mb3JtYXRpb24uCiAgVGhlIHNlY29uZC1nZW5lcmF0aW9uIHZlcnNpb25zIG9mIFBMSU5LIHdpbGwgb2ZmZXIgZHJhbWF0aWMgaW1wcm92ZW1lbnRzIGluIHBlcmZvcm1hbmNlIGFuZCBjb21wYXRpYmlsaXR5LiBGb3IgdGhlIGZpcnN0IHRpbWUsIHVzZXJzIHdpdGhvdXQgYWNjZXNzIHRvIGhpZ2gtZW5kIGNvbXB1dGluZyByZXNvdXJjZXMgY2FuIHBlcmZvcm0gc2V2ZXJhbCBlc3NlbnRpYWwgYW5hbHlzZXMgb2YgdGhlIGZlYXR1cmUtcmljaCBhbmQgdmVyeSBsYXJnZSBnZW5ldGljIGRhdGFzZXRzIGNvbWluZyBpbnRvIHVzZS48L2Rlc2NyaXB0aW9uPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iT3RoZXIiPjIgZmlndXJlcywgMSBhZGRpdGlvbmFsIGZpbGU8L2Rlc2NyaXB0aW9uPgogIDwvZGVzY3JpcHRpb25zPgo8L3Jlc291cmNlPg==","url":"https://arxiv.org/abs/1410.4803","contentUrl":null,"metadataVersion":0,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-03-09T17:25:25.000Z","registered":"2022-03-09T17:25:26.000Z","published":"2014","updated":"2022-03-09T17:25:26.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.1410.4803","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}