{"data":{"id":"10.48550/arxiv.0709.1640","type":"dois","attributes":{"doi":"10.48550/arxiv.0709.1640","prefix":"10.48550","suffix":"arxiv.0709.1640","identifiers":[{"identifier":"0709.1640","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"0709.1640"}],"creators":[{"name":"Ssali, George","nameType":"Personal","givenName":"George","familyName":"Ssali","affiliation":[],"nameIdentifiers":[]},{"name":"Marwala, Tshilidzi","nameType":"Personal","givenName":"Tshilidzi","familyName":"Marwala","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"Estimation of Missing Data Using Computational Intelligence and Decision Trees"}],"publisher":"arXiv","container":{},"publicationYear":2007,"subjects":[{"lang":"en","subject":"Applications (stat.AP)","subjectScheme":"arXiv"},{"subject":"FOS: Computer and information sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Computer and information sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"}],"contributors":[],"dates":[{"date":"2007-09-11T14:48:19Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2009-12-01T09:44:11Z","dateType":"Updated","dateInformation":"v1"},{"date":"2007-09","dateType":"Available","dateInformation":"v1"},{"date":"2007","dateType":"Issued"}],"language":null,"types":{"ris":"GEN","bibtex":"misc","citeproc":"article","schemaOrg":"CreativeWork","resourceType":"Article","resourceTypeGeneral":"Preprint"},"relatedIdentifiers":[],"relatedItems":[],"sizes":[],"formats":[],"version":"1","rightsList":[{"rights":"Assumed arXiv.org perpetual, non-exclusive license to distribute this article for submissions made before January 2004","rightsUri":"http://arxiv.org/licenses/assumed-1991-2003/"}],"descriptions":[{"description":"This paper introduces a novel paradigm to impute missing data that combines a decision tree with an auto-associative neural network (AANN) based model and a principal component analysis-neural network (PCA-NN) based model. For each model, the decision tree is used to predict search bounds for a genetic algorithm that minimize an error function derived from the respective model. The models' ability to impute missing data is tested and compared using HIV sero-prevalance data. Results indicate an average increase in accuracy of 13% with the AANN based model's average accuracy increasing from 75.8% to 86.3% while that of the PCA-NN based model increasing from 66.1% to 81.6%.","descriptionType":"Abstract"},{"description":"14 pages","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi4wNzA5LjE2NDA8L2lkZW50aWZpZXI+CiAgPGFsdGVybmF0ZUlkZW50aWZpZXJzPgogICAgPGFsdGVybmF0ZUlkZW50aWZpZXIgYWx0ZXJuYXRlSWRlbnRpZmllclR5cGU9ImFyWGl2Ij4wNzA5LjE2NDA8L2FsdGVybmF0ZUlkZW50aWZpZXI+CiAgPC9hbHRlcm5hdGVJZGVudGlmaWVycz4KICA8Y3JlYXRvcnM+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+U3NhbGksIEdlb3JnZTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+R2VvcmdlPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPlNzYWxpPC9mYW1pbHlOYW1lPgogICAgPC9jcmVhdG9yPgogICAgPGNyZWF0b3I+CiAgICAgIDxjcmVhdG9yTmFtZSBuYW1lVHlwZT0iUGVyc29uYWwiPk1hcndhbGEsIFRzaGlsaWR6aTwvY3JlYXRvck5hbWU+CiAgICAgIDxnaXZlbk5hbWU+VHNoaWxpZHppPC9naXZlbk5hbWU+CiAgICAgIDxmYW1pbHlOYW1lPk1hcndhbGE8L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgPC9jcmVhdG9ycz4KICA8dGl0bGVzPgogICAgPHRpdGxlPkVzdGltYXRpb24gb2YgTWlzc2luZyBEYXRhIFVzaW5nIENvbXB1dGF0aW9uYWwgSW50ZWxsaWdlbmNlIGFuZCBEZWNpc2lvbiBUcmVlczwvdGl0bGU+CiAgPC90aXRsZXM+CiAgPHB1Ymxpc2hlcj5hclhpdjwvcHVibGlzaGVyPgogIDxwdWJsaWNhdGlvblllYXI+MjAwNzwvcHVibGljYXRpb25ZZWFyPgogIDxzdWJqZWN0cz4KICAgIDxzdWJqZWN0IHhtbDpsYW5nPSJlbiIgc3ViamVjdFNjaGVtZT0iYXJYaXYiPkFwcGxpY2F0aW9ucyAoc3RhdC5BUCk8L3N1YmplY3Q+CiAgICA8c3ViamVjdCBzdWJqZWN0U2NoZW1lPSJGaWVsZHMgb2YgU2NpZW5jZSBhbmQgVGVjaG5vbG9neSAoRk9TKSI+Rk9TOiBDb21wdXRlciBhbmQgaW5mb3JtYXRpb24gc2NpZW5jZXM8L3N1YmplY3Q+CiAgPC9zdWJqZWN0cz4KICA8ZGF0ZXM+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDA3LTA5LTExVDE0OjQ4OjE5WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDA5LTEyLTAxVDA5OjQ0OjExWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJBdmFpbGFibGUiIGRhdGVJbmZvcm1hdGlvbj0idjEiPjIwMDctMDk8L2RhdGU+CiAgPC9kYXRlcz4KICA8cmVzb3VyY2VUeXBlIHJlc291cmNlVHlwZUdlbmVyYWw9IlByZXByaW50Ij5BcnRpY2xlPC9yZXNvdXJjZVR5cGU+CiAgPHZlcnNpb24+MTwvdmVyc2lvbj4KICA8cmlnaHRzTGlzdD4KICAgIDxyaWdodHMgcmlnaHRzVVJJPSJodHRwOi8vYXJ4aXYub3JnL2xpY2Vuc2VzL2Fzc3VtZWQtMTk5MS0yMDAzLyI+QXNzdW1lZCBhclhpdi5vcmcgcGVycGV0dWFsLCBub24tZXhjbHVzaXZlIGxpY2Vuc2UgdG8gZGlzdHJpYnV0ZSB0aGlzIGFydGljbGUgZm9yIHN1Ym1pc3Npb25zIG1hZGUgYmVmb3JlIEphbnVhcnkgMjAwNDwvcmlnaHRzPgogIDwvcmlnaHRzTGlzdD4KICA8ZGVzY3JpcHRpb25zPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iQWJzdHJhY3QiPlRoaXMgcGFwZXIgaW50cm9kdWNlcyBhIG5vdmVsIHBhcmFkaWdtIHRvIGltcHV0ZSBtaXNzaW5nIGRhdGEgdGhhdCBjb21iaW5lcyBhIGRlY2lzaW9uIHRyZWUgd2l0aCBhbiBhdXRvLWFzc29jaWF0aXZlIG5ldXJhbCBuZXR3b3JrIChBQU5OKSBiYXNlZCBtb2RlbCBhbmQgYSBwcmluY2lwYWwgY29tcG9uZW50IGFuYWx5c2lzLW5ldXJhbCBuZXR3b3JrIChQQ0EtTk4pIGJhc2VkIG1vZGVsLiBGb3IgZWFjaCBtb2RlbCwgdGhlIGRlY2lzaW9uIHRyZWUgaXMgdXNlZCB0byBwcmVkaWN0IHNlYXJjaCBib3VuZHMgZm9yIGEgZ2VuZXRpYyBhbGdvcml0aG0gdGhhdCBtaW5pbWl6ZSBhbiBlcnJvciBmdW5jdGlvbiBkZXJpdmVkIGZyb20gdGhlIHJlc3BlY3RpdmUgbW9kZWwuIFRoZSBtb2RlbHMnIGFiaWxpdHkgdG8gaW1wdXRlIG1pc3NpbmcgZGF0YSBpcyB0ZXN0ZWQgYW5kIGNvbXBhcmVkIHVzaW5nIEhJViBzZXJvLXByZXZhbGFuY2UgZGF0YS4gUmVzdWx0cyBpbmRpY2F0ZSBhbiBhdmVyYWdlIGluY3JlYXNlIGluIGFjY3VyYWN5IG9mIDEzJSB3aXRoIHRoZSBBQU5OIGJhc2VkIG1vZGVsJ3MgYXZlcmFnZSBhY2N1cmFjeSBpbmNyZWFzaW5nIGZyb20gNzUuOCUgdG8gODYuMyUgd2hpbGUgdGhhdCBvZiB0aGUgUENBLU5OIGJhc2VkIG1vZGVsIGluY3JlYXNpbmcgZnJvbSA2Ni4xJSB0byA4MS42JS48L2Rlc2NyaXB0aW9uPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iT3RoZXIiPjE0IHBhZ2VzPC9kZXNjcmlwdGlvbj4KICA8L2Rlc2NyaXB0aW9ucz4KPC9yZXNvdXJjZT4=","url":"https://arxiv.org/abs/0709.1640","contentUrl":null,"metadataVersion":0,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-03-16T03:08:10.000Z","registered":"2022-03-16T03:08:11.000Z","published":"2007","updated":"2022-03-16T03:08:11.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.0709.1640","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}