{"data":{"id":"10.48550/arxiv.cond-mat/0108530","type":"dois","attributes":{"doi":"10.48550/arxiv.cond-mat/0108530","prefix":"10.48550","suffix":"arxiv.cond-mat/0108530","identifiers":[{"identifier":"cond-mat/0108530","identifierType":"arXiv"}],"alternateIdentifiers":[{"alternateIdentifierType":"arXiv","alternateIdentifier":"cond-mat/0108530"}],"creators":[{"name":"Benedetto, Dario","nameType":"Personal","givenName":"Dario","familyName":"Benedetto","affiliation":[],"nameIdentifiers":[]},{"name":"Caglioti, Emanuele","nameType":"Personal","givenName":"Emanuele","familyName":"Caglioti","affiliation":[],"nameIdentifiers":[]},{"name":"Loreto, Vittorio","nameType":"Personal","givenName":"Vittorio","familyName":"Loreto","affiliation":[],"nameIdentifiers":[]}],"titles":[{"title":"Language Trees and Zipping"}],"publisher":"arXiv","container":{},"publicationYear":2001,"subjects":[{"lang":"en","subject":"Statistical Mechanics (cond-mat.stat-mech)","subjectScheme":"arXiv"},{"subject":"FOS: Physical sciences","subjectScheme":"Fields of Science and Technology (FOS)"},{"subject":"FOS: Physical sciences","schemeUri":"http://www.oecd.org/science/inno/38235147.pdf","subjectScheme":"Fields of Science and Technology (FOS)"}],"contributors":[],"dates":[{"date":"2001-08-31T07:05:38Z","dateType":"Submitted","dateInformation":"v1"},{"date":"2009-11-30T19:56:13Z","dateType":"Updated","dateInformation":"v1"},{"date":"2001-12-19T12:24:55Z","dateType":"Submitted","dateInformation":"v2"},{"date":"2009-11-30T19:56:13Z","dateType":"Updated","dateInformation":"v2"},{"date":"2001-08","dateType":"Available","dateInformation":"v1"},{"date":"2001","dateType":"Issued"}],"language":null,"types":{"ris":"RPRT","bibtex":"article","citeproc":"article-journal","schemaOrg":"ScholarlyArticle","resourceType":"Article","resourceTypeGeneral":"Text"},"relatedIdentifiers":[{"relationType":"IsVersionOf","relatedIdentifier":"10.1103/physrevlett.88.048702","relatedIdentifierType":"DOI"}],"relatedItems":[],"sizes":[],"formats":[],"version":"2","rightsList":[{"rights":"Assumed arXiv.org perpetual, non-exclusive license to distribute this article for submissions made before January 2004","rightsUri":"http://arxiv.org/licenses/assumed-1991-2003/"}],"descriptions":[{"description":"In this letter we present a very general method to extract information from a generic string of characters, e.g. a text, a DNA sequence or a time series. Based on data-compression techniques, its key point is the computation of a suitable measure of the remoteness of two bodies of knowledge. We present the implementation of the method to linguistic motivated problems, featuring highly accurate results for language recognition, authorship attribution and language classification.","descriptionType":"Abstract"},{"description":"5 pages, RevTeX4, 1 eps figure. In press in Phys. Rev. Lett. (January 2002)","descriptionType":"Other"}],"geoLocations":[],"fundingReferences":[],"xml":"PD94bWwgdmVyc2lvbj0iMS4wIiBlbmNvZGluZz0idXRmLTgiPz4KPHJlc291cmNlIHhtbG5zPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCIgeG1sbnM6eHNpPSJodHRwOi8vd3d3LnczLm9yZy8yMDAxL1hNTFNjaGVtYS1pbnN0YW5jZSIgeHNpOnNjaGVtYUxvY2F0aW9uPSJodHRwOi8vZGF0YWNpdGUub3JnL3NjaGVtYS9rZXJuZWwtNCBodHRwOi8vc2NoZW1hLmRhdGFjaXRlLm9yZy9tZXRhL2tlcm5lbC00LjMvbWV0YWRhdGEueHNkIj4KICA8aWRlbnRpZmllciBpZGVudGlmaWVyVHlwZT0iRE9JIj4xMC40ODU1MC9BUlhJVi5DT05ELU1BVC8wMTA4NTMwPC9pZGVudGlmaWVyPgogIDxhbHRlcm5hdGVJZGVudGlmaWVycz4KICAgIDxhbHRlcm5hdGVJZGVudGlmaWVyIGFsdGVybmF0ZUlkZW50aWZpZXJUeXBlPSJhclhpdiI+Y29uZC1tYXQvMDEwODUzMDwvYWx0ZXJuYXRlSWRlbnRpZmllcj4KICA8L2FsdGVybmF0ZUlkZW50aWZpZXJzPgogIDxjcmVhdG9ycz4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5CZW5lZGV0dG8sIERhcmlvPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5EYXJpbzwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5CZW5lZGV0dG88L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgICA8Y3JlYXRvcj4KICAgICAgPGNyZWF0b3JOYW1lIG5hbWVUeXBlPSJQZXJzb25hbCI+Q2FnbGlvdGksIEVtYW51ZWxlPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5FbWFudWVsZTwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5DYWdsaW90aTwvZmFtaWx5TmFtZT4KICAgIDwvY3JlYXRvcj4KICAgIDxjcmVhdG9yPgogICAgICA8Y3JlYXRvck5hbWUgbmFtZVR5cGU9IlBlcnNvbmFsIj5Mb3JldG8sIFZpdHRvcmlvPC9jcmVhdG9yTmFtZT4KICAgICAgPGdpdmVuTmFtZT5WaXR0b3JpbzwvZ2l2ZW5OYW1lPgogICAgICA8ZmFtaWx5TmFtZT5Mb3JldG88L2ZhbWlseU5hbWU+CiAgICA8L2NyZWF0b3I+CiAgPC9jcmVhdG9ycz4KICA8dGl0bGVzPgogICAgPHRpdGxlPkxhbmd1YWdlIFRyZWVzIGFuZCBaaXBwaW5nPC90aXRsZT4KICA8L3RpdGxlcz4KICA8cHVibGlzaGVyPmFyWGl2PC9wdWJsaXNoZXI+CiAgPHB1YmxpY2F0aW9uWWVhcj4yMDAxPC9wdWJsaWNhdGlvblllYXI+CiAgPHN1YmplY3RzPgogICAgPHN1YmplY3QgeG1sOmxhbmc9ImVuIiBzdWJqZWN0U2NoZW1lPSJhclhpdiI+U3RhdGlzdGljYWwgTWVjaGFuaWNzIChjb25kLW1hdC5zdGF0LW1lY2gpPC9zdWJqZWN0PgogICAgPHN1YmplY3Qgc3ViamVjdFNjaGVtZT0iRmllbGRzIG9mIFNjaWVuY2UgYW5kIFRlY2hub2xvZ3kgKEZPUykiPkZPUzogUGh5c2ljYWwgc2NpZW5jZXM8L3N1YmplY3Q+CiAgPC9zdWJqZWN0cz4KICA8ZGF0ZXM+CiAgICA8ZGF0ZSBkYXRlVHlwZT0iU3VibWl0dGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDAxLTA4LTMxVDA3OjA1OjM4WjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJVcGRhdGVkIiBkYXRlSW5mb3JtYXRpb249InYxIj4yMDA5LTExLTMwVDE5OjU2OjEzWjwvZGF0ZT4KICAgIDxkYXRlIGRhdGVUeXBlPSJTdWJtaXR0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjIiPjIwMDEtMTItMTlUMTI6MjQ6NTVaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IlVwZGF0ZWQiIGRhdGVJbmZvcm1hdGlvbj0idjIiPjIwMDktMTEtMzBUMTk6NTY6MTNaPC9kYXRlPgogICAgPGRhdGUgZGF0ZVR5cGU9IkF2YWlsYWJsZSIgZGF0ZUluZm9ybWF0aW9uPSJ2MSI+MjAwMS0wODwvZGF0ZT4KICA8L2RhdGVzPgogIDxyZXNvdXJjZVR5cGUgcmVzb3VyY2VUeXBlR2VuZXJhbD0iVGV4dCI+QXJ0aWNsZTwvcmVzb3VyY2VUeXBlPgogIDxyZWxhdGVkSWRlbnRpZmllcnM+CiAgICA8cmVsYXRlZElkZW50aWZpZXIgcmVsYXRlZElkZW50aWZpZXJUeXBlPSJET0kiIHJlbGF0aW9uVHlwZT0iSXNWZXJzaW9uT2YiPjEwLjExMDMvUGh5c1JldkxldHQuODguMDQ4NzAyPC9yZWxhdGVkSWRlbnRpZmllcj4KICA8L3JlbGF0ZWRJZGVudGlmaWVycz4KICA8dmVyc2lvbj4yPC92ZXJzaW9uPgogIDxyaWdodHNMaXN0PgogICAgPHJpZ2h0cyByaWdodHNVUkk9Imh0dHA6Ly9hcnhpdi5vcmcvbGljZW5zZXMvYXNzdW1lZC0xOTkxLTIwMDMvIj5Bc3N1bWVkIGFyWGl2Lm9yZyBwZXJwZXR1YWwsIG5vbi1leGNsdXNpdmUgbGljZW5zZSB0byBkaXN0cmlidXRlIHRoaXMgYXJ0aWNsZSBmb3Igc3VibWlzc2lvbnMgbWFkZSBiZWZvcmUgSmFudWFyeSAyMDA0PC9yaWdodHM+CiAgPC9yaWdodHNMaXN0PgogIDxkZXNjcmlwdGlvbnM+CiAgICA8ZGVzY3JpcHRpb24gZGVzY3JpcHRpb25UeXBlPSJBYnN0cmFjdCI+SW4gdGhpcyBsZXR0ZXIgd2UgcHJlc2VudCBhIHZlcnkgZ2VuZXJhbCBtZXRob2QgdG8gZXh0cmFjdCBpbmZvcm1hdGlvbiBmcm9tIGEgZ2VuZXJpYyBzdHJpbmcgb2YgY2hhcmFjdGVycywgZS5nLiBhIHRleHQsIGEgRE5BIHNlcXVlbmNlIG9yIGEgdGltZSBzZXJpZXMuIEJhc2VkIG9uIGRhdGEtY29tcHJlc3Npb24gdGVjaG5pcXVlcywgaXRzIGtleSBwb2ludCBpcyB0aGUgY29tcHV0YXRpb24gb2YgYSBzdWl0YWJsZSBtZWFzdXJlIG9mIHRoZSByZW1vdGVuZXNzIG9mIHR3byBib2RpZXMgb2Yga25vd2xlZGdlLiBXZSBwcmVzZW50IHRoZSBpbXBsZW1lbnRhdGlvbiBvZiB0aGUgbWV0aG9kIHRvIGxpbmd1aXN0aWMgbW90aXZhdGVkIHByb2JsZW1zLCBmZWF0dXJpbmcgaGlnaGx5IGFjY3VyYXRlIHJlc3VsdHMgZm9yIGxhbmd1YWdlIHJlY29nbml0aW9uLCBhdXRob3JzaGlwIGF0dHJpYnV0aW9uIGFuZCBsYW5ndWFnZSBjbGFzc2lmaWNhdGlvbi48L2Rlc2NyaXB0aW9uPgogICAgPGRlc2NyaXB0aW9uIGRlc2NyaXB0aW9uVHlwZT0iT3RoZXIiPjUgcGFnZXMsIFJldlRlWDQsIDEgZXBzIGZpZ3VyZS4gSW4gcHJlc3MgaW4gUGh5cy4gUmV2LiBMZXR0LiAoSmFudWFyeSAyMDAyKTwvZGVzY3JpcHRpb24+CiAgPC9kZXNjcmlwdGlvbnM+CjwvcmVzb3VyY2U+","url":"https://arxiv.org/abs/cond-mat/0108530","contentUrl":null,"metadataVersion":0,"schemaVersion":"http://datacite.org/schema/kernel-4","source":"mds","isActive":true,"state":"findable","reason":null,"viewCount":0,"viewsOverTime":[],"downloadCount":0,"downloadsOverTime":[],"referenceCount":0,"citationCount":0,"citationsOverTime":[],"partCount":0,"partOfCount":0,"versionCount":0,"versionOfCount":0,"created":"2022-03-19T06:19:47.000Z","registered":"2022-03-19T06:19:48.000Z","published":"2001","updated":"2022-03-19T06:19:48.000Z"},"relationships":{"client":{"data":{"id":"arxiv.content","type":"clients"}},"provider":{"data":{"id":"arxiv","type":"providers"}},"media":{"data":{"id":"10.48550/arxiv.cond-mat/0108530","type":"media"}},"references":{"data":[]},"citations":{"data":[]},"parts":{"data":[]},"partOf":{"data":[]},"versions":{"data":[]},"versionOf":{"data":[]}}}}