<rdf:RDF xmlns:community="http://www.bibsonomy.org/ontologies/2008/05/community#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:admin="http://webns.net/mvcb/" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:cc="http://web.resource.org/cc/" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:swrc="http://swrc.ontoware.org/ontology#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns="http://purl.org/rss/1.0/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xml:base="http://www.bibsonomy.org/author/Cilibrasi"><owl:Ontology rdf:about=""><rdfs:comment>BibSonomy publications for /author/Cilibrasi</rdfs:comment><owl:imports rdf:resource="http://swrc.ontoware.org/ontology/portal"/></owl:Ontology><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/226f35d6a29010583da2a68eedaaf690e/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/226f35d6a29010583da2a68eedaaf690e/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0312.html#cs-CV-0312044"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Clustering by compression</swrc:title><swrc:volume>cs.CV/0312044</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs.CV/0312044" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/24ee6e45b8093dd9b85f4a7a7283c4073/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/24ee6e45b8093dd9b85f4a7a7283c4073/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0612.html#abs-cs-0612043"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>About the Lifespan of Peer to Peer Networks</swrc:title><swrc:volume>abs/cs/0612043</swrc:volume><swrc:year>2006</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs/0612043" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Zvi Lotker"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Alfredo Navarra"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Stéphane Pérennes"/></rdf:_4><rdf:_5><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_5></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2104bb0bb1c60788ad33a2dcbb667a9c0/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2104bb0bb1c60788ad33a2dcbb667a9c0/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0412.html#abs-cs-0412098"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>The Google Similarity Distance</swrc:title><swrc:volume>abs/cs/0412098</swrc:volume><swrc:year>2004</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs/0412098" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2980e695898971b62190c24968d6dc4ba/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2980e695898971b62190c24968d6dc4ba/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0303.html#cs-SD-0303025"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Algorithmic Clustering of Music</swrc:title><swrc:volume>cs.SD/0303025</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs.SD/0303025" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Ronald de Wolf"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2843814ffb84515f3d8473d783fd92bc0/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2843814ffb84515f3d8473d783fd92bc0/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0602.html#abs-cs-0602065"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Similarity of Objects and the Meaning of Words</swrc:title><swrc:volume>abs/cs/0602065</swrc:volume><swrc:year>2006</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs/0602065" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2437af6bd0bd018d8ca52d51ecc169d40/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2437af6bd0bd018d8ca52d51ecc169d40/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0905.html#abs-0905-4039"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Normalized Web Distance and Word Similarity</swrc:title><swrc:volume>abs/0905.4039</swrc:volume><swrc:year>2009</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/0905.4039" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/24097e4eb25f3f99979360e6e13c40256/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/24097e4eb25f3f99979360e6e13c40256/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0606.html#abs-cs-0606048"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>A New Quartet Tree Heuristic for Hierarchical Clustering</swrc:title><swrc:volume>abs/cs/0606048</swrc:volume><swrc:year>2006</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs/0606048" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2f83e6f389f2afe8bb829abf62db308f0/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2f83e6f389f2afe8bb829abf62db308f0/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0502.html#abs-cs-0502068"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Limits of Rush Hour Logic Complexity</swrc:title><swrc:volume>abs/cs/0502068</swrc:volume><swrc:year>2005</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs/0502068" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="John Tromp"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2d9a48907c77e47a0097dfe2a6160e82c/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2d9a48907c77e47a0097dfe2a6160e82c/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/corr/corr0809.html#abs-0809-2553"/><swrc:date>Mon Dec 05 00:00:00 CET 2011</swrc:date><swrc:journal>CoRR</swrc:journal><swrc:title>Normalized Information Distance</swrc:title><swrc:volume>abs/0809.2553</swrc:volume><swrc:year>2008</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/0809.2553" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Frank J. Balbach"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Ming Li"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/250308d5168f519ce89a71fa67574ac25/gromgull"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/250308d5168f519ce89a71fa67574ac25/gromgull"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://homepages.cwi.nl/~paulv/papers/amdug.pdf"/><swrc:date>Wed Nov 23 16:24:13 CET 2011</swrc:date><swrc:month>15 March</swrc:month><swrc:note>v2</swrc:note><swrc:number>cs.CL/0412098</swrc:number><swrc:pages>370-383</swrc:pages><swrc:title>Automatic Meaning Discovery Using Google</swrc:title><swrc:year>2004</swrc:year><swrc:keywords>distance-measure google machine-learning </swrc:keywords><swrc:abstract>We have found a method to automatically extract the
                 meaning of words and phrases from the world-wide-web
                 using Google page counts. The approach is novel in its
                 unrestricted problem domain, simplicity of
                 implementation, and manifestly ontological
                 underpinnings. The world-wide-web is the largest
                 database on earth, and the latent semantic context
                 information entered by millions of independent users
                 averages out to provide automatic meaning of useful
                 quality. We demonstrate positive correlations,
                 evidencing an underlying semantic structure, in both
                 numerical symbol notations and number-name words in a
                 variety of natural languages and contexts. Next, we
                 demonstrate the ability to distinguish between colours
                 and numbers, and to distinguish between 17th century
                 Dutch painters; the ability to understand electrical
                 terms, religious terms, and emergency incidents; we
                 conduct a massive experiment in understanding WordNet
                 categories; and finally we demonstrate the ability to
                 do a simple automatic English-Spanish translation.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="ACM-class: I.2.4; I.2.7

                 Date (v1): Tue, 21 Dec 2004 16:05:36 GMT (127kb,S) Date
                 (revised v2): Tue, 15 Mar 2005 16:53:43 GMT
                 (58kb)

                 cited by \cite{graham-rowe:2005:complearn}

                 Code http://www.complearn.org/" swrc:key="notes"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="31 pages" swrc:key="size"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2aadd39f3c0413848cbc72092e9ac4fb1/wyswilson"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2aadd39f3c0413848cbc72092e9ac4fb1/wyswilson"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Misc"/><swrc:date>Thu Apr 14 07:06:28 CEST 2011</swrc:date><swrc:address> Seattle, USA</swrc:address><swrc:booktitle> Proceedings of the IEEE International Symposium on Information Theory</swrc:booktitle><swrc:title> Automatic Extraction of Meaning from the Web</swrc:title><swrc:year> 2006</swrc:year><swrc:keywords>imported </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="P. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2cb260a59280a6312cdd532222ec10930/wyswilson"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2cb260a59280a6312cdd532222ec10930/wyswilson"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="/brokenurl# http://publication.wilsonwong.me"/><swrc:date>Thu Apr 14 07:06:28 CEST 2011</swrc:date><swrc:journal> IEEE Transactions on Knowledge and Data Engineering</swrc:journal><swrc:number> 3</swrc:number><swrc:pages> 370-383</swrc:pages><swrc:title> The Google Similarity Distance</swrc:title><swrc:volume> 19</swrc:volume><swrc:year> 2007</swrc:year><swrc:keywords>imported </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="P. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2d7887bf271cc02fda6713e9d64c7f0bf/wyswilson"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2d7887bf271cc02fda6713e9d64c7f0bf/wyswilson"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InCollection"/><owl:sameAs rdf:resource="/brokenurl# http://publication.wilsonwong.me"/><swrc:date>Thu Apr 14 07:06:28 CEST 2011</swrc:date><swrc:booktitle> Information Theory and Statistical Learning</swrc:booktitle><swrc:publisher><swrc:Organization swrc:name=" New-York: Springer"/></swrc:publisher><swrc:title> Normalized Information Distance</swrc:title><swrc:year> 2009</swrc:year><swrc:keywords>imported </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="P. Vitanyi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="F. Balbach"/></rdf:_2><rdf:_3><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_3><rdf:_4><swrc:Person swrc:name="M. Li"/></rdf:_4></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="F. Emmert-Streib"/></rdf:_1><rdf:_2><swrc:Person swrc:name="M. Dehmer"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2e2ae8887137141b9d5f895b5333cf226/lina.wolf"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2e2ae8887137141b9d5f895b5333cf226/lina.wolf"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Tue Mar 08 08:43:28 CET 2011</swrc:date><swrc:title>The Google Similarity Distance</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>google similarity </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi L. Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M.B. Vitáni"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/200ba496f53767b92d5965db71eeea8bf/dbenz"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/200ba496f53767b92d5965db71eeea8bf/dbenz"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://www.citebase.org/abstract?id=oai:arXiv.org:cs/0412098"/><swrc:date>Fri Jan 28 11:34:03 CET 2011</swrc:date><swrc:journal>IEEE Transactions on Knowledge and Data Engineering</swrc:journal><swrc:pages>370</swrc:pages><swrc:title>The Google Similarity Distance</swrc:title><swrc:volume>19</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>google relatedness_measures web_based imported </swrc:keywords><swrc:abstract> Words and phrases acquire meaning from the way they are used in society, from their relative semantics to other words and phrases. For computers the equivalent of `society&#039; is `database,&#039; and the equivalent of `use&#039; is `way to search the database.&#039; We present a new theory of similarity between words and phrases based on information distance and Kolmogorov complexity. To fix thoughts we use the world-wide-web as database, and Google as search engine. The method is also applicable to other search engines and databases. This theory is then applied to construct a method to automatically extract similarity, the Google similarity distance, of words and phrases from the world-wide-web using Google page counts. The world-wide-web is the largest database on earth, and the context information entered by millions of independent users averages out to provide automatic semantics of useful quality. We give applications in hierarchical clustering, classification, and language translation. We give examples to distinguish between colors and numbers, cluster names of paintings by 17th century Dutch masters and names of books by English novelists, the ability to understand emergencies, and primes, and we demonstrate the ability to do a simple automatic English-Spanish translation. Finally, we use the WordNet database as an objective baseline against which to judge the performance of our method. We conduct a massive randomized trial in binary classification using support vector machines to learn categories based on our Google distance, resulting in an a mean agreement of 87% with the expert crafted WordNet categories.</swrc:abstract><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/25156d51daa332b82b27cc4665dbff1f5/dbenz"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/25156d51daa332b82b27cc4665dbff1f5/dbenz"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><swrc:date>Fri Jan 28 11:32:21 CET 2011</swrc:date><swrc:journal>IEEE Transactions on Information Theory</swrc:journal><swrc:month>April</swrc:month><swrc:number>4</swrc:number><swrc:pages> 1523-1545</swrc:pages><swrc:title>Clustering by compression</swrc:title><swrc:volume>51</swrc:volume><swrc:year>2005</swrc:year><swrc:keywords>toread compression clustering </swrc:keywords><swrc:abstract> We present a new method for clustering based on compression. The method does not use subject-specific features or background knowledge, and works as follows: First, we determine a parameter-free, universal, similarity distance, the normalized compression distance or NCD, computed from the lengths of compressed data files (singly and in pairwise concatenation). Second, we apply a hierarchical clustering method. The NCD is not restricted to a specific application area, and works across application area boundaries. A theoretical precursor, the normalized information distance, co-developed by one of the authors, is provably optimal. However, the optimality comes at the price of using the noncomputable notion of Kolmogorov complexity. We propose axioms to capture the real-world setting, and show that the NCD approximates optimality. To extract a hierarchy of clusters from the distance matrix, we determine a dendrogram (ternary tree) by a new quartet method and a fast heuristic to implement it. The method is implemented and available as public software, and is robust under choice of different compressors. To substantiate our claims of universality and robustness, we report evidence of successful application in areas as diverse as genomics, virology, languages, literature, music, handwritten digits, astronomy, and combinations of objects from completely different domains, using statistical, dictionary, and block sorting compressors. In genomics, we presented new evidence for major questions in Mammalian evolution, based on whole-mitochondrial genomic analysis: the Eutherian orders and the Marsupionta hypothesis against the Theria hypothesis.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="0018-9448" swrc:key="issn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="10.1109/TIT.2005.844059" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="P.M.B. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/24e823daa890d0bafff91045fd4bedb0b/mortimer_m8"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/24e823daa890d0bafff91045fd4bedb0b/mortimer_m8"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://arxiv.org/abs/cs.CL/0412098"/><swrc:date>Fri Dec 17 18:47:41 CET 2010</swrc:date><swrc:month>May</swrc:month><swrc:title>{The Google Similarity Distance}</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>automatic-learning, google, linguistics, ontology, semantic </swrc:keywords><swrc:day>30</swrc:day><swrc:abstract>{Words and phrases acquire meaning from the way they are used in society, from
their relative semantics to other words and phrases. For computers the
equivalent of `society&#039; is `database,&#039; and the equivalent of `use&#039; is `way to
search the database.&#039; We present a new theory of similarity between words and
phrases based on information distance and Kolmogorov complexity. To fix
thoughts we use the world-wide-web as database, and Google as search engine.
The method is also applicable to other search engines and databases. This
theory is then applied to construct a method to automatically extract
similarity, the Google similarity distance, of words and phrases from the
world-wide-web using Google page counts. The world-wide-web is the largest
database on earth, and the context information entered by millions of
independent users averages out to provide automatic semantics of useful
quality. We give applications in hierarchical clustering, classification, and
language translation. We give examples to distinguish between colors and
numbers, cluster names of paintings by 17th century Dutch masters and names of
books by English novelists, the ability to understand emergencies, and primes,
and we demonstrate the ability to do a simple automatic English-Spanish
translation. Finally, we use the WordNet database as an objective baseline
against which to judge the performance of our method. We conduct a massive
randomized trial in binary classification using support vector machines to
learn categories based on our Google distance, resulting in an a mean agreement
of 87\% with the expert crafted WordNet categories.}</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="2004-12-28 20:46:48" swrc:key="posted-at"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="arXiv" swrc:key="archiveprefix"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="4" swrc:key="priority"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="4487" swrc:key="citeulike-article-id"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/pdf/cs.CL/0412098" swrc:key="citeulike-linkout-1"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="http://arxiv.org/abs/cs.CL/0412098" swrc:key="citeulike-linkout-0"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="cs.CL/0412098" swrc:key="eprint"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/29d1d18e90d3b3c38d04e78d0471800b8/dblp"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/29d1d18e90d3b3c38d04e78d0471800b8/dblp"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/journals/pr/pr44.html#CilibrasiV11"/><swrc:date>Mon Dec 06 00:00:00 CET 2010</swrc:date><swrc:journal>Pattern Recognition</swrc:journal><swrc:number>3</swrc:number><swrc:pages>662-677</swrc:pages><swrc:title>A Fast Quartet tree heuristic for hierarchical clustering.</swrc:title><swrc:volume>44</swrc:volume><swrc:year>2011</swrc:year><swrc:keywords>dblp </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://dx.doi.org/10.1016/j.patcog.2010.08.033" swrc:key="ee"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Rudi Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Paul M. B. Vitányi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/25797b28e3963b54f8e748b764a3c0896/wyswilson"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/25797b28e3963b54f8e748b764a3c0896/wyswilson"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InCollection"/><owl:sameAs rdf:resource="http://ontology.csse.uwa.edu.au/reference/browse_paper.php?pid=233282036"/><swrc:date>Fri Nov 26 09:32:26 CET 2010</swrc:date><swrc:booktitle>Information Theory and Statistical Learning</swrc:booktitle><swrc:publisher><swrc:Organization swrc:name="New-York: Springer"/></swrc:publisher><swrc:title>Normalized Information Distance</swrc:title><swrc:year>2009</swrc:year><swrc:keywords>imported </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="P. Vitanyi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="F. Balbach"/></rdf:_2><rdf:_3><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_3><rdf:_4><swrc:Person swrc:name="M. Li"/></rdf:_4></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="F. Emmert-Streib"/></rdf:_1><rdf:_2><swrc:Person swrc:name="M. Dehmer"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2049b2bfae97bca112c4153f4742f3ca1/wyswilson"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2049b2bfae97bca112c4153f4742f3ca1/wyswilson"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Misc"/><swrc:date>Fri Nov 26 09:32:26 CET 2010</swrc:date><swrc:address>Seattle, USA</swrc:address><swrc:booktitle>Proceedings of the IEEE International Symposium on Information Theory</swrc:booktitle><swrc:title>Automatic Extraction of Meaning from the Web</swrc:title><swrc:year>2006</swrc:year><swrc:keywords>imported </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="R. Cilibrasi"/></rdf:_1><rdf:_2><swrc:Person swrc:name="P. Vitanyi"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></rdf:RDF>
