<?xml version="1.0" encoding="UTF-8"?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:burst="http://xmlns.com/burst/0.1/" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns="http://purl.org/rss/1.0/" xmlns:admin="http://webns.net/mvcb/" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:swrc="http://swrc.ontoware.org/ontology#" xmlns:cc="http://web.resource.org/cc/"><channel rdf:about="http://www.bibsonomy.org/user/pitman/ml"><title>BibSonomy publications for /user/pitman/ml</title><link>BibSonomyburst/user/pitman/ml</link><description>BibSonomy RSS feed for /user/pitman/ml</description><dc:date>2012-02-15T20:13:44+01:00</dc:date><items><rdf:Seq><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/24ce9a832df16ba8a0c876b9c71c8461d/pitman"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2e1c6f29f7a54860167cbfd035f31eb39/pitman"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2624d2a29008c475245aa0bca052e7c0f/pitman"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2b2e5eae7c1cc273831d431b2c833f835/pitman"/></rdf:Seq></items></channel><item rdf:about="http://www.bibsonomy.org/bibtex/24ce9a832df16ba8a0c876b9c71c8461d/pitman"><title>Hierarchical mixture models: a probabilistic analysis</title><link>http://www.bibsonomy.org/bibtex/24ce9a832df16ba8a0c876b9c71c8461d/pitman</link><dc:creator>pitman</dc:creator><dc:date>2008-01-15T05:49:09+01:00</dc:date><dc:subject>classification ml </dc:subject><content:encoded>&lt;span class=&#034;authorEditorList&#034;&gt;&lt;a href=&#034;/author/Sandler&#034;&gt;Mark Sandler&lt;/a&gt; &lt;/span&gt;&lt;em&gt;KDD &amp;#039;07: Proceedings of the 13th ACM SIGKDD international conference on Knowledge discovery and data mining, &lt;/em&gt;&lt;em&gt;page 580--589. &lt;/em&gt;&lt;em&gt;New York, NY, USA, &lt;/em&gt;&lt;em&gt;ACM, &lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/classification"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/ml"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/24ce9a832df16ba8a0c876b9c71c8461d/pitman"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/24ce9a832df16ba8a0c876b9c71c8461d/pitman"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://portal.acm.org/citation.cfm?doid=1281192.1281255"/><swrc:date>Tue Jan 15 05:49:09 CET 2008</swrc:date><swrc:address>New York, NY, USA</swrc:address><swrc:booktitle>KDD &#039;07: Proceedings of the 13th ACM SIGKDD international conference on Knowledge discovery and data mining</swrc:booktitle><swrc:pages>580--589</swrc:pages><swrc:publisher><swrc:Organization swrc:name="ACM"/></swrc:publisher><swrc:title>Hierarchical mixture models: a probabilistic analysis</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>classification ml </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="San Jose, California, USA" swrc:key="location"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="978-1-59593-609-7" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="http://doi.acm.org/10.1145/1281192.1281255" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Mark Sandler"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication><description>Hierarchical mixture models</description></item><item rdf:about="http://www.bibsonomy.org/bibtex/2e1c6f29f7a54860167cbfd035f31eb39/pitman"><title>Algorithmic learning theory</title><link>http://www.bibsonomy.org/bibtex/2e1c6f29f7a54860167cbfd035f31eb39/pitman</link><dc:creator>pitman</dc:creator><dc:date>2008-01-15T01:27:53+01:00</dc:date><dc:subject>algorithmic learning ml theory </dc:subject><content:encoded>&lt;span class=&#034;authorEditorList&#034;&gt;&lt;a href=&#034;/author/Abe&#034;&gt;N. Abe&lt;/a&gt;,  and &lt;a href=&#034;/author/Khardon&#034;&gt;R. Khardon&lt;/a&gt; (Eds.).
		 &lt;/span&gt;&lt;em&gt;Elsevier Science Publishers B.V., &lt;/em&gt;&lt;em&gt;Amsterdam, &lt;/em&gt;(&lt;em&gt;2004&lt;/em&gt;)&lt;em&gt;Papers from the 12th Annual Conference ALT&amp;#039;01 held in Washington, DC, November 25--28, 2001, Theoret. Comput. Sci. \bf 313 2004, no. 2
		    .
	    &lt;/em&gt;</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/algorithmic"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/learning"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/ml"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/theory"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2e1c6f29f7a54860167cbfd035f31eb39/pitman"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2e1c6f29f7a54860167cbfd035f31eb39/pitman"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Book"/><swrc:date>Tue Jan 15 01:27:53 CET 2008</swrc:date><swrc:address>Amsterdam</swrc:address><swrc:note>Papers from the 12th Annual Conference (ALT&#039;01) held in Washington, DC, November 25--28, 2001, Theoret. Comput. Sci. {\bf 313} (2004), no. 2</swrc:note><swrc:pages>i--iv and 173--</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Elsevier Science Publishers B.V."/></swrc:publisher><swrc:title>Algorithmic learning theory</swrc:title><swrc:year>2004</swrc:year><swrc:keywords>algorithmic learning ml theory </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="MR2051784" swrc:key="mrnumber"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="0304-3975" swrc:key="issn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="68-06 (68Q32 68T05)" swrc:key="mrclass"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="TCSDI" swrc:key="coden"/></swrc:hasExtraField><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="N. Abe"/></rdf:_1><rdf:_2><swrc:Person swrc:name="R. Khardon"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description></burst:publication><description>MR lookup</description></item><item rdf:about="http://www.bibsonomy.org/bibtex/2624d2a29008c475245aa0bca052e7c0f/pitman"><title>Efficient topic-based unsupervised name disambiguation</title><link>http://www.bibsonomy.org/bibtex/2624d2a29008c475245aa0bca052e7c0f/pitman</link><dc:creator>pitman</dc:creator><dc:date>2008-01-09T01:08:56+01:00</dc:date><dc:subject>ml </dc:subject><content:encoded>&lt;span class=&#034;authorEditorList&#034;&gt;&lt;a href=&#034;/author/Song&#034;&gt;Yang Song&lt;/a&gt;, &lt;a href=&#034;/author/Huang&#034;&gt;Jian Huang&lt;/a&gt;, &lt;a href=&#034;/author/Councill&#034;&gt;Isaac G. Councill&lt;/a&gt;, &lt;a href=&#034;/author/Li&#034;&gt;Jia Li&lt;/a&gt;,  and &lt;a href=&#034;/author/Giles&#034;&gt;C. Lee Giles&lt;/a&gt; &lt;/span&gt;&lt;em&gt;JCDL &amp;#039;07: Proceedings of the 2007 conference on Digital libraries, &lt;/em&gt;&lt;em&gt;page 342--351. &lt;/em&gt;&lt;em&gt;New York, NY, USA, &lt;/em&gt;&lt;em&gt;ACM, &lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/ml"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2624d2a29008c475245aa0bca052e7c0f/pitman"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2624d2a29008c475245aa0bca052e7c0f/pitman"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://clgiles.ist.psu.edu/papers/JCDL2007-topic_based_name_disambiguation.pdf "/><swrc:date>Wed Jan 09 01:08:56 CET 2008</swrc:date><swrc:address>New York, NY, USA</swrc:address><swrc:booktitle>JCDL &#039;07: Proceedings of the 2007 conference on Digital libraries</swrc:booktitle><swrc:pages>342--351</swrc:pages><swrc:publisher><swrc:Organization swrc:name="ACM"/></swrc:publisher><swrc:title>Efficient topic-based unsupervised name disambiguation</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>ml </swrc:keywords><swrc:abstract>Name ambiguity is a special case of identity uncertainty where one person can be referenced by multiple name variations in different situations or even share the same name with other people. In this paper, we focus on the problem of disambiguating person names within web pages and scientific documents. We present an efficient and effective two-stage approach to disambiguate names. In the first stage, two novel topic-based models are proposed by extending two hierarchical Bayesian text models, namely Probabilistic Latent Semantic Analysis (PLSA) and Latent Dirichlet Allocation (LDA). Our models explicitly introduce a new variable for persons and learn the distribution of topics with regard to persons and words. After learning an initial model, the topic distributions are treated as feature sets and names are disambiguated by leveraging a hierarchical agglomerative clustering method. Experiments on web data and scientific documents from CiteSeer indicate that our approach consistently outperforms other unsupervised learning methods such as spectral clustering and DBSCAN clustering and could be extended to other research fields. We empirically addressed the issue of scalability by disambiguating authors in over 750,000 papers from the entire CiteSeer dataset.

</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="http://portal.acm.org/citation.cfm?id=1255243" swrc:key="acm"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="Vancouver, BC, Canada" swrc:key="location"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="978-1-59593-644-8" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="http://doi.acm.org/10.1145/1255175.1255243" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Yang Song"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Jian Huang"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Isaac G. Councill"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Jia Li"/></rdf:_4><rdf:_5><swrc:Person swrc:name="C. Lee Giles"/></rdf:_5></rdf:Seq></swrc:author></rdf:Description></burst:publication><description>Efficient topic-based unsupervised name disambiguation</description></item><item rdf:about="http://www.bibsonomy.org/bibtex/2b2e5eae7c1cc273831d431b2c833f835/pitman"><title>Generating Summary Keywords for Emails Using Topics</title><link>http://www.bibsonomy.org/bibtex/2b2e5eae7c1cc273831d431b2c833f835/pitman</link><dc:creator>pitman</dc:creator><dc:date>2008-01-09T00:18:12+01:00</dc:date><dc:subject>ml </dc:subject><content:encoded>&lt;span class=&#034;authorEditorList&#034;&gt;&lt;a href=&#034;/author/et al&#034;&gt;C.L. Giles et al&lt;/a&gt; &lt;/span&gt;(&lt;em&gt;2008&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/ml"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2b2e5eae7c1cc273831d431b2c833f835/pitman"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2b2e5eae7c1cc273831d431b2c833f835/pitman"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Unpublished"/><owl:sameAs rdf:resource="http://www.seas.upenn.edu/~mdredze/publications/dredze_summarization_iui08.pdf"/><swrc:date>Wed Jan 09 00:18:12 CET 2008</swrc:date><swrc:title>Generating Summary Keywords for Emails Using Topics</swrc:title><swrc:year>2008</swrc:year><swrc:keywords>ml </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="C.L. Giles et al"/></rdf:_1></rdf:Seq></swrc:author></rdf:Description></burst:publication></item></rdf:RDF>
