<rdf:RDF xmlns:burst="http://xmlns.com/burst/0.1/" xmlns:admin="http://webns.net/mvcb/" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:syn="http://purl.org/rss/1.0/modules/syndication/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:cc="http://web.resource.org/cc/" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:swrc="http://swrc.ontoware.org/ontology#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns="http://purl.org/rss/1.0/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"><channel rdf:about="http://www.bibsonomy.org/burst/user/renew/topic"><title>BibSonomy publications for /user/renew/topic</title><link>http://www.bibsonomy.org/burst/user/renew/topic</link><description>BibSonomy BuRST Feed for /user/renew/topic</description><dc:date>2008-07-26T21:29:50+02:00</dc:date><items><rdf:Seq><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/25f0e2f5fef43b240f92eaa24fd203cc0/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/28ca69f31e7ab051f5576807162bf31bb/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/247d9bbc0a4295471084bffaf29c75d74/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2f81bc9315be5c3fb426ee22b2508c4d6/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/25095275ddb32f4138ee5018a6a4f3fc6/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2c0663174db640752e756736e636e0cf9/renew"/><rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/220fb4bab61662864357a9edf960a9b9b/renew"/></rdf:Seq></items></channel><item rdf:about="http://www.bibsonomy.org/bibtex/25f0e2f5fef43b240f92eaa24fd203cc0/renew"><title>NIST's 1998 Topic Detection and Tracking Evaluation (TDT2)</title><description>The big one</description><link>http://www.bibsonomy.org/bibtex/25f0e2f5fef43b240f92eaa24fd203cc0/renew</link><dc:creator>renew</dc:creator><dc:date>2008-04-21T13:44:43+02:00</dc:date><dc:subject>tracking topic evaluation detection tdt </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Jonathan G. &lt;a href=&#034;http://www.bibsonomy.org/author/Fiscus&#034;&gt;Fiscus&lt;/a&gt;  and George &lt;a href=&#034;http://www.bibsonomy.org/author/Doddington&#034;&gt;Doddington&lt;/a&gt;  and John S. &lt;a href=&#034;http://www.bibsonomy.org/author/Garofolo&#034;&gt;Garofolo&lt;/a&gt;  and Alvin &lt;a href=&#034;http://www.bibsonomy.org/author/Martin&#034;&gt;Martin&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Proc. of the DARPA Broadcast News Workshop, &lt;/em&gt;&lt;em&gt;Virginia, US, &lt;/em&gt;(&lt;em&gt;1998&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/tracking"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/evaluation"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/detection"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/tdt"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/25f0e2f5fef43b240f92eaa24fd203cc0/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/25f0e2f5fef43b240f92eaa24fd203cc0/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><swrc:date>Mon Apr 21 13:44:43 CEST 2008</swrc:date><swrc:address>Virginia, US</swrc:address><swrc:booktitle>Proc. of the DARPA Broadcast News Workshop</swrc:booktitle><swrc:title>NIST&#039;s 1998 Topic Detection and Tracking Evaluation (TDT2)</swrc:title><swrc:year>1998</swrc:year><swrc:keywords>tracking topic evaluation detection tdt </swrc:keywords><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Jonathan G. Fiscus"/></rdf:_1><rdf:_2><swrc:Person swrc:name="George Doddington"/></rdf:_2><rdf:_3><swrc:Person swrc:name="John S. Garofolo"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Alvin Martin"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/28ca69f31e7ab051f5576807162bf31bb/renew"><title>Topic Detection and Tracking with Spatio-Temporal Evidence.</title><description>dblp</description><link>http://www.bibsonomy.org/bibtex/28ca69f31e7ab051f5576807162bf31bb/renew</link><dc:creator>renew</dc:creator><dc:date>2008-04-21T13:05:32+02:00</dc:date><dc:subject>detection temporal topic tdt </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Juha &lt;a href=&#034;http://www.bibsonomy.org/author/Makkonen&#034;&gt;Makkonen&lt;/a&gt;  and Helena &lt;a href=&#034;http://www.bibsonomy.org/author/Ahonen-Myka&#034;&gt;Ahonen-Myka&lt;/a&gt;  and Marko &lt;a href=&#034;http://www.bibsonomy.org/author/Salmenkivi&#034;&gt;Salmenkivi&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;ECIR, &lt;/em&gt;&lt;em&gt;volume2633ofLecture Notes in Computer Science, &lt;/em&gt;&lt;em&gt;page251-265. &lt;/em&gt;&lt;em&gt;Springer, &lt;/em&gt;(&lt;em&gt;2003&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/detection"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/temporal"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/tdt"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/28ca69f31e7ab051f5576807162bf31bb/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/28ca69f31e7ab051f5576807162bf31bb/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/conf/ecir/ecir2003.html#MakkonenAS03"/><swrc:date>Mon Apr 21 13:05:32 CEST 2008</swrc:date><swrc:booktitle>ECIR</swrc:booktitle><swrc:crossref>conf/ecir/2003</swrc:crossref><swrc:pages>251-265</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Springer"/></swrc:publisher><swrc:series>Lecture Notes in Computer Science</swrc:series><swrc:title>Topic Detection and Tracking with Spatio-Temporal Evidence.</swrc:title><swrc:volume>2633</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>detection temporal topic tdt </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://link.springer.de/link/service/series/0558/bibs/2633/26330251.htm" swrc:key="ee"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="3-540-01274-5" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="2003-04-30" swrc:key="date"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Juha Makkonen"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Helena Ahonen-Myka"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Marko Salmenkivi"/></rdf:_3></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="Fabrizio Sebastiani"/></rdf:_1></rdf:Seq></swrc:editor></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/247d9bbc0a4295471084bffaf29c75d74/renew"><title>Utilizing Temporal Information in Topic Detection and Tracking.</title><description>dblp</description><link>http://www.bibsonomy.org/bibtex/247d9bbc0a4295471084bffaf29c75d74/renew</link><dc:creator>renew</dc:creator><dc:date>2008-04-21T13:02:44+02:00</dc:date><dc:subject>tdt temporal detection topic </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Juha &lt;a href=&#034;http://www.bibsonomy.org/author/Makkonen&#034;&gt;Makkonen&lt;/a&gt;  and Helena &lt;a href=&#034;http://www.bibsonomy.org/author/Ahonen-Myka&#034;&gt;Ahonen-Myka&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;ECDL, &lt;/em&gt;&lt;em&gt;volume2769ofLecture Notes in Computer Science, &lt;/em&gt;&lt;em&gt;page393-404. &lt;/em&gt;&lt;em&gt;Springer, &lt;/em&gt;(&lt;em&gt;2003&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/tdt"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/temporal"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/detection"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/247d9bbc0a4295471084bffaf29c75d74/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/247d9bbc0a4295471084bffaf29c75d74/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/conf/ercimdl/ecdl2003.html#MakkonenA03"/><swrc:date>Mon Apr 21 13:02:44 CEST 2008</swrc:date><swrc:booktitle>ECDL</swrc:booktitle><swrc:crossref>conf/ercimdl/2003</swrc:crossref><swrc:pages>393-404</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Springer"/></swrc:publisher><swrc:series>Lecture Notes in Computer Science</swrc:series><swrc:title>Utilizing Temporal Information in Topic Detection and Tracking.</swrc:title><swrc:volume>2769</swrc:volume><swrc:year>2003</swrc:year><swrc:keywords>tdt temporal detection topic </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="3-540-40726-X" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="2003-10-10" swrc:key="date"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Juha Makkonen"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Helena Ahonen-Myka"/></rdf:_2></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="Traugott Koch"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Ingeborg Sølvberg"/></rdf:_2></rdf:Seq></swrc:editor></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2f81bc9315be5c3fb426ee22b2508c4d6/renew"><title>A Dynamic Probabilistic Model to Visualise Topic Evolution in Text Streams</title><link>http://www.bibsonomy.org/bibtex/2f81bc9315be5c3fb426ee22b2508c4d6/renew</link><dc:creator>renew</dc:creator><dc:date>2008-04-21T12:58:08+02:00</dc:date><dc:subject>tdt visualization evolution topic </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Ata &lt;a href=&#034;http://www.bibsonomy.org/author/Kaban&#034;&gt;Kaban&lt;/a&gt;  and Mark &lt;a href=&#034;http://www.bibsonomy.org/author/Girolami&#034;&gt;Girolami&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Journal of Intelligent Information Systems&lt;/em&gt;&lt;em&gt;18(2/3):107--125&lt;/em&gt;(&lt;em&gt;2002&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/tdt"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/visualization"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/evolution"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2f81bc9315be5c3fb426ee22b2508c4d6/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2f81bc9315be5c3fb426ee22b2508c4d6/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://www.wkap.nl/article.pdf?391242"/><swrc:date>Mon Apr 21 12:58:08 CEST 2008</swrc:date><swrc:journal>Journal of Intelligent Information Systems</swrc:journal><swrc:number>2/3</swrc:number><swrc:pages>107--125</swrc:pages><swrc:title>A Dynamic Probabilistic Model to Visualise Topic Evolution in Text Streams</swrc:title><swrc:volume>18</swrc:volume><swrc:year>2002</swrc:year><swrc:keywords>tdt visualization evolution topic </swrc:keywords><swrc:abstract>We propose a novel probabilistic method, based on latent variable models, for unsupervised topographic visualisation of dynamically evolving, coherent textual information. This can be seen as a complementary tool for topic detection and tracking applications. This is achieved by the exploitation of the a priori domain knowledge available, that there are relatively homogeneous temporal segments in the data stream. In a different manner from topographical techniques previously utilized for static text collections, the topography is an outcome of the coherence in time of the data stream in the proposed model. Simulation results on both toy-data settings and an actual application on Internet chat line discussion analysis is presented by way of demonstration.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="393563" swrc:key="id"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="3" swrc:key="priority"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="Special Issue on Automated Text Categorization" swrc:key="comment"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Ata Kaban"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Mark Girolami"/></rdf:_2></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/25095275ddb32f4138ee5018a6a4f3fc6/renew"><title>Topic discovery based on text mining techniques</title><description>Topic discovery based on text mining techniques</description><link>http://www.bibsonomy.org/bibtex/25095275ddb32f4138ee5018a6a4f3fc6/renew</link><dc:creator>renew</dc:creator><dc:date>2008-02-23T00:37:49+01:00</dc:date><dc:subject>topic mining detection text </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Aurora &lt;a href=&#034;http://www.bibsonomy.org/author/Pons-Porrata&#034;&gt;Pons-Porrata&lt;/a&gt;  and Rafael &lt;a href=&#034;http://www.bibsonomy.org/author/Berlanga-Llavori&#034;&gt;Berlanga-Llavori&lt;/a&gt;  and Jos&#039;e &lt;a href=&#034;http://www.bibsonomy.org/author/Ruiz-Shulcloper&#034;&gt;Ruiz-Shulcloper&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Inf. Process. Manage.&lt;/em&gt;&lt;em&gt;43(3):752--768&lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/mining"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/detection"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/text"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/25095275ddb32f4138ee5018a6a4f3fc6/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/25095275ddb32f4138ee5018a6a4f3fc6/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/><owl:sameAs rdf:resource="http://portal.acm.org/citation.cfm?id=1224718"/><swrc:date>Sat Feb 23 00:37:49 CET 2008</swrc:date><swrc:address>Tarrytown, NY, USA</swrc:address><swrc:journal>Inf. Process. Manage.</swrc:journal><swrc:number>3</swrc:number><swrc:pages>752--768</swrc:pages><swrc:publisher><swrc:Organization swrc:name="Pergamon Press, Inc."/></swrc:publisher><swrc:title>Topic discovery based on text mining techniques</swrc:title><swrc:volume>43</swrc:volume><swrc:year>2007</swrc:year><swrc:keywords>topic mining detection text </swrc:keywords><swrc:abstract>In this paper, we present a topic discovery system aimed to reveal the implicit knowledge present in news streams. This knowledge is expressed as a hierarchy of topic/subtopics, where each topic contains the set of documents that are related to it and a summary extracted from these documents. Summaries so built are useful to browse and select topics of interest from the generated hierarchies. Our proposal consists of a new incremental hierarchical clustering algorithm, which combines both partitional and agglomerative approaches, taking the main benefits from them. Finally, a new summarization method based on Testor Theory has been proposed to build the topic summaries. Experimental results in the TDT2 collection demonstrate its usefulness and effectiveness not only as a topic detection system, but also as a classification and summarization tool.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="0306-4573" swrc:key="issn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="http://dx.doi.org/10.1016/j.ipm.2006.06.001" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Aurora Pons-Porrata"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Rafael Berlanga-Llavori"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Jos\&#039;{e} Ruiz-Shulcloper"/></rdf:_3></rdf:Seq></swrc:author></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/2c0663174db640752e756736e636e0cf9/renew"><title>BuzzTrack: topic detection and tracking in email.</title><description>dblp</description><link>http://www.bibsonomy.org/bibtex/2c0663174db640752e756736e636e0cf9/renew</link><dc:creator>renew</dc:creator><dc:date>2008-02-22T02:37:01+01:00</dc:date><dc:subject>detection topic email </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Gabor &lt;a href=&#034;http://www.bibsonomy.org/author/Cselle&#034;&gt;Cselle&lt;/a&gt;  and Keno &lt;a href=&#034;http://www.bibsonomy.org/author/Albrecht&#034;&gt;Albrecht&lt;/a&gt;  and Roger &lt;a href=&#034;http://www.bibsonomy.org/author/Wattenhofer&#034;&gt;Wattenhofer&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;Intelligent User Interfaces, &lt;/em&gt;&lt;em&gt;page190-197. &lt;/em&gt;&lt;em&gt;ACM, &lt;/em&gt;(&lt;em&gt;2007&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/detection"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/><rdf:li rdf:resource="http://www.bibsonomy.org/tag/email"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2c0663174db640752e756736e636e0cf9/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2c0663174db640752e756736e636e0cf9/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://dblp.uni-trier.de/db/conf/iui/iui2007.html#CselleAW07"/><swrc:date>Fri Feb 22 02:37:01 CET 2008</swrc:date><swrc:booktitle>Intelligent User Interfaces</swrc:booktitle><swrc:crossref>conf/iui/2007</swrc:crossref><swrc:pages>190-197</swrc:pages><swrc:publisher><swrc:Organization swrc:name="ACM"/></swrc:publisher><swrc:title>BuzzTrack: topic detection and tracking in email.</swrc:title><swrc:year>2007</swrc:year><swrc:keywords>detection topic email </swrc:keywords><swrc:hasExtraField><swrc:Field swrc:value="http://doi.acm.org/10.1145/1216295.1216331" swrc:key="ee"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="1-59593-481-2" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="2007-04-30" swrc:key="date"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Gabor Cselle"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Keno Albrecht"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Roger Wattenhofer"/></rdf:_3></rdf:Seq></swrc:author><swrc:editor><rdf:Seq><rdf:_1><swrc:Person swrc:name="David N. Chin"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Michelle X. Zhou"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Tessa A. Lau"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Angel R. Puerta"/></rdf:_4></rdf:Seq></swrc:editor></rdf:Description></burst:publication></item><item rdf:about="http://www.bibsonomy.org/bibtex/220fb4bab61662864357a9edf960a9b9b/renew"><title>Probabilistic author-topic models for information discovery</title><link>http://www.bibsonomy.org/bibtex/220fb4bab61662864357a9edf960a9b9b/renew</link><dc:creator>renew</dc:creator><dc:date>2008-02-22T02:35:49+01:00</dc:date><dc:subject>topic </dc:subject><content:encoded>&lt;span style=&#034;color:#555555;&#034;&gt;Mark &lt;a href=&#034;http://www.bibsonomy.org/author/Steyvers&#034;&gt;Steyvers&lt;/a&gt;  and Padhraic &lt;a href=&#034;http://www.bibsonomy.org/author/Smyth&#034;&gt;Smyth&lt;/a&gt;  and Michal &lt;a href=&#034;http://www.bibsonomy.org/author/Rosen-Zvi&#034;&gt;Rosen-Zvi&lt;/a&gt;  and Thomas &lt;a href=&#034;http://www.bibsonomy.org/author/Griffiths&#034;&gt;Griffiths&lt;/a&gt;  &lt;/span&gt;&lt;em&gt;KDD &#039;04: Proceedings of the tenth ACM SIGKDD international conference on Knowledge discovery and data mining, &lt;/em&gt;&lt;em&gt;page306--315. &lt;/em&gt;&lt;em&gt;New York, NY, USA, &lt;/em&gt;&lt;em&gt;ACM Press, &lt;/em&gt;(&lt;em&gt;2004&lt;/em&gt;)</content:encoded><taxo:topics><rdf:Bag><rdf:li rdf:resource="http://www.bibsonomy.org/tag/topic"/></rdf:Bag></taxo:topics><burst:publication><rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/220fb4bab61662864357a9edf960a9b9b/renew"><owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/220fb4bab61662864357a9edf960a9b9b/renew"/><rdf:type rdf:resource="http://swrc.ontoware.org/ontology#InProceedings"/><owl:sameAs rdf:resource="http://dx.doi.org/10.1145/1014052.1014087"/><swrc:date>Fri Feb 22 02:35:49 CET 2008</swrc:date><swrc:address>New York, NY, USA</swrc:address><swrc:booktitle>KDD &#039;04: Proceedings of the tenth ACM SIGKDD international conference on Knowledge discovery and data mining</swrc:booktitle><swrc:pages>306--315</swrc:pages><swrc:publisher><swrc:Organization swrc:name="ACM Press"/></swrc:publisher><swrc:title>Probabilistic author-topic models for information discovery</swrc:title><swrc:year>2004</swrc:year><swrc:keywords>topic </swrc:keywords><swrc:abstract>We propose a new unsupervised learning technique for extracting information from large text collections. We model documents as if they were generated by a two-stage stochastic process. Each author is represented by a probability distribution over topics, and each topic is represented as a probability distribution over words for that topic. The words in a multi-author paper are assumed to be the result of a mixture of each authors&#039; topic mixture. The topic-word and author-topic distributions are learned from data in an unsupervised manner using a Markov chain Monte Carlo algorithm. We apply the methodology to a large corpus of 160,000 abstracts and 85,000 authors from the well-known CiteSeer digital library, and learn a model with 300 topics. We discuss in detail the interpretation of the results discovered by the system including specific topic and author models, ranking of authors by topic and topics by author, significant trends in the computer science literature between 1990 and 2002, parsing of abstracts by topics and authors and detection of unusual papers by specific authors. An online query interface to the model is also discussed that allows interactive exploration of author-topic models for corpora such as CiteSeer.</swrc:abstract><swrc:hasExtraField><swrc:Field swrc:value="378119" swrc:key="id"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="0" swrc:key="priority"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="1581138889" swrc:key="isbn"/></swrc:hasExtraField><swrc:hasExtraField><swrc:Field swrc:value="10.1145/1014052.1014087" swrc:key="doi"/></swrc:hasExtraField><swrc:author><rdf:Seq><rdf:_1><swrc:Person swrc:name="Mark Steyvers"/></rdf:_1><rdf:_2><swrc:Person swrc:name="Padhraic Smyth"/></rdf:_2><rdf:_3><swrc:Person swrc:name="Michal Rosen-Zvi"/></rdf:_3><rdf:_4><swrc:Person swrc:name="Thomas Griffiths"/></rdf:_4></rdf:Seq></swrc:author></rdf:Description></burst:publication></item></rdf:RDF>