<?xml version="1.0" encoding="UTF-8"?>
<!--
  RSS 1.0 (RDF/XML) feed listing the BibSonomy publication posts for
  /user/cschenk/email.

  Layout:
    * one <channel> whose <items> sequence references every <item> by URI;
    * one <item> per post, carrying the RSS core fields, Dublin Core metadata,
      an HTML summary in <content:encoded>, the post's tags as <taxo:topics>,
      and the bibliographic record as an SWRC description inside
      <burst:publication>.

  Text-bearing elements are deliberately kept on a single line: whitespace
  inside them is data, so they must not be re-wrapped or indented.
-->
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/"
         xmlns:burst="http://xmlns.com/burst/0.1/"
         xmlns:xsd="http://www.w3.org/2001/XMLSchema#"
         xmlns="http://purl.org/rss/1.0/"
         xmlns:admin="http://webns.net/mvcb/"
         xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
         xmlns:content="http://purl.org/rss/1.0/modules/content/"
         xmlns:owl="http://www.w3.org/2002/07/owl#"
         xmlns:dc="http://purl.org/dc/elements/1.1/"
         xmlns:syn="http://purl.org/rss/1.0/modules/syndication/"
         xmlns:swrc="http://swrc.ontoware.org/ontology#"
         xmlns:cc="http://web.resource.org/cc/">

  <channel rdf:about="http://www.bibsonomy.org/user/cschenk/email">
    <title>BibSonomy publications for /user/cschenk/email</title>
    <!-- Must be an absolute URL. The generated value started with the literal
         text "BibSonomy" instead of the site base URL; the path is unchanged.
         NOTE(review): confirm this is the intended landing page for the feed. -->
    <link>http://www.bibsonomy.org/burst/user/cschenk/email</link>
    <description>BibSonomy RSS feed for /user/cschenk/email</description>
    <dc:date>2012-02-16T06:44:35+01:00</dc:date>
    <!-- Table of contents: each rdf:li must match the rdf:about of an <item> below. -->
    <items>
      <rdf:Seq>
        <rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/243d2c72e40212957f3d6ed66a4a104b3/cschenk"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/22e725bdb785392dfa38fe4ff68fd965f/cschenk"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/bibtex/2c66fa858b58398f469558c5d85cf8a7a/cschenk"/>
      </rdf:Seq>
    </items>
  </channel>

  <item rdf:about="http://www.bibsonomy.org/bibtex/243d2c72e40212957f3d6ed66a4a104b3/cschenk">
    <title>Blockwerk. IP-Blacklists sinnvoll kombinieren</title>
    <link>http://www.bibsonomy.org/bibtex/243d2c72e40212957f3d6ed66a4a104b3/cschenk</link>
    <dc:creator>cschenk</dc:creator>
    <dc:date>2008-06-30T16:14:54+02:00</dc:date>
    <dc:subject>article blacklists email ip ix read:2008 spam </dc:subject>
    <!-- Escaped HTML fragment; relative hrefs are resolved by the consumer. -->
    <content:encoded>&lt;span class=&quot;authorEditorList&quot;&gt;&lt;a href=&quot;/author/Rossow&quot;&gt;Christian Rossow&lt;/a&gt;, &lt;a href=&quot;/author/Dietrich&quot;&gt;Christian Dietrich&lt;/a&gt;,  and &lt;a href=&quot;/author/Pohlmann&quot;&gt;Norbert Pohlmann&lt;/a&gt; &lt;/span&gt;&lt;em&gt;iX&lt;/em&gt;  (&lt;em&gt;January 2008&lt;/em&gt;)</content:encoded>
    <taxo:topics>
      <rdf:Bag>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/article"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/blacklists"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/email"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/ip"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/ix"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/read:2008"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/spam"/>
      </rdf:Bag>
    </taxo:topics>
    <burst:publication>
      <rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/243d2c72e40212957f3d6ed66a4a104b3/cschenk">
        <owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/243d2c72e40212957f3d6ed66a4a104b3/cschenk"/>
        <rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/>
        <swrc:date>Mon Jun 30 16:14:54 CEST 2008</swrc:date>
        <swrc:journal>iX</swrc:journal>
        <swrc:month>Januar</swrc:month>
        <swrc:pages>56-61</swrc:pages>
        <swrc:title>Blockwerk. IP-Blacklists sinnvoll kombinieren</swrc:title>
        <swrc:volume>1</swrc:volume>
        <swrc:year>2008</swrc:year>
        <swrc:keywords>article blacklists email ip ix read:2008 spam </swrc:keywords>
        <swrc:author>
          <rdf:Seq>
            <rdf:_1>
              <swrc:Person swrc:name="Christian Rossow"/>
            </rdf:_1>
            <rdf:_2>
              <swrc:Person swrc:name="Christian Dietrich"/>
            </rdf:_2>
            <rdf:_3>
              <swrc:Person swrc:name="Norbert Pohlmann"/>
            </rdf:_3>
          </rdf:Seq>
        </swrc:author>
      </rdf:Description>
    </burst:publication>
  </item>

  <item rdf:about="http://www.bibsonomy.org/bibtex/22e725bdb785392dfa38fe4ff68fd965f/cschenk">
    <title>Vorsorgemaßnahmen. Korrekter Umgang mit E-Mail-Adressen</title>
    <link>http://www.bibsonomy.org/bibtex/22e725bdb785392dfa38fe4ff68fd965f/cschenk</link>
    <dc:creator>cschenk</dc:creator>
    <dc:date>2008-06-30T16:03:06+02:00</dc:date>
    <dc:subject>adressen article email ix newsletter read:2008 spam </dc:subject>
    <content:encoded>&lt;span class=&quot;authorEditorList&quot;&gt;&lt;a href=&quot;/author/Ungerer&quot;&gt;Bert Ungerer&lt;/a&gt; &lt;/span&gt;&lt;em&gt;iX&lt;/em&gt;  (&lt;em&gt;January 2008&lt;/em&gt;)</content:encoded>
    <taxo:topics>
      <rdf:Bag>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/adressen"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/article"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/email"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/ix"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/newsletter"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/read:2008"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/spam"/>
      </rdf:Bag>
    </taxo:topics>
    <burst:publication>
      <rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/22e725bdb785392dfa38fe4ff68fd965f/cschenk">
        <owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/22e725bdb785392dfa38fe4ff68fd965f/cschenk"/>
        <rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/>
        <swrc:date>Mon Jun 30 16:03:06 CEST 2008</swrc:date>
        <swrc:journal>iX</swrc:journal>
        <swrc:month>Januar</swrc:month>
        <swrc:pages>48-54</swrc:pages>
        <swrc:title>Vorsorgemaßnahmen. Korrekter Umgang mit E-Mail-Adressen</swrc:title>
        <swrc:volume>1</swrc:volume>
        <swrc:year>2008</swrc:year>
        <swrc:keywords>adressen article email ix newsletter read:2008 spam </swrc:keywords>
        <swrc:author>
          <rdf:Seq>
            <rdf:_1>
              <swrc:Person swrc:name="Bert Ungerer"/>
            </rdf:_1>
          </rdf:Seq>
        </swrc:author>
      </rdf:Description>
    </burst:publication>
  </item>

  <item rdf:about="http://www.bibsonomy.org/bibtex/2c66fa858b58398f469558c5d85cf8a7a/cschenk">
    <title>Automatic Categorization of Email into Folders: Benchmark Experiments on Enron and SRI Corpora</title>
    <link>http://www.bibsonomy.org/bibtex/2c66fa858b58398f469558c5d85cf8a7a/cschenk</link>
    <dc:creator>cschenk</dc:creator>
    <dc:date>2008-06-21T18:52:26+02:00</dc:date>
    <dc:subject>algorithms automatic bayes benchmark categorization classification email enron folders information ir paper read:2008 retrieval sri svm winnow </dc:subject>
    <content:encoded>&lt;span class=&quot;authorEditorList&quot;&gt;&lt;a href=&quot;/author/Bekkerman&quot;&gt;R. Bekkerman&lt;/a&gt;, &lt;a href=&quot;/author/McCallum&quot;&gt;A. McCallum&lt;/a&gt;,  and &lt;a href=&quot;/author/Huang&quot;&gt;G. Huang&lt;/a&gt; &lt;/span&gt;&lt;em&gt;Center for Intelligent Information Retrieval, Technical Report IR&lt;/em&gt;  (&lt;em&gt;2004&lt;/em&gt;)</content:encoded>
    <taxo:topics>
      <rdf:Bag>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/algorithms"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/automatic"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/bayes"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/benchmark"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/categorization"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/classification"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/email"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/enron"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/folders"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/information"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/ir"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/paper"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/read:2008"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/retrieval"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/sri"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/svm"/>
        <rdf:li rdf:resource="http://www.bibsonomy.org/tag/winnow"/>
      </rdf:Bag>
    </taxo:topics>
    <burst:publication>
      <rdf:Description rdf:about="http://www.bibsonomy.org/bibtex/2c66fa858b58398f469558c5d85cf8a7a/cschenk">
        <owl:sameAs rdf:resource="http://www.bibsonomy.org/uri/bibtex/2c66fa858b58398f469558c5d85cf8a7a/cschenk"/>
        <rdf:type rdf:resource="http://swrc.ontoware.org/ontology#Article"/>
        <swrc:date>Sat Jun 21 18:52:26 CEST 2008</swrc:date>
        <swrc:journal>Center for Intelligent Information Retrieval, Technical Report IR</swrc:journal>
        <swrc:title>Automatic Categorization of Email into Folders: Benchmark Experiments on Enron and SRI Corpora</swrc:title>
        <swrc:volume>418</swrc:volume>
        <swrc:year>2004</swrc:year>
        <swrc:keywords>algorithms automatic bayes benchmark categorization classification email enron folders information ir paper read:2008 retrieval sri svm winnow </swrc:keywords>
        <swrc:abstract>Office workers everywhere are drowning in email—not only spam, but also large quantities of legitimate email to be read and organized for browsing. Although there have been extensive investigations of automatic document categorization, email gives rise to a number of unique challenges, and there has been relatively little study of classifying email into folders. This paper presents an extensive benchmark study of email foldering using two large corpora of real-world email messages and foldering schemes: one from former Enron employees, another from participants in an SRI research project. We discuss the challenges that arise from differences between email foldering and traditional document classification. We show experimental results from an array of automated classification methods and evaluation methodologies, including a new evaluation method of foldering results based on the email timeline, and including enhancements to the exponential gradient method Winnow, providing top-tier accuracy with a fraction the training time of alternative methods. We also establish that classification accuracy in many cases is relatively low, confirming the challenges of email data, and pointing toward email foldering as an important area for further research.</swrc:abstract>
        <swrc:author>
          <rdf:Seq>
            <rdf:_1>
              <swrc:Person swrc:name="R. Bekkerman"/>
            </rdf:_1>
            <rdf:_2>
              <swrc:Person swrc:name="A. McCallum"/>
            </rdf:_2>
            <rdf:_3>
              <swrc:Person swrc:name="G. Huang"/>
            </rdf:_3>
          </rdf:Seq>
        </swrc:author>
      </rdf:Description>
    </burst:publication>
  </item>

</rdf:RDF>
