% Bibliography entries exported from BibSonomy / DBLP (works with an author named Craven).
%
% Conventions used in this file:
%   - one field per line, fields kept in the exporter's alphabetical order;
%   - page and issue ranges use a double hyphen;
%   - non-ASCII letters are written as LaTeX accent escapes so the file works
%     with classic 8-bit BibTeX as well as Biber;
%   - proper nouns and acronyms in titles are brace-protected against
%     sentence-casing styles; titles carry no trailing period;
%   - a bare doi field is given wherever the ee link is a DOI resolver URL;
%   - added-at, biburl, ee, interhash and intrahash are exporter bookkeeping
%     fields that standard styles ignore; they are preserved verbatim.
%
% Entries with a crossref field inherit from a parent entry that is not part
% of this section; with classic BibTeX that parent must appear later in the
% database than every entry that refers to it.

% Journal article: Artificial Intelligence 118(1--2), 2000.
@article{Craven200069,
  abstract    = {The World Wide Web is a vast source of information accessible to computers, but understandable only to humans. The goal of the research described here is to automatically create a computer understandable knowledge base whose content mirrors that of the World Wide Web. Such a knowledge base would enable much more effective retrieval of Web information, and promote new uses of the Web to support knowledge-based inference and problem solving. Our approach is to develop a trainable information extraction system that takes two inputs. The first is an ontology that defines the classes (e.g., company, person, employee, product) and relations (e.g., employed_by, produced_by) of interest when creating the knowledge base. The second is a set of training data consisting of labeled regions of hypertext that represent instances of these classes and relations. Given these inputs, the system learns to extract information from other pages and hyperlinks on the Web. This article describes our general approach, several machine learning algorithms for this task, and promising initial results with a prototype system that has created a knowledge base describing university people, courses, and research projects.},
  added-at    = {2012-02-02T16:13:22.000+0100},
  author      = {Craven, Mark and DiPasquo, Dan and Freitag, Dayne and McCallum, Andrew and Mitchell, Tom and Nigam, Kamal and Slattery, Se{\'a}n},
  biburl      = {http://www.bibsonomy.org/bibtex/25a061b694a475d34557c7e0a9ff9854b/telekoma},
  description = {Learning to construct knowledge bases from the World Wide Web 10.1016/S0004-3702(00)00004-7 : Artificial Intelligence | ScienceDirect.com},
  doi         = {10.1016/S0004-3702(00)00004-7},
  interhash   = {68683ddac8974e9b3867c4b076a2b52f},
  intrahash   = {5a061b694a475d34557c7e0a9ff9854b},
  issn        = {0004-3702},
  journal     = {Artificial Intelligence},
  keywords    = {ai bachelor:2011:bachmann naiveBayes webclassificatoion www},
  number      = {1--2},
  pages       = {69--113},
  title       = {Learning to construct knowledge bases from the {World Wide Web}},
  url         = {http://www.sciencedirect.com/science/article/pii/S0004370200000047},
  volume      = 118,
  year        = 2000,
}

% Conference paper: CNSM 2011.
@inproceedings{conf/cnsm/CravenLLRS11,
  added-at    = {2011-12-27T00:00:00.000+0100},
  author      = {Craven, Robert and Lobo, Jorge and Lupu, Emil and Russo, Alessandra and Sloman, Morris},
  biburl      = {http://www.bibsonomy.org/bibtex/2b5d8fdd4bda6a36180332df1ff4cf51b/dblp},
  booktitle   = {CNSM},
  crossref    = {conf/cnsm/2011},
  ee          = {http://ieeexplore.ieee.org/xpl/freeabs_all.jsp?arnumber=6103981},
  interhash   = {9882ad215bb32fba2e4fb3afd5a5c453},
  intrahash   = {b5d8fdd4bda6a36180332df1ff4cf51b},
  isbn        = {978-1-4577-1588-4},
  keywords    = {dblp},
  pages       = {1--9},
  publisher   = {IEEE},
  title       = {Policy refinement: Decomposition and operationalization for dynamic domains},
  url         = {http://dblp.uni-trier.de/db/conf/cnsm/cnsm2011.html#CravenLLRS11},
  year        = 2011,
}

% Conference paper: AAAI/IAAI 1998.
@inproceedings{conf/aaai/CravenFMMNS98,
  added-at    = {2011-12-23T00:00:00.000+0100},
  author      = {Craven, Mark and DiPasquo, Dan and Freitag, Dayne and McCallum, Andrew and Mitchell, Tom M. and Nigam, Kamal and Slattery, Se{\'a}n},
  biburl      = {http://www.bibsonomy.org/bibtex/2cacaad360450a36338bdc94a7cb326b4/dblp},
  booktitle   = {AAAI/IAAI},
  crossref    = {conf/aaai/1998},
  editor      = {Mostow, Jack and Rich, Chuck},
  ee          = {http://www.aaai.org/Conferences/AAAI/aaai98.php},
  interhash   = {42e8183f7f62885a9d4c369a42c8ed4d},
  intrahash   = {cacaad360450a36338bdc94a7cb326b4},
  isbn        = {0-262-51098-7},
  keywords    = {dblp},
  pages       = {509--516},
  publisher   = {AAAI Press / The MIT Press},
  title       = {Learning to Extract Symbolic Knowledge from the {World Wide Web}},
  url         = {http://dblp.uni-trier.de/db/conf/aaai/aaai98.html#CravenFMMNS98},
  year        = 1998,
}

% Conference paper: ACM Multimedia 2000.
@inproceedings{conf/mm/GreenhalghPBCDT00,
  added-at    = {2011-12-23T00:00:00.000+0100},
  author      = {Greenhalgh, Chris and Purbrick, Jim and Benford, Steve and Craven, Michael P. and Drozd, Adam and Taylor, Ian},
  biburl      = {http://www.bibsonomy.org/bibtex/2a3d3bfc23ef77c4a70b21ed2d9e19378/dblp},
  booktitle   = {ACM Multimedia},
  crossref    = {conf/mm/2000},
  doi         = {10.1145/354384.354429},
  editor      = {Ghandeharizadeh, Shahram and Chang, Shih-Fu and Fischer, Stephen and Konstan, Joseph A. and Nahrstedt, Klara},
  ee          = {http://doi.acm.org/10.1145/354384.354429},
  interhash   = {bea37fdf0df49d21bd2d9be1c8665e1f},
  intrahash   = {a3d3bfc23ef77c4a70b21ed2d9e19378},
  isbn        = {1-58113-198-4},
  keywords    = {dblp},
  pages       = {67--74},
  publisher   = {ACM},
  title       = {Temporal links: recording and replaying virtual environments},
  url         = {http://dblp.uni-trier.de/db/conf/mm/mm2000.html#GreenhalghPBCDT00},
  year        = 2000,
}

% Conference paper: ML 1991.
@inproceedings{conf/icml/TowellCS91,
  added-at    = {2011-12-23T00:00:00.000+0100},
  author      = {Towell, Geoffrey G. and Craven, Mark and Shavlik, Jude W.},
  biburl      = {http://www.bibsonomy.org/bibtex/2c96ea3f9f8c14a3afed71a76c2ad4b43/dblp},
  booktitle   = {ML},
  crossref    = {conf/icml/1991},
  editor      = {Birnbaum, Lawrence and Collins, Gregg},
  interhash   = {bea24a8e240c433838a0d0689eb94f20},
  intrahash   = {c96ea3f9f8c14a3afed71a76c2ad4b43},
  isbn        = {1-55860-200-3},
  keywords    = {dblp},
  pages       = {213--217},
  publisher   = {Morgan Kaufmann},
  title       = {Constructive Induction in Knowledge-Based Neural Networks},
  url         = {http://dblp.uni-trier.de/db/conf/icml/ml1991.html#TowellCS91},
  year        = 1991,
}

% Conference paper: ICML 1994.
@inproceedings{conf/icml/CravenS94,
  added-at    = {2011-12-23T00:00:00.000+0100},
  author      = {Craven, Mark and Shavlik, Jude W.},
  biburl      = {http://www.bibsonomy.org/bibtex/2e3cb86a3c3666eb5f9b170bfa27ee5c1/dblp},
  booktitle   = {ICML},
  crossref    = {conf/icml/1994},
  editor      = {Cohen, William W. and Hirsh, Haym},
  interhash   = {294aa62047fa047d4c92d5e4416fbb68},
  intrahash   = {e3cb86a3c3666eb5f9b170bfa27ee5c1},
  isbn        = {1-55860-335-2},
  keywords    = {dblp},
  pages       = {37--45},
  publisher   = {Morgan Kaufmann},
  title       = {Using Sampling and Queries to Extract Rules from Trained Neural Networks},
  url         = {http://dblp.uni-trier.de/db/conf/icml/icml1994.html#CravenS94},
  year        = 1994,
}

% Conference paper: ICML 1993.
@inproceedings{conf/icml/CravenS93,
  added-at    = {2011-12-23T00:00:00.000+0100},
  author      = {Craven, Mark and Shavlik, Jude W.},
  biburl      = {http://www.bibsonomy.org/bibtex/2e9f1b728dde4f67554315c7836010673/dblp},
  booktitle   = {ICML},
  crossref    = {conf/icml/1993},
  interhash   = {dbb91c990757eeaa6d31180014f52e23},
  intrahash   = {e9f1b728dde4f67554315c7836010673},
  isbn        = {1-55860-307-7},
  keywords    = {dblp},
  pages       = {73--80},
  publisher   = {Morgan Kaufmann},
  title       = {Learning Symbolic Rules Using Artificial Neural Networks},
  url         = {http://dblp.uni-trier.de/db/conf/icml/icml1993.html#CravenS93},
  year        = 1993,
}

% Conference paper: CHI 2001.
@inproceedings{conf/chi/CravenTDPGBFBJLH01,
  added-at    = {2011-12-21T00:00:00.000+0100},
  author      = {Craven, Michael P. and Taylor, Ian and Drozd, Adam and Purbrick, Jim and Greenhalgh, Chris and Benford, Steve and Fraser, Mike and Bowers, John and J{\"a}{\"a}-Aro, Kai-Mikael and Lintermann, Bernd and Hoch, Michael},
  biburl      = {http://www.bibsonomy.org/bibtex/243c9a610c68af48d04df0be5b4bb272b/dblp},
  booktitle   = {CHI},
  crossref    = {conf/chi/2001},
  doi         = {10.1145/365024.365032},
  editor      = {Jacko, Julie A. and Sears, Andrew},
  ee          = {http://doi.acm.org/10.1145/365024.365032},
  interhash   = {d2e13aeebef13e6668cfe3fd1a84710a},
  intrahash   = {43c9a610c68af48d04df0be5b4bb272b},
  isbn        = {1-58113-327-8},
  keywords    = {dblp},
  pages       = {30--37},
  publisher   = {ACM},
  title       = {Exploiting interactivity, influence, space and time to explore non-linear drama in virtual worlds},
  url         = {http://dblp.uni-trier.de/db/conf/chi/chi2001.html#CravenTDPGBFBJLH01},
  year        = 2001,
}

% Conference paper: UAI 2008.
@inproceedings{conf/uai/NotoC08,
  added-at    = {2011-12-15T00:00:00.000+0100},
  author      = {Noto, Keith and Craven, Mark},
  biburl      = {http://www.bibsonomy.org/bibtex/22a6b3ffdd041a13a64e6b7349e8e3cd1/dblp},
  booktitle   = {UAI},
  crossref    = {conf/uai/2008},
  editor      = {McAllester, David A. and Myllym{\"a}ki, Petri},
  ee          = {http://uai.sis.pitt.edu/displayArticleDetails.jsp?mmnu=1&smnu=2&article_id=1339&proceeding_id=24},
  interhash   = {a09881db5467f4bf82615b5418aae66e},
  intrahash   = {2a6b3ffdd041a13a64e6b7349e8e3cd1},
  isbn        = {0-9749039-4-9},
  keywords    = {dblp},
  pages       = {444--451},
  publisher   = {AUAI Press},
  title       = {Learning Hidden {Markov} Models for Regression using Path Aggregation},
  url         = {http://dblp.uni-trier.de/db/conf/uai/uai2008.html#NotoC08},
  year        = 2008,
}

% Journal article: Presence 10(1), 2001.
@article{journals/presence/GreenhalghBC01,
  added-at    = {2011-11-28T00:00:00.000+0100},
  author      = {Greenhalgh, Chris and Benford, Steve and Craven, Michael P.},
  biburl      = {http://www.bibsonomy.org/bibtex/2c1169ac1650748f65e060943387a509d/dblp},
  doi         = {10.1162/105474601750182306},
  ee          = {http://dx.doi.org/10.1162/105474601750182306},
  interhash   = {cdcf8d10881b55b48a7ed430e913da3f},
  intrahash   = {c1169ac1650748f65e060943387a509d},
  journal     = {Presence},
  keywords    = {dblp},
  number      = 1,
  pages       = {35--50},
  title       = {Patterns of Network and User Activity in an Inhabited Television Event},
  url         = {http://dblp.uni-trier.de/db/journals/presence/presence10.html#GreenhalghBC01},
  volume      = 10,
  year        = 2001,
}

% Encyclopedia chapter: Encyclopedia of Optimization, 2009.
@incollection{reference/opt/Craven09,
  added-at    = {2011-11-25T00:00:00.000+0100},
  author      = {Craven, B. D.},
  biburl      = {http://www.bibsonomy.org/bibtex/2e949e1c7a2b33056d6b7157cde76df9c/dblp},
  booktitle   = {Encyclopedia of Optimization},
  crossref    = {reference/opt/2009},
  doi         = {10.1007/978-0-387-74759-0_310},
  editor      = {Floudas, Christodoulos A. and Pardalos, Panos M.},
  ee          = {http://dx.doi.org/10.1007/978-0-387-74759-0_310},
  interhash   = {9d9e21b5853a15229fc13617ae7eca07},
  intrahash   = {e949e1c7a2b33056d6b7157cde76df9c},
  isbn        = {978-0-387-74758-3},
  keywords    = {dblp},
  pages       = {1770--1774},
  publisher   = {Springer},
  title       = {Invexity and its Applications},
  url         = {http://dblp.uni-trier.de/db/reference/opt/opt2009.html#Craven09},
  year        = 2009,
}

% Journal article: Advances in Internet of Things 1(2), 2011.
@article{journals/ait/BhanuSCBHGG11,
  added-at    = {2011-11-09T00:00:00.000+0100},
  author      = {Bhanu, Harakrishnan and Schwier, Jason M. and Craven, Ryan and Brooks, Richard R. and Hempstalk, Kathryn and Gunetti, Daniele and Griffin, Christopher},
  biburl      = {http://www.bibsonomy.org/bibtex/2642f199e867387bd947f773e2f0e2775/dblp},
  doi         = {10.4236/ait.2011.12003},
  ee          = {http://dx.doi.org/10.4236/ait.2011.12003},
  interhash   = {ef3e85f65f3971143a334f7029871e20},
  intrahash   = {642f199e867387bd947f773e2f0e2775},
  journal     = {Advances in Internet of Things},
  keywords    = {dblp},
  number      = 2,
  pages       = {13--26},
  title       = {Side-Channel Analysis for Detecting Protocol Tunneling},
  url         = {http://dblp.uni-trier.de/db/journals/ait/ait1.html#BhanuSCBHGG11},
  volume      = 1,
  year        = 2011,
}

% Journal article: First Monday 10(4), 2005 (no page numbers in the source record).
@article{journals/firstmonday/Craven05,
  added-at    = {2011-11-08T00:00:00.000+0100},
  author      = {Craven, Timothy C.},
  biburl      = {http://www.bibsonomy.org/bibtex/218d78e3f87c055b67297adf89ec69243/dblp},
  ee          = {http://firstmonday.org/htbin/cgiwrap/bin/ojs/index.php/fm/article/view/1224},
  interhash   = {31c600c1b9c4901111811ac534c040a3},
  intrahash   = {18d78e3f87c055b67297adf89ec69243},
  journal     = {First Monday},
  keywords    = {dblp},
  number      = 4,
  title       = {Where does {Web} bibliographies' author information come from?},
  url         = {http://dblp.uni-trier.de/db/journals/firstmonday/firstmonday10.html#Craven05},
  volume      = 10,
  year        = 2005,
}

% Journal article: First Monday 6(10), 2001 (no page numbers in the source record).
@article{journals/firstmonday/Craven01,
  added-at    = {2011-11-08T00:00:00.000+0100},
  author      = {Craven, Timothy C.},
  biburl      = {http://www.bibsonomy.org/bibtex/2a4754ef624c3857c805b7cba07fab458/dblp},
  ee          = {http://firstmonday.org/htbin/cgiwrap/bin/ojs/index.php/fm/article/view/895},
  interhash   = {5607f7ebd1387e22dc59917e5617fa29},
  intrahash   = {a4754ef624c3857c805b7cba07fab458},
  journal     = {First Monday},
  keywords    = {dblp},
  number      = 10,
  title       = {Changes in Metatag Descriptions Over Time},
  url         = {http://dblp.uni-trier.de/db/journals/firstmonday/firstmonday6.html#Craven01},
  volume      = 6,
  year        = 2001,
}

% Conference paper: FPL 2011.
@inproceedings{conf/fpl/IskanderPC11,
  added-at    = {2011-10-24T00:00:00.000+0200},
  author      = {Iskander, Yousef and Patterson, Cameron and Craven, Stephen D.},
  biburl      = {http://www.bibsonomy.org/bibtex/2ae744d33bcff39dff61c01454e529190/dblp},
  booktitle   = {FPL},
  crossref    = {conf/fpl/2011},
  doi         = {10.1109/FPL.2011.102},
  ee          = {http://doi.ieeecomputersociety.org/10.1109/FPL.2011.102},
  interhash   = {c0c362ee0c87d87ef3ca8711d26d4640},
  intrahash   = {ae744d33bcff39dff61c01454e529190},
  isbn        = {978-1-4577-1484-9},
  keywords    = {dblp},
  pages       = {518--523},
  publisher   = {IEEE},
  title       = {Improved Abstractions and Turnaround Time for {FPGA} Design Validation and Debug},
  url         = {http://dblp.uni-trier.de/db/conf/fpl/fpl2011.html#IskanderPC11},
  year        = 2011,
}

% Journal article: Fluid Phase Equilibria 130(1--2), 1997.
@article{Elhassan1997167,
  abstract    = {The Area method, developed recently for solving multicomponent phase equilibrium problems, has been extended to pure fluids. The method is based on maximizing a single objective function in the Helmholtz-volume surface along any given isotherm, which reduces the number of independent variables to only two: the saturated liquid and vapour volumes. Two techniques are employed to find the maximum of the objective function, the integral and iterative. The integral always finds the thermodynamically stable solution without any prior assumptions about the values of the molar volumes. This factor distinguishes the integral from the iterative technique and also from methods based on the Maxwell equal-area principle. The method has been applied to a group of high accuracy non-cubic equations of state and some of the thermodynamic inconsistencies which occur inside the two-phase region are explored. A new inequality constraint which eliminates these inconsistencies during the development of new equations of state is proposed, and initial results with fitting a preliminary Helmholtz equation of state for benzene are encouraging.},
  added-at    = {2011-10-11T19:16:07.000+0200},
  author      = {Elhassan, A. E. and Craven, R. J. B. and de Reuck, K. M.},
  biburl      = {http://www.bibsonomy.org/bibtex/20fa6c686bbe75b565d3ab583caa4a2df/thorade},
  doi         = {10.1016/S0378-3812(96)03222-0},
  interhash   = {66dede91c9ef10d82f113060e1dbd843},
  intrahash   = {0fa6c686bbe75b565d3ab583caa4a2df},
  issn        = {0378-3812},
  journal     = {Fluid Phase Equilibria},
  keywords    = {1997 equation-of-state equilibrium two-phase},
  number      = {1--2},
  pages       = {167--187},
  title       = {The {Area} method for pure fluids and an analysis of the two-phase region},
  url         = {http://dx.doi.org/10.1016/S0378-3812(96)03222-0},
  volume      = 130,
  year        = 1997,
}

% Conference paper: IWCMC 2011.
@inproceedings{conf/iwcmc/BhanuSCOGB11,
  added-at    = {2011-09-15T00:00:00.000+0200},
  author      = {Bhanu, Harakrishnan and Schwier, Jason M. and Craven, Ryan and Ozcelik, Ilker and Griffin, Christopher and Brooks, Richard R.},
  biburl      = {http://www.bibsonomy.org/bibtex/2797ae280336f7d092a9c466a34befbb0/dblp},
  booktitle   = {IWCMC},
  crossref    = {conf/iwcmc/2011},
  doi         = {10.1109/IWCMC.2011.5982729},
  ee          = {http://dx.doi.org/10.1109/IWCMC.2011.5982729},
  interhash   = {fcb1f1d60d99fdb6b27479661cd0920f},
  intrahash   = {797ae280336f7d092a9c466a34befbb0},
  isbn        = {978-1-4244-9539-9},
  keywords    = {dblp},
  pages       = {1310--1314},
  publisher   = {IEEE},
  title       = {Noise tolerant symbolic learning of {Markov} models of tunneled protocols},
  url         = {http://dblp.uni-trier.de/db/conf/iwcmc/iwcmc2011.html#BhanuSCOGB11},
  year        = 2011,
}

% Conference paper: IJCAI 2011.
@inproceedings{conf/ijcai/AndrzejewskiZCR11,
  added-at    = {2011-08-09T00:00:00.000+0200},
  author      = {Andrzejewski, David and Zhu, Xiaojin and Craven, Mark and Recht, Benjamin},
  biburl      = {http://www.bibsonomy.org/bibtex/25b10cec21982b18ee7c05f3b0874308b/dblp},
  booktitle   = {IJCAI},
  crossref    = {conf/ijcai/2011},
  editor      = {Walsh, Toby},
  ee          = {http://ijcai.org/papers11/Papers/IJCAI11-200.pdf},
  interhash   = {cd99d0f45a9b1f50c71dd20e88f21ae4},
  intrahash   = {5b10cec21982b18ee7c05f3b0874308b},
  isbn        = {978-1-57735-516-8},
  keywords    = {dblp},
  pages       = {1171--1177},
  publisher   = {IJCAI/AAAI},
  title       = {A Framework for Incorporating General Domain Knowledge into Latent {Dirichlet} Allocation Using First-Order Logic},
  url         = {http://dblp.uni-trier.de/db/conf/ijcai/ijcai2011.html#AndrzejewskiZCR11},
  year        = 2011,
}

% Workshop paper: Regulatory Genomics 2004 (Lecture Notes in Computer Science 3318).
@inproceedings{conf/recomb/NotoC04,
  added-at    = {2011-08-08T00:00:00.000+0200},
  author      = {Noto, Keith and Craven, Mark},
  biburl      = {http://www.bibsonomy.org/bibtex/2c643ee3164a5b48339cba662803591ae/dblp},
  booktitle   = {Regulatory Genomics},
  crossref    = {conf/recomb/2004rrg},
  doi         = {10.1007/978-3-540-32280-1_6},
  editor      = {Eskin, Eleazar and Workman, Christopher T.},
  ee          = {http://dx.doi.org/10.1007/978-3-540-32280-1_6},
  interhash   = {0a7c774206d092adfbe6d2a7f012a860},
  intrahash   = {c643ee3164a5b48339cba662803591ae},
  isbn        = {3-540-24456-5},
  keywords    = {dblp},
  pages       = {52--64},
  publisher   = {Springer},
  series      = {Lecture Notes in Computer Science},
  title       = {Learning Regulatory Network Models that Represent Regulator States and Roles},
  url         = {http://dblp.uni-trier.de/db/conf/recomb/rrg2004.html#NotoC04},
  volume      = 3318,
  year        = 2004,
}

% Journal article: Journal of Combinatorial Theory, Series A 29(2), 1980.
@article{journals/jct/Craven80,
  added-at    = {2011-08-03T00:00:00.000+0200},
  author      = {Craven, Thomas C.},
  biburl      = {http://www.bibsonomy.org/bibtex/20deacaad6847da6539336c203af441ba/dblp},
  doi         = {10.1016/0097-3165(80)90006-0},
  ee          = {http://dx.doi.org/10.1016/0097-3165(80)90006-0},
  interhash   = {ff01a1a91f4465eed5fb532a0d112adc},
  intrahash   = {0deacaad6847da6539336c203af441ba},
  journal     = {Journal of Combinatorial Theory, Series A},
  keywords    = {dblp},
  number      = 2,
  pages       = {174--181},
  title       = {An Application of {P{\'o}lya's} Theory of Counting to an Enumeration Problem Arising in Quadratic Form Theory},
  url         = {http://dblp.uni-trier.de/db/journals/jct/jcta29.html#Craven80},
  volume      = 29,
  year        = 1980,
}