<?xml version="1.0"?>

<!DOCTYPE owl [
  <!ENTITY rdf "http://www.w3.org/1999/02/22-rdf-syntax-ns#">
  <!ENTITY rdfs "http://www.w3.org/2000/01/rdf-schema#">
  <!ENTITY xsd "http://www.w3.org/2001/XMLSchema#">
  <!ENTITY owl "http://www.w3.org/2002/07/owl#">
  <!ENTITY cc "http://web.resource.org/cc/#">
  <!ENTITY project "http://ebiquity.umbc.edu/ontology/project.owl#">
  <!ENTITY person "http://ebiquity.umbc.edu/ontology/person.owl#">
  <!ENTITY pub "http://ebiquity.umbc.edu/ontology/publication.owl#">
  <!ENTITY assert "http://ebiquity.umbc.edu/ontology/assertion.owl#">]>

<!--
  This ontology document is licensed under the Creative Commons
  Attribution License. To view a copy of this license, visit
  http://creativecommons.org/licenses/by/2.0/ or send a letter to
  Creative Commons, 559 Nathan Abbott Way, Stanford, California
  94305, USA.
-->

<rdf:RDF 
  xmlns:rdf = "&rdf;"
  xmlns:rdfs = "&rdfs;"
  xmlns:xsd = "&xsd;"
  xmlns:owl = "&owl;"
  xmlns:cc = "&cc;"
  xmlns:project = "&project;"
  xmlns:person = "&person;"
  xmlns:pub = "&pub;"
  xmlns:assert = "&assert;">
  <!--
    Publication record (conference paper) identified by its ebiquity URL.
    Literal text is wrapped in CDATA so that punctuation in titles and
    abstracts never needs entity escaping.
  -->
  <pub:InProceedings rdf:about="http://ebiquity.umbc.edu/paper/html/id/269/SVMs-for-the-Blogosphere-Blog-Identification-and-Splog-Detection">
    <rdfs:label><![CDATA[SVMs for the Blogosphere: Blog Identification and Splog Detection]]></rdfs:label>
    <pub:title><![CDATA[SVMs for the Blogosphere: Blog Identification and Splog Detection]]></pub:title>
    <pub:publishedOn rdf:datatype="&xsd;dateTime">2006-03-27T00:00:00-05:00</pub:publishedOn>
    <pub:abstract><![CDATA[Weblogs, or blogs have become an important new way to publish
information, engage in discussions and form communities. The
increasing popularity of blogs has given rise to search and analysis
engines focusing on the 'blogosphere'.  A key requirement of such
systems is to identify blogs as they crawl the Web.
While this ensures that only blogs are indexed, blog search engines
are also often overwhelmed by spam blogs (splogs). Splogs not only
incur computational overheads but also reduce user satisfaction. In
this paper we first describe our experiments on blog identification
using Support Vector Machines (SVM). We compare results of using
different feature sets and introduce new features for blog
identification. We then report preliminary results on splog detection
and identify future work.]]></pub:abstract>
    <pub:note><![CDATA[Also available as technical report TR-CS-05-13]]></pub:note>
    <pub:organization><![CDATA[Computer Science and Electrical Engineering]]></pub:organization>
    <pub:counter>6020</pub:counter>
    <pub:googleKey>EGVbfbEUYT4J</pub:googleKey>
    <pub:googleCitations>79</pub:googleCitations>
    <!--
      Each tag is stated once. An RDF graph is a set of statements, so
      repeating an identical pub:tag literal adds nothing to the graph.
    -->
    <pub:tag><![CDATA[blog]]></pub:tag>
    <pub:tag><![CDATA[splog]]></pub:tag>
    <pub:tag><![CDATA[blogosphere]]></pub:tag>
    <pub:tag><![CDATA[categorization]]></pub:tag>
    <pub:tag><![CDATA[metadata]]></pub:tag>
    <pub:tag><![CDATA[web spam]]></pub:tag>
    <pub:tag><![CDATA[learning]]></pub:tag>
    <pub:tag><![CDATA[spam]]></pub:tag>
    <pub:booktitle><![CDATA[AAAI Spring Symposium on Computational Approaches to Analysing Weblogs]]></pub:booktitle>
    <pub:publisher><![CDATA[University of Maryland, Baltimore County]]></pub:publisher>
    <!--
      Authors as an ordered RDF list: each rdf:first holds one person and
      each rdf:rest holds the remainder, terminated by rdf:nil.
    -->
    <pub:author>
       <rdf:List>
         <rdf:first><person:Alumnus rdf:about="http://ebiquity.umbc.edu/person/html/Pranam/Kolari/"><person:name><![CDATA[Pranam  Kolari]]></person:name><rdfs:label><![CDATA[Pranam  Kolari]]></rdfs:label></person:Alumnus></rdf:first>
         <rdf:rest>
           <rdf:List>
             <rdf:first><person:PrincipalFaculty rdf:about="http://ebiquity.umbc.edu/person/html/Tim/Finin/"><person:name><![CDATA[Tim  Finin]]></person:name><rdfs:label><![CDATA[Tim  Finin]]></rdfs:label></person:PrincipalFaculty></rdf:first>
             <rdf:rest>
               <rdf:List>
                 <rdf:first><person:PrincipalFaculty rdf:about="http://ebiquity.umbc.edu/person/html/Anupam/Joshi/"><person:name><![CDATA[Anupam  Joshi]]></person:name><rdfs:label><![CDATA[Anupam  Joshi]]></rdfs:label></person:PrincipalFaculty></rdf:first>
                 <rdf:rest rdf:resource="&rdf;nil" />
               </rdf:List>
             </rdf:rest>
           </rdf:List>
         </rdf:rest>
       </rdf:List>
    </pub:author>
    <!-- Same resource URI as the first entry of the author list above. -->
    <pub:firstAuthor><person:Alumnus rdf:about="http://ebiquity.umbc.edu/person/html/Pranam/Kolari/"><person:name><![CDATA[Pranam  Kolari]]></person:name><rdfs:label><![CDATA[Pranam  Kolari]]></rdfs:label></person:Alumnus></pub:firstAuthor>
    <pub:relatedProject><project:PastProject rdf:about="http://ebiquity.umbc.edu/project/html/id/68/memeta"><project:title><![CDATA[memeta]]></project:title><rdfs:label><![CDATA[memeta]]></rdfs:label></project:PastProject></pub:relatedProject>
    <pub:relatedProject><project:PastProject rdf:about="http://ebiquity.umbc.edu/project/html/id/56/Semantic-Discovery-Discovering-Complex-Relationships-in-Semantic-Web"><project:title><![CDATA[Semantic Discovery: Discovering Complex Relationships in Semantic Web]]></project:title><rdfs:label><![CDATA[Semantic Discovery: Discovering Complex Relationships in Semantic Web]]></rdfs:label></project:PastProject></pub:relatedProject>
    <!--
      Downloadable copies, one anonymous pub:SoftCopy node per file.
      NOTE(review): pub:softCopySize is presumably a byte count; the unit
      is not stated in this document, so confirm against the ontology.
    -->
    <pub:softCopy><pub:SoftCopy>
      <pub:softCopyFormat><![CDATA[PDF Document]]></pub:softCopyFormat>
      <pub:softCopyURI><![CDATA[http://ebiquity.umbc.edu/get/a/publication/213.pdf]]></pub:softCopyURI>
      <pub:softCopySize>100493</pub:softCopySize>
    </pub:SoftCopy></pub:softCopy>
    <pub:softCopy><pub:SoftCopy>
      <pub:softCopyFormat><![CDATA[Microsoft PowerPoint]]></pub:softCopyFormat>
      <pub:softCopyURI><![CDATA[http://ebiquity.umbc.edu/get/a/publication/264.ppt]]></pub:softCopyURI>
      <pub:softCopySize>4669952</pub:softCopySize>
    </pub:SoftCopy></pub:softCopy>
  </pub:InProceedings>

  <!--
    Metadata about this document itself: the empty rdf:about is a relative
    reference that resolves to the document's own base URI. The statement
    links the document to the Creative Commons Attribution 2.0 licence URI.
    NOTE(review): cc:License is capitalised like a class name but is used
    here in property position; the Creative Commons vocabulary presumably
    intends the lowercase "license" property. Any change would also need
    the cc namespace URI checked, and would alter the predicate that
    existing consumers see, so confirm before editing.
  -->
  <rdf:Description rdf:about="">
    <cc:License rdf:resource="http://creativecommons.org/licenses/by/2.0/" />
  </rdf:Description>

</rdf:RDF>
