<?xml version="1.0"?>

<!--
  Internal DTD subset: declares one general entity per namespace IRI so the
  IRIs can be written as &name; in the xmlns declarations and in attribute
  values of the document body.
-->
<!DOCTYPE rdf:RDF [
  <!-- The document type name must equal the root element name (rdf:RDF)
       for the document to be valid, not merely well-formed. -->
  <!ENTITY rdf "http://www.w3.org/1999/02/22-rdf-syntax-ns#">
  <!ENTITY rdfs "http://www.w3.org/2000/01/rdf-schema#">
  <!ENTITY xsd "http://www.w3.org/2001/XMLSchema#">
  <!ENTITY owl "http://www.w3.org/2002/07/owl#">
  <!-- Creative Commons metadata namespace. It ends in "/" with no "#":
       RDF/XML concatenates namespace and local name, so a trailing "#"
       would yield IRIs that are not part of the CC vocabulary. -->
  <!ENTITY cc "http://web.resource.org/cc/">
  <!-- ebiquity vocabularies -->
  <!ENTITY project "http://ebiquity.umbc.edu/ontology/project.owl#">
  <!ENTITY person "http://ebiquity.umbc.edu/ontology/person.owl#">
  <!ENTITY pub "http://ebiquity.umbc.edu/ontology/publication.owl#">
  <!ENTITY assert "http://ebiquity.umbc.edu/ontology/assertion.owl#">]>

<!--
  This ontology document is licensed under the Creative Commons
  Attribution License. To view a copy of this license, visit
  http://creativecommons.org/licenses/by/2.0/ or send a letter to
  Creative Commons, 559 Nathan Abbott Way, Stanford, California
  94305, USA.
-->

<!-- Root element: binds every prefix used in this document to the
     namespace IRI held by the same-named entity in the DTD subset. -->
<rdf:RDF
  xmlns:rdf="&rdf;"
  xmlns:rdfs="&rdfs;"
  xmlns:xsd="&xsd;"
  xmlns:owl="&owl;"
  xmlns:cc="&cc;"
  xmlns:project="&project;"
  xmlns:person="&person;"
  xmlns:pub="&pub;"
  xmlns:assert="&assert;">
  <!-- Publication-resource record for the "Splog Blog Dataset". -->
  <pub:Resource rdf:about="http://ebiquity.umbc.edu/resource/html/id/212/Splog-Blog-Dataset">
    <rdfs:label><![CDATA[Splog Blog Dataset]]></rdfs:label>
    <pub:title><![CDATA[Splog Blog Dataset]]></pub:title>
    <pub:publishedOn rdf:datatype="&xsd;dateTime">2006-11-14T00:00:00-05:00</pub:publishedOn>
    <!-- The description is an HTML fragment carried verbatim inside CDATA;
         whitespace and markup inside it are literal data. -->
    <pub:description><![CDATA[<p>
This dataset consists of 3000 blog homepages, out of which 700 have been labeled as splogs, and another 700 as authentic blogs.
</p>
<p>
This training set was used in results of three papers, with emphasis on identifying blogs [1], on detecting spam blogs [2], and on analysing the splogosphere [3].
</p>
<p>
This collection can be used in further experimenting with splogs, or for building filters that could be deployed in real world systems. We, and our academic and industrial collaborators have been using such filters to eliminate spam blogs, with good results.
</p>
<BR/>
[1] Pranam Kolari, Tim Finin, Anupam Joshi, <a href="http://ebiquity.umbc.edu/paper/html/id/269/SVMs-for-the-Blogosphere-Blog-Identification-and-Splog-Detection">SVMs for the Blogosphere: Blog Identification and Splog Detection</a>, AAAI Spring Symposium on Computational Approaches to Analysing Weblogs, March 2006 <BR/>
[2] Pranam Kolari, Akshay Java, Tim Finin, Tim Oates, Anupam Joshi, <a href="http://ebiquity.umbc.edu/paper/html/id/296/Detecting-Spam-Blogs-A-Machine-Learning-Approach">Detecting Spam Blogs: A Machine Learning Approach</a>, Proceedings of the 21st National Conference on Artificial Intelligence (AAAI 2006), July 2006 <BR/>
[3] Pranam Kolari, Akshay Java, Tim Finin, <a href="http://ebiquity.umbc.edu/paper/html/id/299/Characterizing-the-Splogosphere">Characterizing the Splogosphere</a>, 3rd Annual Workshop on Weblogging Ecosystem: Aggregation, Analysis and Dynamics, 15th World Wide Web Conference, May 2006]]></pub:description>
    <pub:counter>1468</pub:counter>
    <!-- Ordered author list, written as an explicit rdf:List chain
         (rdf:first / rdf:rest) terminated by rdf:nil. -->
    <pub:author>
      <rdf:List>
        <rdf:first>
          <person:Alumnus rdf:about="http://ebiquity.umbc.edu/person/html/Pranam/Kolari/">
            <person:name><![CDATA[Pranam  Kolari]]></person:name>
            <rdfs:label><![CDATA[Pranam  Kolari]]></rdfs:label>
          </person:Alumnus>
        </rdf:first>
        <rdf:rest>
          <!-- NOTE(review): the source record had a list cell here whose
               rdf:first was empty, which RDF/XML reads as the empty string
               literal rather than a person. The cell was dropped so the
               list contains only real author nodes. An author entry was
               presumably lost at this (second) position; restore it once
               the intended person is confirmed. -->
          <rdf:List>
            <rdf:first>
              <person:Alumnus rdf:about="http://ebiquity.umbc.edu/person/html/Akshay/Java/">
                <person:name><![CDATA[Akshay  Java]]></person:name>
                <rdfs:label><![CDATA[Akshay  Java]]></rdfs:label>
              </person:Alumnus>
            </rdf:first>
            <rdf:rest>
              <rdf:List>
                <rdf:first>
                  <person:PrincipalFaculty rdf:about="http://ebiquity.umbc.edu/person/html/Anupam/Joshi/">
                    <person:name><![CDATA[Anupam  Joshi]]></person:name>
                    <rdfs:label><![CDATA[Anupam  Joshi]]></rdfs:label>
                  </person:PrincipalFaculty>
                </rdf:first>
                <rdf:rest rdf:resource="&rdf;nil" />
              </rdf:List>
            </rdf:rest>
          </rdf:List>
        </rdf:rest>
      </rdf:List>
    </pub:author>
    <!-- Repeats the head of the author list as a direct property. -->
    <pub:firstAuthor>
      <person:Alumnus rdf:about="http://ebiquity.umbc.edu/person/html/Pranam/Kolari/">
        <person:name><![CDATA[Pranam  Kolari]]></person:name>
        <rdfs:label><![CDATA[Pranam  Kolari]]></rdfs:label>
      </person:Alumnus>
    </pub:firstAuthor>
  </pub:Resource>

  <!-- Licence statement about this document itself: rdf:about="" resolves
       to the document's own base IRI. The property is cc:license
       (lowercase); cc:License is the class of licence resources and must
       not be used as a property element. -->
  <rdf:Description rdf:about="">
    <cc:license rdf:resource="http://creativecommons.org/licenses/by/2.0/" />
  </rdf:Description>

</rdf:RDF>
