<?xml version="1.0" encoding="UTF-8"?>

<rss version='2.0' 
     xmlns:creativeCommons="http://backend.userland.com/creativeCommonsRssModule"
     xmlns:doap="http://usefulinc.com/ns/doap#"
     xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">

    <channel>
        <!-- Channel metadata: this feed shows details for the SWiK page "webir"
             and everything recently tagged webir. -->
        <!-- The license URL is kept on a single line so the element value
             carries no trailing newline or indentation. -->
        <creativeCommons:license>http://creativecommons.org/licenses/by-sa/2.5/</creativeCommons:license>
        <title>webir on SWiK</title>
        <doap:name>webir</doap:name>
        <doap:description></doap:description>
        <description></description>
        <!-- NOTE(review): doap:description and description are both empty here;
             RSS 2.0 expects description to describe the channel. TODO supply text. -->
        <link>http://swik.net/webir</link>
        <doap:homepage></doap:homepage>
        <!-- pubDate and lastBuildDate are optional in RSS 2.0 and must hold an
             RFC 822 date when present, so the empty elements are omitted. -->
            
        <item>
            <!-- Entry for a Search Engine Caffè post on current open source
                 search engine libraries (per its title). The description is
                 escaped once only, matching the other items in this feed. -->
            <title>Jeff's Search Engine Caffè: Current Open Source Search Engine Libraries</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Jeff%27s+Search+Engine+Caff%C3%A8%3A+Current+Open+Source+Search+Engine+Libraries/b4x7x</link>
            <description>"Here is my short list of the most important open source [free] information retrieval libraries being used today that are undergoing active development as of writing."</description>
            <pubDate>Sun, 11 May 2008 02:12:47 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for an Amazon Web Services Developer Connection article on
                 running Hadoop MapReduce on EC2 and S3 (per its title). The
                 description is escaped once only, matching the other items. -->
            <title>Amazon Web Services Developer Connection : Running Hadoop MapReduce on Amazon EC2 and Amazon S3</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Amazon+Web+Services+Developer+Connection+%3A+Running+Hadoop+MapReduce+on+Amazon+EC2+and+Amazon+S3/boxdv</link>
            <description>"AWS and Hadoop developer Tom White illustrates how to use Hadoop and Amazon Web Services together using a large collection of web access logs."</description>
            <pubDate>Wed, 03 Oct 2007 10:54:22 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for the COSIN project's WP5 index page (per its title).
                 The description is escaped once only, matching the other items. -->
            <title>COSIN - WP5 - index</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/COSIN+-+WP5+-+index/boxdu</link>
            <description>"The main topic of the COSIN project is to develop a series of theoretical, graphical, analytical and computational tools to describe the complex behaviour of networks."</description>
            <pubDate>Wed, 03 Oct 2007 10:54:21 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for Grub's distributed web crawling project (per its
                 title). The description is escaped once only, matching the
                 other items in this feed. -->
            <title>Grub's Distributed Web Crawling Project</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Grub%27s+Distributed+Web+Crawling+Project/bgla3</link>
            <description>"Grub started back in 2000 with a simple concept of distributing part of the search process pipeline: crawling."</description>
            <pubDate>Sat, 28 Jul 2007 15:32:59 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for WebLA, described below as a Java package for
                 handling Web Graphs. -->
            <title>WebLA :: Web Linkage Analysis</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/WebLA+%3A%3A+Web+Linkage+Analysis/v4hd</link>
            <description>"WebLA is a Java package for handling Web Graphs, implementing popular algorithms such as PageRank, HITS, CoCitation Similarity and SimRank. It is of particular interest for research in Information Retrieval, [...]"</description>
            <pubDate>Thu, 01 Feb 2007 03:25:41 -0800</pubDate>
        </item>
            
        <item>
            <!-- Entry for the Swish-e home page; Swish-e is described below as
                 an open source system for indexing Web pages or other files. -->
            <title>Swish-e :: Home Page</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Swish-e+%3A%3A+Home+Page/uyau</link>
            <description>"Swish-e is a fast, flexible, and free open source system for indexing collections of Web pages or other files. Swish-e is ideally suited for collections of a million documents or smaller."</description>
            <pubDate>Mon, 22 Jan 2007 07:56:56 -0800</pubDate>
        </item>
            
        <item>
            <!-- Entry for Helios (per its title); the feed carries no
                 description text for it. -->
            <title>Helios, Building an Open Source Meta-Search Engine</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Helios%2C+Building+an+Open+Source+Meta-Search+Engine/tn6i</link>
            <description/>
            <pubDate>Tue, 09 Jan 2007 08:51:15 -0800</pubDate>
        </item>
            
        <item>
            <!-- Entry for the TCatNG Toolkit, described below as a Java package
                 for N-Gram based text categorization. -->
            <title>TCatNG Toolkit :: Text Categorization via N-Grams</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/TCatNG+Toolkit+%3A%3A+Text+Categorization+via+N-Grams/dazs</link>
            <description>"The TCatNG Toolkit is a Java package that you can use to apply N-Gram analysis techniques to the process of categorizing text files. [Namely] categorizing documents by topic, detecting the author of a text, or recognizing the language [...]"</description>
            <pubDate>Fri, 28 Apr 2006 10:47:29 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for the Combine system home page; Combine is described
                 below as an open system for crawling Internet resources. -->
            <title>Focused crawler - Combine System Homepage</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Focused+crawler+-+Combine+System+Homepage/dazo</link>
            <description>"Combine is an open system for crawling [harvesting and threshing (indexing)] Internet resources. It can be used both as a general and focused crawler."</description>
            <pubDate>Fri, 28 Apr 2006 10:47:29 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for the Heritrix home page; Heritrix is described below
                 as the Internet Archive's web crawler project. -->
            <title>Heritrix - Home Page</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Heritrix+-+Home+Page/dazn</link>
            <description>"Heritrix is the Internet Archive's open-source, extensible, web-scale, archival-quality web crawler project."</description>
            <pubDate>Fri, 28 Apr 2006 10:47:29 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for WIRE (Web Information Retrieval Environment), a
                 project of the Center for Web Research per the text below. -->
            <title>WIRE (Web Information Retrieval Environment)::Center for Web Research</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/WIRE+%28Web+Information+Retrieval+Environment%29%3A%3ACenter+for+Web+Research/dazm</link>
            <description>"The WIRE project is an effort started by the Center for Web Research for creating an application for information retrieval, designed to be used on the Web."</description>
            <pubDate>Fri, 28 Apr 2006 10:47:28 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for Nutch, described below as open source web-search
                 software that builds on Lucene Java. -->
            <title>Welcome to Nutch!</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Welcome+to+Nutch%21/dazl</link>
            <description>"Nutch is open source web-search software. It builds on Lucene Java, adding web-specifics, such as a crawler, a link-graph database, parsers for HTML and other document formats, etc."</description>
            <pubDate>Fri, 28 Apr 2006 10:47:28 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry titled "Open Source Search - OpenSourceSearch"; the feed
                 carries no description text for it. -->
            <title>Open Source Search - OpenSourceSearch</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/Open+Source+Search+-+OpenSourceSearch/dazk</link>
            <description/>
            <pubDate>Fri, 28 Apr 2006 10:47:28 -0700</pubDate>
        </item>
            
        <item>
            <!-- Entry for the 2005 workshop on Open Source Web Information
                 Retrieval (per its title); no description text is provided. -->
            <title>2005 workshop on Open Source Web Information Retrieval</title>
            <link>http://swik.net/open-source/del.icio.us+tag%2Fopen-source/2005+workshop+on+Open+Source+Web+Information+Retrieval/dazi</link>
            <description/>
            <pubDate>Fri, 28 Apr 2006 10:47:28 -0700</pubDate>
        </item>
                </channel>
</rss>
