<?xml version="1.0" encoding="utf-8" ?>

<rss version="2.0">
  <channel>
    <!-- Channel metadata for the bookmark feed of Simpy user "otis". -->
    <title><![CDATA[otis's Feed]]></title>
    <link>http://www.simpy.com/user/otis</link>
    <description><![CDATA[otis's Feed]]></description>
    <!-- This is an RSS file. It is intended to be read by a software program called a "feed reader".
         RSS 2.0 expects docs to hold a URL to the format documentation, so the explanatory text lives in this comment. -->
    <docs>https://www.rssboard.org/rss-specification</docs>
    <image>
      <url>http://www.simpy.com/img/simpy-icon-16x16.png</url>
      <title>Simpy</title>
      <link>http://www.simpy.com/user/otis</link>
    </image>
    <!-- lastBuildDate is optional; it is omitted because no build timestamp is available and an empty element is not a valid date. -->
    <!-- ttl is the number of minutes a client may cache the feed (1440 = 24 hours). -->
    <ttl>1440</ttl>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[behemoth-pebble - Project Hosting on Google Code]]></title>
        <link><![CDATA[http://code.google.com/p/behemoth-pebble/]]></link>
        <guid isPermaLink="true"><![CDATA[http://code.google.com/p/behemoth-pebble/]]></guid>
        <description><![CDATA[Behemoth allows to deploy GATE or UIMA applications over a Hadoop cluster in order to do very large scale document analysis. It uses a simple representation format which can be used as a common ground between UIMA and GATE-generated annotations, hence achieving compatibility between both systems. Since it is Hadoop-based it benefits from all its features, namely scalability, fault-tolerance and most notably the back up of a thriving open source community. Quite a few Apache resources will fit into it: Nutch, Tika, Mahout, Hbase etc...
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22UIMA%22">UIMA</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22gate%22">gate</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22hadoop%22">hadoop</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22text+mining%22">text mining</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22text+analysis%22">text analysis</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22MapReduce%22">MapReduce</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22distributed+computing%22">distributed computing</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[UIMA]]></category>
        <category><![CDATA[gate]]></category>
        <category><![CDATA[hadoop]]></category>
        <category><![CDATA[text mining]]></category>
        <category><![CDATA[text analysis]]></category>
        <category><![CDATA[MapReduce]]></category>
        <category><![CDATA[distributed computing]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Tue, 01 Dec 2009 10:35:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Getting To The SuperTweet: Speedi.ly Classifies The Real Time Web]]></title>
        <link><![CDATA[http://www.techcrunch.com/2009/11/20/getting-to-the-supertweet-speedi-ly-classifies-the-real-time-web/]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.techcrunch.com/2009/11/20/getting-to-the-supertweet-speedi-ly-classifies-the-real-time-web/]]></guid>
        <description><![CDATA[Speedi.ly takes a piece of content, or grabs the content from a URL, and analyzes it. It does this very fast and it outputs some key data. Speedi.ly tells you the language of the content, categorizes it (topics, keywords), and additional metadata.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22classification%22">classification</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22service%22">service</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22saas%22">saas</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22named+entity+extraction%22">named entity extraction</a>
        ]]></description>
        <category><![CDATA[classification]]></category>
        <category><![CDATA[service]]></category>
        <category><![CDATA[saas]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[named entity extraction]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Mon, 23 Nov 2009 12:06:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[uClassify - free text classifier web service]]></title>
        <link><![CDATA[http://uclassify.com/]]></link>
        <guid isPermaLink="true"><![CDATA[http://uclassify.com/]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22classification%22">classification</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22service%22">service</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22saas%22">saas</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22windows%22">windows</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[classification]]></category>
        <category><![CDATA[service]]></category>
        <category><![CDATA[saas]]></category>
        <category><![CDATA[windows]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Mon, 23 Nov 2009 12:05:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Untitled]]></title>
        <link><![CDATA[http://www.semanticsoftware.info/]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.semanticsoftware.info/]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22semantic%22">semantic</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22gate%22">gate</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>
        ]]></description>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[semantic]]></category>
        <category><![CDATA[gate]]></category>
        <category><![CDATA[software]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Wed, 18 Nov 2009 05:36:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Morphix-NLP -- The most NLP applications on one CD!]]></title>
        <link><![CDATA[http://morphix-nlp.berlios.de/]]></link>
        <guid isPermaLink="true"><![CDATA[http://morphix-nlp.berlios.de/]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22morphix%22">morphix</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22linux%22">linux</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>
        ]]></description>
        <category><![CDATA[morphix]]></category>
        <category><![CDATA[linux]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[software]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Wed, 18 Nov 2009 05:33:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Multi-lingual Noun Phrase Extractor (MuNPEx) | semanticsoftware.info]]></title>
        <link><![CDATA[http://www.semanticsoftware.info/munpex]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.semanticsoftware.info/munpex]]></guid>
        <description><![CDATA[MuNPEx is a multi-lingual noun phrase (NP) extraction component developed for the GATE architecture, implemented in JAPE. It currently supports English, German, French, and Spanish (in beta). MuNPEx requires a part-of-speech (POS) tagger to work and can additionally use detected named entities (NEs) to improve chunking performance. Please read the documentation (or source code) for more details.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22key+phrases%22">key phrases</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+extraction%22">information extraction</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22computational+linguistics%22">computational linguistics</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22gate%22">gate</a>
        ]]></description>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[key phrases]]></category>
        <category><![CDATA[information extraction]]></category>
        <category><![CDATA[computational linguistics]]></category>
        <category><![CDATA[software]]></category>
        <category><![CDATA[gate]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Wed, 18 Nov 2009 05:30:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Extracting Text from Wikipedia]]></title>
        <link><![CDATA[http://evanjones.ca/software/wikipedia2text.html]]></link>
        <guid isPermaLink="true"><![CDATA[http://evanjones.ca/software/wikipedia2text.html]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22wikipedia%22">wikipedia</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22dump%22">dump</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22extract%22">extract</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22text%22">text</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22data+mining%22">data mining</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22text+mining%22">text mining</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22corporation%22">corporation</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[wikipedia]]></category>
        <category><![CDATA[dump]]></category>
        <category><![CDATA[extract]]></category>
        <category><![CDATA[text]]></category>
        <category><![CDATA[data mining]]></category>
        <category><![CDATA[text mining]]></category>
        <category><![CDATA[corporation]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Sat, 07 Nov 2009 01:34:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[AI ACCESS e-books]]></title>
        <link><![CDATA[http://www.aiaccess.net/English/Glossaries/Shop/bookstore.htm]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.aiaccess.net/English/Glossaries/Shop/bookstore.htm]]></guid>
        <description><![CDATA[PROBABILITIES, STATISTICS AND DATA MODELING
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22statistics%22">statistics</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22probability%22">probability</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22math%22">math</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22matrix%22">matrix</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22tutorial%22">tutorial</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22reference%22">reference</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22ebook%22">ebook</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22pdf%22">pdf</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[statistics]]></category>
        <category><![CDATA[probability]]></category>
        <category><![CDATA[math]]></category>
        <category><![CDATA[matrix]]></category>
        <category><![CDATA[tutorial]]></category>
        <category><![CDATA[reference]]></category>
        <category><![CDATA[ebook]]></category>
        <category><![CDATA[pdf]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Tue, 03 Nov 2009 04:27:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Web as Corpus ToolKit - Home Page]]></title>
        <link><![CDATA[http://www.drni.de/wac-tk/]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.drni.de/wac-tk/]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22perl%22">perl</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22corpus%22">corpus</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22text+mining%22">text mining</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22dataset%22">dataset</a>
        ]]></description>
        <category><![CDATA[software]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[perl]]></category>
        <category><![CDATA[corpus]]></category>
        <category><![CDATA[text mining]]></category>
        <category><![CDATA[dataset]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Mon, 02 Nov 2009 01:59:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[home - FreeLing Home Page]]></title>
        <link><![CDATA[http://www.lsi.upc.edu/~nlp/freeling/]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.lsi.upc.edu/~nlp/freeling/]]></guid>
        <description><![CDATA[C++ (but has Java API), GPL
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22library%22">library</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22api%22">api</a>
        ]]></description>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[software]]></category>
        <category><![CDATA[library]]></category>
        <category><![CDATA[api]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Mon, 02 Nov 2009 01:51:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[nlpFarm - Home]]></title>
        <link><![CDATA[http://herd.ida.liu.se:8180/nlpfarm/]]></link>
        <guid isPermaLink="true"><![CDATA[http://herd.ida.liu.se:8180/nlpfarm/]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22computational+linguistics%22">computational linguistics</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22java%22">java</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22api%22">api</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22library%22">library</a>
        ]]></description>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[computational linguistics]]></category>
        <category><![CDATA[java]]></category>
        <category><![CDATA[software]]></category>
        <category><![CDATA[api]]></category>
        <category><![CDATA[library]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Mon, 02 Nov 2009 01:33:00 -0500</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[MaltParser]]></title>
        <link><![CDATA[http://maltparser.org/]]></link>
        <guid isPermaLink="true"><![CDATA[http://maltparser.org/]]></guid>
        <description><![CDATA[MaltParser is a system for data-driven dependency parsing, which can be used to induce a parsing model from treebank data and to parse new data using an induced model.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22machine+learning%22">machine learning</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22parse%22">parse</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22computational+linguistics%22">computational linguistics</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22java%22">java</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22software%22">software</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22api%22">api</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22library%22">library</a>
        ]]></description>
        <category><![CDATA[machine learning]]></category>
        <category><![CDATA[parse]]></category>
        <category><![CDATA[computational linguistics]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[java]]></category>
        <category><![CDATA[software]]></category>
        <category><![CDATA[api]]></category>
        <category><![CDATA[library]]></category>
        <author><![CDATA[otis]]></author>
        <!-- NOTE(review): the next entry in this feed is stamped 12:24 on the same day, although entries otherwise appear newest first. Possibly the generator formats hours on a 12-hour clock and 16:20 was meant; confirm against the source data before changing. -->
        <pubDate>Thu, 29 Oct 2009 04:20:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Factual]]></title>
        <link><![CDATA[http://www.factual.com/]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.factual.com/]]></guid>
        <description><![CDATA[Platform where anyone can share and mash open data on any subject
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22data%22">data</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22machine+learning%22">machine learning</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22mashup%22">mashup</a>
        ]]></description>
        <category><![CDATA[data]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[machine learning]]></category>
        <category><![CDATA[mashup]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Thu, 29 Oct 2009 12:24:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[Wikipedia:Lists of common misspellings/For machines - Wikipedia, the free encyclopedia]]></title>
        <link><![CDATA[http://en.wikipedia.org/wiki/Wikipedia:Lists_of_common_misspellings/For_machines]]></link>
        <guid isPermaLink="true"><![CDATA[http://en.wikipedia.org/wiki/Wikipedia:Lists_of_common_misspellings/For_machines]]></guid>
        <description><![CDATA[Common English misspellings from Wikipedia
4107 misspellings as of 2009-10-29
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22wikipedia%22">wikipedia</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22spell%22">spell</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22english%22">english</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22language%22">language</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22search%22">search</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[wikipedia]]></category>
        <category><![CDATA[spell]]></category>
        <category><![CDATA[english]]></category>
        <category><![CDATA[language]]></category>
        <category><![CDATA[search]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Thu, 29 Oct 2009 12:20:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[sen: Home]]></title>
        <link><![CDATA[https://sen.dev.java.net/]]></link>
        <guid isPermaLink="true"><![CDATA[https://sen.dev.java.net/]]></guid>
        <description><![CDATA[Sen is the first opensource morphological analyzer written in pure Java.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22japanese%22">japanese</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22morphology%22">morphology</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22analysis%22">analysis</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22lucene%22">lucene</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22search%22">search</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22index%22">index</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22library%22">library</a>
        ]]></description>
        <category><![CDATA[japanese]]></category>
        <category><![CDATA[morphology]]></category>
        <category><![CDATA[analysis]]></category>
        <category><![CDATA[lucene]]></category>
        <category><![CDATA[search]]></category>
        <category><![CDATA[index]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[library]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Fri, 16 Oct 2009 11:39:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[http://www.cs.uic.edu/~liub/FBS/NLP-handbook-sentiment-analysis.pdf]]></title>
        <link><![CDATA[http://www.cs.uic.edu/~liub/FBS/NLP-handbook-sentiment-analysis.pdf]]></link>
        <guid isPermaLink="true"><![CDATA[http://www.cs.uic.edu/~liub/FBS/NLP-handbook-sentiment-analysis.pdf]]></guid>
        <description><![CDATA[
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22sentiment%22">sentiment</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22reference%22">reference</a>
        ]]></description>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[sentiment]]></category>
        <category><![CDATA[reference]]></category>
        <author><![CDATA[otis]]></author>
        <!-- NOTE(review): the next entry in this feed is stamped 10:54 on the same day, although entries otherwise appear newest first. Possibly the generator formats hours on a 12-hour clock and 21:55 was meant; confirm against the source data before changing. -->
        <pubDate>Wed, 07 Oct 2009 09:55:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[OPUS - an open source parallel corpus]]></title>
        <link><![CDATA[http://urd.let.rug.nl/tiedeman/OPUS/]]></link>
        <guid isPermaLink="true"><![CDATA[http://urd.let.rug.nl/tiedeman/OPUS/]]></guid>
        <description><![CDATA[OPUS is an attempt to collect translated texts from the web, to convert and align the entire collection, to add linguistic annotation, and to provide the community with a publicly available parallel corpus. OPUS is based on open source products and is also delivered as an open source package.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22corpus%22">corpus</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22information+retrieval%22">information retrieval</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>
        ]]></description>
        <category><![CDATA[corpus]]></category>
        <category><![CDATA[information retrieval]]></category>
        <category><![CDATA[NLP]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Wed, 07 Oct 2009 10:54:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <!-- Bookmark entry. The description is HTML wrapped in CDATA; every tag linked there also appears as a category. The guid repeats the link so feed readers can identify the entry. -->
      <item>
        <title><![CDATA[OntoWare:Text2Onto: Project Info]]></title>
        <link><![CDATA[http://ontoware.org/projects/text2onto/]]></link>
        <guid isPermaLink="true"><![CDATA[http://ontoware.org/projects/text2onto/]]></guid>
        <description><![CDATA[Text2Onto is the official successor of TextToOnto, a framework for ontology learning from text.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under
          <a href="http://www.simpy.com/user/otis/tag/%22ontology%22">ontology</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22corpus%22">corpus</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,
          <a href="http://www.simpy.com/user/otis/tag/%22semantic%22">semantic</a>
        ]]></description>
        <category><![CDATA[ontology]]></category>
        <category><![CDATA[corpus]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[semantic]]></category>
        <author><![CDATA[otis]]></author>
        <pubDate>Sat, 12 Sep 2009 10:36:00 -0400</pubDate>
      </item>
    
      
      
      


  
    
  
  
  


      <item>
        <!-- Bookmark entry for the Zemberek project page. The description is HTML carried
             inside CDATA, so its whitespace and punctuation are part of the payload. -->
        <title><![CDATA[zemberek - Turkish NLP library]]></title>
        <link><![CDATA[http://code.google.com/p/zemberek/]]></link>
        <!-- Stable identifier for aggregators; it repeats the link, hence isPermaLink="true". -->
        <guid isPermaLink="true"><![CDATA[http://code.google.com/p/zemberek/]]></guid>
        <description><![CDATA[Zemberek is an open source, platform independent, general purpose Natural Language Processing library and toolset designed for Turkic languages, especially Turkish.

Zemberek is officially used as spell checker in Open Office Turkish version and Turkish national Linux Distribution Pardus. Google Code will host Zemberek-2, Zemberek Corpus and Wordnet projects. These projects has Mozilla Public License. 
          <img src="http://www.simpy.com/t/fir.gif"/>
<!--
	  <br/>
          <a href="http://www.pheedo.com/click.phdo?x=0b8a1e9c81c14341a5689c3f903dd631&u=http://code.google.com/p/zemberek/"><img
             src="http://www.pheedo.com/img.phdo?x=0b8a1e9c81c14341a5689c3f903dd631&u=http://code.google.com/p/zemberek/" border="0"/></a>
          <p/>
-->
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under 
         
<a href="http://www.simpy.com/user/otis/tag/%22turkish%22">turkish</a>,

<a href="http://www.simpy.com/user/otis/tag/%22language%22">language</a>,

<a href="http://www.simpy.com/user/otis/tag/%22analysis%22">analysis</a>,

<a href="http://www.simpy.com/user/otis/tag/%22search%22">search</a>,

<a href="http://www.simpy.com/user/otis/tag/%22tokenizer%22">tokenizer</a>,

<a href="http://www.simpy.com/user/otis/tag/%22stemming%22">stemming</a>,

<a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>,

<a href="http://www.simpy.com/user/otis/tag/%22library%22">library</a>


]]>
</description>
        <!-- One category per tag, in the same order as the tag links in the description. -->
        <category><![CDATA[turkish]]></category>
        <category><![CDATA[language]]></category>
        <category><![CDATA[analysis]]></category>
        <category><![CDATA[search]]></category>
        <category><![CDATA[tokenizer]]></category>
        <category><![CDATA[stemming]]></category>
        <category><![CDATA[NLP]]></category>
        <category><![CDATA[library]]></category>
        <!-- NOTE(review): RSS 2.0 defines author as an e-mail address; this holds a user name.
             Confirm whether consumers depend on the current value before changing it. -->
        <author><![CDATA[otis]]></author>
        <pubDate>Fri, 24 Jul 2009 09:41:00 -0400</pubDate>
      </item>
    
      
      
      


  
  
    
  
  


      <item>
        <!-- Bookmark entry for the "Near-duplicates and shingling" page. The description is HTML
             carried inside CDATA, so its whitespace and punctuation are part of the payload. -->
        <title><![CDATA[Near-duplicates and shingling]]></title>
        <link><![CDATA[http://nlp.stanford.edu/IR-book/html/htmledition/near-duplicates-and-shingling-1.html]]></link>
        <!-- Stable identifier for aggregators; it repeats the link, hence isPermaLink="true". -->
        <guid isPermaLink="true"><![CDATA[http://nlp.stanford.edu/IR-book/html/htmledition/near-duplicates-and-shingling-1.html]]></guid>
        <description><![CDATA[Near duplicate detection algorithm for deduplication (deduping)
          <img src="http://www.simpy.com/t/fir.gif"/>
<!--
	  <br/>
          <a href="http://www.pheedo.com/click.phdo?x=0b8a1e9c81c14341a5689c3f903dd631&u=http://nlp.stanford.edu/IR-book/html/htmledition/near-duplicates-and-shingling-1.html"><img
             src="http://www.pheedo.com/img.phdo?x=0b8a1e9c81c14341a5689c3f903dd631&u=http://nlp.stanford.edu/IR-book/html/htmledition/near-duplicates-and-shingling-1.html" border="0"/></a>
          <p/>
-->
          Tagged by <a href="http://www.simpy.com/user/otis">otis</a> under 
         
<a href="http://www.simpy.com/user/otis/tag/%22duplicate+detection%22">duplicate detection</a>,

<a href="http://www.simpy.com/user/otis/tag/%22NLP%22">NLP</a>


]]>
</description>
        <!-- One category per tag, in the same order as the tag links in the description. -->
        <category><![CDATA[duplicate detection]]></category>
        <category><![CDATA[NLP]]></category>
        <!-- NOTE(review): RSS 2.0 defines author as an e-mail address; this holds a user name.
             Confirm whether consumers depend on the current value before changing it. -->
        <author><![CDATA[otis]]></author>
        <pubDate>Tue, 14 Jul 2009 10:30:00 -0400</pubDate>
      </item>
    
  </channel>
</rss>
