<?xml version="1.0" encoding="utf-8" ?>

<rss version="2.0">
  <channel>
    <!--
      Channel metadata for the feed.
      This is an RSS file. It is intended to be read by a software program
      called a "feed reader". Search on Google for more details.
    -->
    <!-- RSS 2.0 defines <docs> as a URL pointing at the format documentation, not free text. -->
    <docs>https://www.rssboard.org/rss-specification</docs>
    <title>segphault's Feed</title>
    <link>http://www.simpy.com/user/segphault</link>
    <!-- No channel-level <url>: RSS 2.0 only defines <url> inside <image>. -->
    <description>segphault's Feed</description>
    <!-- Icon that readers may display next to the channel. -->
    <image>
      <url>http://www.simpy.com/img/simpy-icon-16x16.png</url>
      <title>Simpy</title>
      <link>http://www.simpy.com/user/segphault</link>
    </image>
    <!--
      <lastBuildDate> is optional and is omitted here: an empty element is not
      a valid RFC 822 date-time. Emit it only when the build time is known.
    -->
    <!-- Cache lifetime in minutes (1440 = 24 hours). -->
    <ttl>1440</ttl>
    
      
      
      


  
    
  
  
  


      <!-- One bookmarked link published in this channel. -->
      <item>
        <title>Python library for parsing bad HTML markup</title>
        <link>http://www.crummy.com/software/BeautifulSoup/</link>
        <!--
          The description carries HTML for the reader to render, so it stays in
          a CDATA section to avoid entity-escaping the embedded markup.
          The list of tag links must not end with a trailing comma.
        -->
        <description><![CDATA[I often struggle to extract information from crappy HTML. My default approach typically involves using grep or sed while issuing a steady stream of expletives. This library makes it easy to extricate useful content from a veritable soup of insidiously crafted HTML.
          <img src="http://www.simpy.com/t/fir.gif"/>
          Tagged by <a href="http://www.simpy.com/user/segphault">segphault</a> under
          <a href="http://www.simpy.com/user/segphault/tag/%22Python%22">Python</a>,
          <a href="http://www.simpy.com/user/segphault/tag/%22development%22">development</a>,
          <a href="http://www.simpy.com/user/segphault/tag/%22HTML%22">HTML</a>,
          <a href="http://www.simpy.com/user/segphault/tag/%22parsing%22">parsing</a>
        ]]></description>
        <!-- One <category> per tag, in the same order as the links in the description. -->
        <category>Python</category>
        <category>development</category>
        <category>HTML</category>
        <category>parsing</category>
        <!--
          NOTE(review): RSS 2.0 defines <author> as an e-mail address; a bare
          username fails strict validation. The item also has no <guid>.
          Confirm with feed consumers before changing either.
        -->
        <author>segphault</author>
        <pubDate>Sat, 04 Aug 2007 04:57:00 -0400</pubDate>
      </item>
    
  </channel>
</rss>
