<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:xhtml="http://www.w3.org/1999/xhtml"
	>

<channel>
	<!-- Channel metadata. The atom:link with rel="self" is this feed's own URL (the "crawler" tag feed). -->
	<title>OpenWebSpider » crawler</title>
	<atom:link href="http://www.openwebspider.org/tag/crawler/feed/" rel="self" type="application/rss+xml" />
	<link>http://www.openwebspider.org</link>
	<description>Open Source Web Spider</description>
	<lastBuildDate>Mon, 18 May 2009 09:59:46 +0000</lastBuildDate>
	<language>en</language>
	<!-- Syndication-module refresh hint for aggregators: period "hourly", frequency 1. -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.2.1</generator>
	<!-- Robots directive carried as an XHTML meta element: the feed itself is marked "noindex". -->
	<xhtml:meta name="robots" content="noindex" />
		<item>
			<!-- Release announcement entry for OpenWebSpider# v0.1.3. -->
			<title>OpenWebSpider# v0.1.3</title>
			<link>http://www.openwebspider.org/2008/11/05/openwebspider-v013/</link>
			<comments>http://www.openwebspider.org/2008/11/05/openwebspider-v013/#comments</comments>
			<pubDate>Wed, 05 Nov 2008 10:40:38 +0000</pubDate>
			<dc:creator>Shen139</dc:creator>
			<category><![CDATA[News]]></category>
			<category><![CDATA[OpenWebSpider]]></category>
			<category><![CDATA[Release]]></category>
			<category><![CDATA[crawler]]></category>
			<category><![CDATA[download]]></category>
			<category><![CDATA[openwebspider]]></category>
			<category><![CDATA[robot]]></category>
			<category><![CDATA[spider]]></category>
			<category><![CDATA[web crawler]]></category>
			<category><![CDATA[web robot]]></category>
			<category><![CDATA[web spider]]></category>

			<!-- isPermaLink="false": the guid identifies the entry and is not its permalink (that is the link element above). -->
			<guid isPermaLink="false">http://www.openwebspider.org/?p=96</guid>
			<!-- Plain-text excerpt, truncated with [...]; the full HTML body follows in content:encoded.
			     The command-line flag is written with two ASCII hyphens so it can be copied verbatim. -->
			<description><![CDATA[Released OpenWebSpider v0.1.3 CHANGELOG: New feature: CRAWLER NAME and CRAWLER VERSION used in the User-Agent string in HTTP Requests New feature: New configuration file field: sql_hostlist_where New feature: new command-line argument: --keep-dup BUG: fixed the regex used to extract URLs from &#60;BASE&#62; BUG: fixed a bug in the function that extracts URLs BUG: fixed a bug in [...]]]></description>
			<content:encoded><![CDATA[<p>Released OpenWebSpider v0.1.3</p>
<p>CHANGELOG:</p>
<ul>
<li>New feature: CRAWLER NAME and CRAWLER VERSION used in the User-Agent string in HTTP Requests</li>
<li>New feature: New configuration file field: sql_hostlist_where</li>
<li>New feature: new command-line argument: --keep-dup</li>
<li>BUG: fixed the regex used to extract URLs from &lt;BASE&gt;</li>
<li>BUG: fixed a bug in the function that extracts URLs</li>
<li>BUG: fixed a bug in page.cs::normalizePage()</li>
<li>BUG: fixed minor bugs</li>
<li>BUG: fixed a bug in robots.txt&#8217;s parser</li>
<li>BUG: fixed a bug in page-rels handler</li>
</ul>
<p>Source code and binary are available in the package: <a href="http://www.openwebspider.org/download/">Download</a></p>
<p><strong><a href="http://www.openwebspider.org/documentation/openwebspider-v01/">Documentation of OpenWebSpider# v0.1</a></strong></p>
]]></content:encoded>
			<!-- Per-entry comment feed URL, followed by the entry's comment count. -->
			<wfw:commentRss>http://www.openwebspider.org/2008/11/05/openwebspider-v013/feed/</wfw:commentRss>
			<slash:comments>2</slash:comments>
		</item>
		<item>
			<!-- Release announcement entry for OpenWebSpider# v0.1.2. -->
			<title>OpenWebSpider# v0.1.2</title>
			<link>http://www.openwebspider.org/2008/09/09/openwebspider-v012/</link>
			<comments>http://www.openwebspider.org/2008/09/09/openwebspider-v012/#comments</comments>
			<pubDate>Tue, 09 Sep 2008 10:01:48 +0000</pubDate>
			<dc:creator>Shen139</dc:creator>
			<category><![CDATA[OpenWebSpider]]></category>
			<category><![CDATA[crawler]]></category>
			<category><![CDATA[download]]></category>
			<category><![CDATA[Release]]></category>
			<category><![CDATA[robot]]></category>
			<category><![CDATA[spider]]></category>
			<category><![CDATA[web crawler]]></category>
			<category><![CDATA[web robot]]></category>
			<category><![CDATA[web spider]]></category>

			<!-- isPermaLink="false": the guid identifies the entry and is not its permalink (that is the link element above). -->
			<guid isPermaLink="false">http://www.openwebspider.org/?p=62</guid>
			<!-- Plain-text excerpt, truncated with [...]; the full HTML body follows in content:encoded.
			     The command-line flag is written with two ASCII hyphens so it can be copied verbatim. -->
			<description><![CDATA[Released OpenWebSpider v0.1.2 CHANGELOG: BUG: fixed the regex used to extract URLs from (I)FRAME New feature: OpenWebSpider# can index images (new table: images) New feature: new command-line argument: --images Improved Stress-test facility: now OpenWebSpider# doesn&#8217;t require a configuration file and a MySQL Server and it doesn&#8217;t check robots.txt (in stress-test mode) Timeout in execution of [...]]]></description>
			<content:encoded><![CDATA[<p>Released OpenWebSpider v0.1.2</p>
<p>CHANGELOG:</p>
<ul>
<li>BUG: fixed the regex used to extract URLs from (I)FRAME</li>
<li>New feature: OpenWebSpider# can index images (new table: images)</li>
<li>New feature: new command-line argument: --images</li>
<li>Improved Stress-test facility: now OpenWebSpider# doesn&#8217;t require a configuration file and a MySQL Server and it doesn&#8217;t check robots.txt (in stress-test mode)</li>
<li>Timeout in execution of SQL queries set to 120 seconds (2 minutes)</li>
<li>New feature: new configuration file fields: CRAWLER NAME and CRAWLER VERSION</li>
<li>New feature: CRAWLER NAME used over robots.txt</li>
</ul>
<p>Source code and binary are available in the package: <a href="http://www.openwebspider.org/download/">Download</a></p>
<p><strong><a href="http://www.openwebspider.org/documentation/openwebspider-v01/">Documentation of OpenWebSpider# v0.1</a></strong></p>
]]></content:encoded>
			<!-- Per-entry comment feed URL, followed by the entry's comment count. -->
			<wfw:commentRss>http://www.openwebspider.org/2008/09/09/openwebspider-v012/feed/</wfw:commentRss>
			<slash:comments>24</slash:comments>
		</item>
	</channel>
</rss>

