<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<!-- Channel-level metadata for the "scanned text" tag feed of jonas.sekamane.com. -->
	<title>Jonas K. Sekamane &#187; scanned text</title>
	<!-- rel="self": the URL of this feed document itself. -->
	<atom:link href="http://jonas.sekamane.com/tag/scanned-text/feed/" rel="self" type="application/rss+xml" />
	<!-- Home page of the site the feed belongs to. -->
	<link>http://jonas.sekamane.com</link>
	<!-- NOTE(review): the description is a literal "..." placeholder; confirm whether a real site tagline belongs here. -->
	<description>...</description>
	<lastBuildDate>Fri, 13 Aug 2010 22:33:06 +0000</lastBuildDate>
	<!-- Generator URL; the v= query parameter records WordPress 2.8.5. -->
	<generator>http://wordpress.org/?v=2.8.5</generator>
	<language>en</language>
	<!-- Syndication-module refresh hint: period "hourly" with frequency 1 (presumably one update per hour; confirm against the module spec). -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
			<!-- Feed entry for the post published 16 Sep 2009, which quotes Mashable's "Google Acquires reCAPTCHA" article. -->
			<item>
				<title>Crowds teach computers to read the scanned text</title>
				<link>http://jonas.sekamane.com/2009/09/crowds-teach-computers-to-read-the-scanned-text/</link>
				<comments>http://jonas.sekamane.com/2009/09/crowds-teach-computers-to-read-the-scanned-text/#comments</comments>
				<pubDate>Wed, 16 Sep 2009 19:21:24 +0000</pubDate>
				<dc:creator>Jonas K. Sekamane</dc:creator>
				<!-- Terms the post is filed under, one per category element. -->
				<category><![CDATA[Innovative Business Models]]></category>
				<category><![CDATA[crowdsourcing]]></category>
				<category><![CDATA[digitize]]></category>
				<category><![CDATA[google]]></category>
				<category><![CDATA[reCAPTCHA]]></category>
				<category><![CDATA[scanned text]]></category>
				<category><![CDATA[technology]]></category>

				<!-- isPermaLink="false": the ?p=40 URL acts as an opaque unique identifier, not as the reader-facing link. -->
				<guid isPermaLink="false">http://jonas.sekamane.com/?p=40</guid>
				<!-- Plain-text excerpt, cut off at "[...]". Lines inside the CDATA sections below start at column 0 on purpose: whitespace there is part of the text. -->
				<description><![CDATA[From the Google Acquires reCAPTCHA article at Mashable.com:
Why exactly does Google want to own this technology?
&#8230; many of the CAPTCHAs provided by reCAPTCHA come from scanned archival newspapers and old books. Computers find it hard to recognize these words because the ink and paper have degraded over time, but by typing them in as a CAPTCHA, [...]]]></description>
				<!-- Full post body as HTML. The passage quoted inside the blockquote is wrapped in a matching pair of quotation marks. -->
				<content:encoded><![CDATA[<p>From the <a title="Google Acquires reCAPTCHA" href="http://mashable.com/2009/09/16/google-acquires-recaptcha/"><strong>Google Acquires reCAPTCHA</strong></a> article at Mashable.com:</p>
<blockquote><p><strong>Why exactly does Google want to own this technology?</strong></p>
<p style="margin-bottom: 1em; margin-top: 0px; margin-right: 0px; margin-left: 0px; line-height: 1.5; text-align: justify; padding: 0px;">“&#8230; many of the CAPTCHAs provided by reCAPTCHA come from scanned archival newspapers and old books. Computers find it hard to recognize these words because the ink and paper have degraded over time, but by typing them in as a CAPTCHA, crowds teach computers to read the scanned text.”</p>
<p style="margin-bottom: 1em; margin-top: 0px; margin-right: 0px; margin-left: 0px; line-height: 1.5; text-align: justify; padding: 0px;">&#8230; those 100,000+ captcha forms are now Google-powered, with the data being used to improve Google’s ability to digitize old books and newspapers to make them Web searchable. It makes a lot of sense, and gives Google yet another strategic advantage over would-be competitors.</p>
</blockquote>
]]></content:encoded>
				<!-- Feed of the comments on this post, followed by the comment count reported for it. -->
				<wfw:commentRss>http://jonas.sekamane.com/2009/09/crowds-teach-computers-to-read-the-scanned-text/feed/</wfw:commentRss>
				<slash:comments>0</slash:comments>
			</item>
	</channel>
</rss>
