<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
		>
<channel>
	<title>Comments on: Algorithms for data processing</title>
	<atom:link href="http://blog.thekilobytes.net/2006/09/03/algorithms-for-data-processing/feed/" rel="self" type="application/rss+xml" />
	<link>http://blog.thekilobytes.net/2006/09/03/algorithms-for-data-processing/</link>
	<description>Just another WordPress weblog</description>
	<lastBuildDate>Tue, 06 Apr 2010 16:00:34 +0000</lastBuildDate>
	<generator>http://wordpress.org/?v=2.9.2</generator>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
		<item>
		<title>By: kowkaybin</title>
		<link>http://blog.thekilobytes.net/2006/09/03/algorithms-for-data-processing/comment-page-1/#comment-17</link>
		<dc:creator>kowkaybin</dc:creator>
		<pubDate>Sun, 03 Sep 2006 15:46:31 +0000</pubDate>
		<guid isPermaLink="false">http://blog.thekilobytes.net/2006/09/03/algorithms-for-data-processing/#comment-17</guid>
		<description>I&#039;m using ~20k pages from a vBulletin board as data samples and am now running a word analysis program to process the data, trying to sample the frequency of the words in it. I hope I can get:

1. Template Words (which should not be evaluated in a query)
2. Groupings of words (synonyms, you could perhaps call them)
3. *Spelling correction based on some algorithm that I have not come up with yet</description>
		<content:encoded><![CDATA[<p>I&#8217;m using ~20k pages from a vBulletin board as data samples and am now running a word analysis program to process the data, trying to sample the frequency of the words in it. I hope I can get:</p>
<p>1. Template Words (which should not be evaluated in a query)<br />
2. Groupings of words (synonyms, you could perhaps call them)<br />
3. *Spelling correction based on some algorithm that I have not come up with yet</p>
]]></content:encoded>
	</item>
</channel>
</rss>

