<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<!-- Channel identity: title, self-referencing feed URL, site link and description. -->
	<title>Plush Thoughts</title>
	<atom:link rel="self" type="application/rss+xml" href="http://plushloony.wordpress.com/feed/"/>
	<link>http://plushloony.wordpress.com</link>
	<description>thoughts on technology, information and drinks...</description>
	<lastBuildDate>Fri, 09 Oct 2009 12:48:13 +0000</lastBuildDate>
	<language>en</language>
	<!-- Syndication module hints: period "hourly", frequency 1. -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
	<!-- rssCloud endpoint: protocol http-post, path /?rsscloud=notify, port 80. -->
	<cloud domain="plushloony.wordpress.com" port="80" path="/?rsscloud=notify" registerProcedure="" protocol="http-post"/>
	<!-- Channel image; its title and link repeat the channel's own values. -->
	<image>
		<url>http://s2.wp.com/i/buttonw-com.png</url>
		<title>Plush Thoughts</title>
		<link>http://plushloony.wordpress.com</link>
	</image>
	<!-- Additional Atom links: OpenSearch description document and the rel="hub" endpoint. -->
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://plushloony.wordpress.com/osd.xml" title="Plush Thoughts"/>
	<atom:link rel="hub" href="http://plushloony.wordpress.com/?pushpress=hub"/>
		<item>
		<!-- Entry ?p=28: title, links, publication date, author, categories, guid. -->
		<title>truckur</title>
		<link>http://plushloony.wordpress.com/2009/10/09/truckur/</link>
		<comments>http://plushloony.wordpress.com/2009/10/09/truckur/#comments</comments>
		<pubDate>Fri, 09 Oct 2009 12:45:34 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>Uncategorized</category>
		<category>Sentiment Analysis</category>
		<category>sentiment extraction</category>
		<category>social media</category>
		<category>twitter</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=28</guid>
		<description><![CDATA[I&#8217;ve checked this out. It sucks. I submitted several laptop names and got hundreds of records, all of them were tagged as neutral. Just a heap of twitter and news garbage. Does everybody test their applications on &#8220;IPhone&#8221; &#38; &#8220;Apple&#8221; only? It explains a lot&#8230; Such a caustic post=)))<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=28&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;ve checked <a href="http://www.trackur.com"> this </a> out. It sucks.<br />
I submitted several laptop names and got hundreds of records, all of them were tagged as neutral. Just a heap of twitter and news garbage. Does everybody test their applications on &#8220;IPhone&#8221; &amp; &#8220;Apple&#8221; only? It explains a lot&#8230;</p>
<p>Such a caustic post=)))</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/28/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/28/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/28/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=28&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/10/09/truckur/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>0</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
	</item>
		<item>
		<!-- Entry ?p=23: title, links, publication date, author, categories, guid. -->
		<title>GATE: Russian POS tagger</title>
		<link>http://plushloony.wordpress.com/2009/10/01/gate-russian-pos-tagger/</link>
		<comments>http://plushloony.wordpress.com/2009/10/01/gate-russian-pos-tagger/#comments</comments>
		<pubDate>Thu, 01 Oct 2009 15:13:46 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>gate</category>
		<category>Information Extraction</category>
		<category>language processing</category>
		<category>natural language processing</category>
		<category>NLP</category>
		<category>mystem</category>
		<category>russian POS tagger</category>
		<category>yandex</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=23</guid>
		<description><![CDATA[As I wrote before GATE is &#8216;good to start&#8217; natural language processing open source framework. I&#8217;ll try to write interesting observations and findings related to capabilities of this system. And first of all I would like to share two approaches to processing of Russian language in this system. Russian segment of world wide web is [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=23&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>As I wrote before GATE is &#8216;good to start&#8217; natural language processing open source framework. I&#8217;ll try to write interesting observations and findings related to capabilities of this system. And first of all I would like to share two approaches to processing of Russian language in this system.</p>
<p>Russian segment of world wide web is fast growing source of data and has potential of huge electronic market, so ability to process and make reasonable conclusions from its content could be quite important for international corporations very soon. At the same time there are not too many solutions and technologies that focus on Russian texts. Support of Russian language always was secondary to any company or technology related to the field of the NLP and GATE is an exception. But here are a few ways how you could add support of Russian morphological analysis to GATE based application.</p>
<p>The first approach is based on commercial (but available for non-commercial use) product of Yandex (www.yandex.ru) &#8211;  <a href="http://company.yandex.ru/technology/mystem/">MyStem</a>.  On the <a href="http://dvsekhvalnov.itbrains.ru/index.php/Russian_PRs">ITBrains</a> website you could find detailed steps and download links that would help you to enable Russian POS tagger functionality to GATE. Unfortunately this site experiences technical issues and I preserved corresponding information here -  <a href="http://narod.ru/disk/11416560000/Ru-morph-tagger.zip.html">Ru-morph-tagger.zip &#8211; plugin</a>; <a href="http://narod.ru/disk/11416735000/yandbtm.htm.html"> Documentation (brief guide)</a></p>
<p>Here is another way to embed support for the Russian language: <a href="http://rupostagger.sourceforge.net/">Russian POS tagger</a></p>
<p>Please let me know if these materials are useful to someone and if translation is needed somewhere. I&#8217;d be glad to help.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/23/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/23/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/23/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=23&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/10/01/gate-russian-pos-tagger/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>0</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
	</item>
		<item>
		<!-- Entry ?p=13: title, links, publication date, author, categories, guid. -->
		<title>Twitter – Sentimental Satisfaction</title>
		<link>http://plushloony.wordpress.com/2009/09/30/twitter-inside/</link>
		<comments>http://plushloony.wordpress.com/2009/09/30/twitter-inside/#comments</comments>
		<pubDate>Wed, 30 Sep 2009 15:45:44 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>sentiment extraction</category>
		<category>twitter</category>
		<category>Uncategorized</category>
		<category>Sentiment Analysis</category>
		<category>Voice of Customer</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=13</guid>
		<description><![CDATA[Twitter has tempting search API and access to millions of human “thoughts”. What kind of helpful, really meaningful information could be extracted from them? I don&#8217;t believe there is any&#8230;Isn’t it just a huge recycle bin? Any ideas? You’d say : “Sentiments!”. Ok, you are not the first with this idea, let’s see&#8230; Here are [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=13&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Twitter has tempting search API and access to millions of human “thoughts”. What kind of helpful, really meaningful information could be extracted from them? I don&#8217;t believe there is any&#8230;Isn’t it just a huge recycle bin? Any ideas?<br />
You’d say : “Sentiments!”. Ok, you are not the first with this idea, let’s see&#8230; Here are two projects that utilize twitter trying to find positive or negative feedback related to brand, product or concept, I believe we will see more soon.<br />
Beta Version. Research: <a title="TwitterSentiments" href="http://twittersentiment.appspot.com/" target="_blank">http://twittersentiment.appspot.com/</a><br />
These guys still don’t want to send me invitation and give me a chance to test new service, but you can find some screen shots on their site: <a title="TweetSatisfaction" href="http://www.tweetsatisfaction.com" target="_blank">http://www.tweetsatisfaction.com</a></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/13/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/13/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/13/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=13&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/09/30/twitter-inside/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>2</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
	</item>
		<item>
		<!-- Entry ?p=9: title, links, publication date, author, categories, guid. -->
		<title>Where information lives…</title>
		<!-- %e2%80%a6 in the URLs is the percent-encoded UTF-8 ellipsis from the title. -->
		<link>http://plushloony.wordpress.com/2009/08/06/where-information-lives%e2%80%a6/</link>
		<comments>http://plushloony.wordpress.com/2009/08/06/where-information-lives%e2%80%a6/#comments</comments>
		<pubDate>Thu, 06 Aug 2009 12:06:17 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>Information Extraction</category>
		<category>Information Sources</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=9</guid>
		<description><![CDATA[I’d like to take a look at the problem of identifying most valuable publicly available web sources of unstructured or semi-structured data, sources that could be efficiently used for extraction of useful information. By the value of a source I mean maximal ratio of information extraction algorithms complexity required to extract data to amount of potentially useful [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=9&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I’d like to take a look at the problem of identifying most valuable publicly available web sources of unstructured or semi-structured data, sources that could be efficiently used for extraction of useful information. By the value of a source I mean maximal ratio of information extraction algorithms complexity required to extract data to amount of potentially useful information extracted by those methods. Here are just a few thoughts on this…</p>
<p>We don’t expect single text taken from the web to be a trusted source. I think it’s obvious that text created by some author reflects his mistakes and subjective opinion, and also any method of information retrieval returns a number of “false positives”. Thus we need to consider sources that provide significant amount of similar text on a same subject but generated by different authors. In this case common things could be considered as trusted or at least as important facts.</p>
<p>The next problem is homogeneity…One author could describe a lot of things in one text. It significantly increases complexity of information processing if we’d need to identify which authors’ thought relates to what subject.</p>
<p>And as the last item in the list of most significant problems I would name relevancy. For example, if we want to know an opinion about a new movie we are not interested in reading press release cross posted in someone’s blog, technically it’s possible, but it’s hard to identify that such blog item is not a review.</p>
<p>So from my point of view</p>
<ul>
<li><strong>good sources</strong>: customers reviews, professional product reviews</li>
<li><strong>bad sources</strong>: blogs, forums, press releases</li>
</ul>
<p>…other examples?</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/9/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/9/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/9/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=9&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/08/06/where-information-lives%e2%80%a6/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>0</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
	</item>
		<item>
		<!-- Entry ?p=7: title, links, publication date, author, categories, guid. -->
		<title>NLP for free! NLP for fun!</title>
		<link>http://plushloony.wordpress.com/2009/07/31/nlp-for-free-nlp-for-fun/</link>
		<comments>http://plushloony.wordpress.com/2009/07/31/nlp-for-free-nlp-for-fun/#comments</comments>
		<pubDate>Fri, 31 Jul 2009 14:28:23 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>gate</category>
		<category>Information Extraction</category>
		<category>NLP</category>
		<category>Named Entity Extraction</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=7</guid>
		<description><![CDATA[I can’t say that I know a lot of services on the web that provide result of sophisticated natural language processing (NLP). Ok, there are huge search machines, news aggregators, plagiarism identification processors, some academic research projects and … what else?&#8230;Sure on the corporate and government level there are systems that are processing data like unstructured [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=7&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I can’t say that I know a lot of services on the web that provide result of sophisticated natural language processing (NLP). Ok, there are huge search machines, news aggregators, plagiarism identification processors, some academic research projects and … what else?&#8230;Sure on the corporate and government level there are systems that are processing data like unstructured customers’ feedback, communication data for security purposes, news etc, but NLP gives mostly nothing to average people. Nothing for having fun! Unlikely it’s hard to suggest cool problem to resolve using NLP methods.  I simply believe that not too many people know how interesting it is to work on them. Moreover, most part of software created for NLP and information extraction purposes is a subject of research and absolutely free. Don’t think that it’s ugly student-made programs, if you think so – take a look at <a href="http://gate.ac.uk">GATE</a> (General Architecture for Text Engineering) by Sheffield University.</p>
<p style="text-align:center;"><img class="aligncenter" title="GATE" src="http://gate.ac.uk/images/gate.gif" alt="" width="66" height="60" /></p>
<p>It’s really powerful open source software that already has dozens of extensions and could be used in mostly all text processing tasks. System is well documented and has preconfigured module called ANNIE to solve standard problem of annotating English text with morphological information, tokenizing, stemming, extracting named entities. Also it’s simple to write your own grammar rules to extract any kind of information you need. Try to play with it and may be you’d have an idea of how to get some value from it! I’d share some experience of using it in the further posts.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/7/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/7/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/7/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=7&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/07/31/nlp-for-free-nlp-for-fun/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>0</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
		<!-- Media RSS image from gate.ac.uk, titled "GATE". -->
		<media:content medium="image" url="http://gate.ac.uk/images/gate.gif">
			<media:title type="html">GATE</media:title>
		</media:content>
	</item>
		<item>
		<!-- Entry ?p=3: title, links, publication date, author, category, guid. -->
		<title>Paroles, paroles, paroles…</title>
		<link>http://plushloony.wordpress.com/2009/07/28/paroles-paroles-paroles/</link>
		<comments>http://plushloony.wordpress.com/2009/07/28/paroles-paroles-paroles/#comments</comments>
		<pubDate>Tue, 28 Jul 2009 12:08:42 +0000</pubDate>
		<dc:creator>plushloony</dc:creator>
		<category>Information Extraction</category>
		<!-- isPermaLink="false": the guid is an identifier, not the canonical post URL. -->
		<guid isPermaLink="false">http://plushloony.wordpress.com/?p=3</guid>
		<description><![CDATA[Don’t you think that there is a lot of absolutely useless information in the world? Information that is hard to call so. Terabytes of redundant characters…Take a look at science articles, PHD works, textbooks etc. All of them could be much thinner if their authors leave only main ideas and accurate proofs based on rules [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=3&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Don’t you think that there is a lot of absolutely useless information in the world? Information that is hard to call so. Terabytes of redundant characters…Take a look at science articles, PHD works, textbooks etc. All of them could be much thinner if their authors leave only main ideas and accurate proofs based on rules of formal logic. Even in some areas where is no place for gas, paper works stays full of empty sentences and redundant word constructions. This note is not an exception! It’s probably in human nature to generate twaddle and hide ideas and facts behind the wall made of words and secondary mind images.</p>
<p>It’s not a problem if the topic you are interested in is described in trusted, complete and the only source. You could allow yourself to spend hours or even days studying it. If you are professional you’d also find what you need in 1000 pages book. Even if two-three sources are enough to get result – context search would be a solution.  But what if search result for your query consists of hundreds of documents and you are not so familiar with a subject area?</p>
<p>There is a simple example – the review of a new gadget.  For an advanced internet user it’s an easy task to  get hundreds of related articles, identify most promising, complete and trustful and…finally you&#8217;d get subjective opinion of one or several “experts”.  Not sure that anyone will ever carefully read more than 3-4 reviews, or study badly organized or foreign language resources.</p>
<p>Some companies say that their products “make sense from content”. Sometimes they mean aggregation, search or data mining and analytics. How could we find facts and knowledge behind words and sentences? That would be a topic of some records in this Blog&#8230;</p>
<p>Do you have any examples of services that use same idea as the basis?</p>
<p>To be continued…</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/plushloony.wordpress.com/3/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/plushloony.wordpress.com/3/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/plushloony.wordpress.com/3/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=plushloony.wordpress.com&amp;blog=8765810&amp;post=3&amp;subd=plushloony&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://plushloony.wordpress.com/2009/07/28/paroles-paroles-paroles/feed/</wfw:commentRss>
		<!-- Comment count for this entry (slash module). -->
		<slash:comments>0</slash:comments>
		<!-- Media RSS image hosted on gravatar.com, titled "plushloony". -->
		<media:content medium="image" url="http://1.gravatar.com/avatar/d3997ae25afa54f25664de1326fde8f3?s=96&amp;d=identicon&amp;r=G">
			<media:title type="html">plushloony</media:title>
		</media:content>
	</item>
	</channel>
</rss>
