<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" href="http://blogs.msdn.com/utility/FeedStylesheets/rss.xsl" media="screen"?>
<!--
  RSS 2.0 feed for the "Microsoft Web N-Gram" blog.

  Extension namespaces (all declared once, on the root element):
    dc    : channel language and per-item author (dc:language, dc:creator)
    slash : per-item comment count (slash:comments)
    wfw   : per-item comment-feed URL (wfw:commentRss)

  Each item description holds an escaped HTML fragment (teaser paragraph,
  "read more" link and a 1x1 image). Keep every text node on a single line:
  whitespace inside title, description and category is data, so re-wrapping
  those elements changes the values consumers see.
-->
<rss version="2.0"
     xmlns:dc="http://purl.org/dc/elements/1.1/"
     xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
     xmlns:wfw="http://wellformedweb.org/CommentAPI/">
  <channel>
    <title>Microsoft Web N-Gram</title>
    <link>http://blogs.msdn.com/b/webngram/</link>
    <description>Bringing you web-scale language model data.  Web N-Gram is a joint project between Microsoft Bing and Microsoft Research.</description>
    <dc:language>en-US</dc:language>
    <generator>Telligent Evolution Platform Developer Build (Build: 5.6.50428.7875)</generator>
    <item>
      <title>Microsoft Research Speller Challenge is open for business</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2011/01/20/microsoft-research-speller-challenge-is-open-for-business.aspx</link>
      <pubDate>Fri, 21 Jan 2011 01:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10118417</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10118417</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2011/01/20/microsoft-research-speller-challenge-is-open-for-business.aspx#comments</comments>
      <description>&lt;p&gt;Some additional FAQs for the now-open Microsoft Research Speller Challenge.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2011/01/20/microsoft-research-speller-challenge-is-open-for-business.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10118417" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/REST/">REST</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/SOAP/">SOAP</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/speller+challenge/">speller challenge</category>
    </item>
    <item>
      <title>The dirty secret about large-vocabulary hashes</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/12/27/the-dirty-secret-about-large-vocabulary-hashes.aspx</link>
      <pubDate>Mon, 27 Dec 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10109263</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10109263</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/12/27/the-dirty-secret-about-large-vocabulary-hashes.aspx#comments</comments>
      <description>&lt;p&gt;Working with large lexicons means engineering trade-offs become necessary.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/12/27/the-dirty-secret-about-large-vocabulary-hashes.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10109263" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/lexicon/">lexicon</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/probability/">probability</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/tokenization/">tokenization</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/tokens/">tokens</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/performance/">performance</category>
    </item>
    <item>
      <title>Did you mean...Schwarzenegger?</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/12/15/did-you-mean-schwarzenegger.aspx</link>
      <pubDate>Wed, 15 Dec 2010 23:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10105566</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10105566</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/12/15/did-you-mean-schwarzenegger.aspx#comments</comments>
      <description>&lt;p&gt;Introducing the Speller Challenge, a contest from Microsoft Research and Bing.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/12/15/did-you-mean-schwarzenegger.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10105566" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/speller+challenge/">speller challenge</category>
    </item>
    <item>
      <title>Well, do ya, P(&lt;UNK&gt;)?</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/12/13/well-do-ya-p-lt-unk-gt.aspx</link>
      <pubDate>Mon, 13 Dec 2010 17:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10104120</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10104120</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/12/13/well-do-ya-p-lt-unk-gt.aspx#comments</comments>
      <description>&lt;p&gt;What happens when you encounter the unknown?&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/12/13/well-do-ya-p-lt-unk-gt.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10104120" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/lexicon/">lexicon</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/probability/">probability</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/language+modeling/">language modeling</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/unknown/">unknown</category>
    </item>
    <item>
      <title>Perf tips for using the N-Gram service with WCF</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/12/06/perf-tips-for-using-the-n-gram-service-with-wcf.aspx</link>
      <pubDate>Mon, 06 Dec 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10096294</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10096294</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/12/06/perf-tips-for-using-the-n-gram-service-with-wcf.aspx#comments</comments>
      <description>&lt;p&gt;Some simple performance tips that may speed up your WCF application.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/12/06/perf-tips-for-using-the-n-gram-service-with-wcf.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10096294" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/web+service/">web service</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/Models/">Models</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/SOAP/">SOAP</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/performance/">performance</category>
    </item>
    <item>
      <title>The messy business of tokenization</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/11/29/the-messy-business-of-tokenization.aspx</link>
      <pubDate>Mon, 29 Nov 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10095658</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10095658</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/11/29/the-messy-business-of-tokenization.aspx#comments</comments>
      <description>&lt;p&gt;Learn about some of the details of tokenization in our service&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/11/29/the-messy-business-of-tokenization.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10095658" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/web+service/">web service</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/probability/">probability</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/tokenization/">tokenization</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/tokens/">tokens</category>
    </item>
    <item>
      <title>Wordbreakingisacinchwithdata</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/11/22/wordbreakingisacinchwithdata.aspx</link>
      <pubDate>Mon, 22 Nov 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10087751</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10087751</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/11/22/wordbreakingisacinchwithdata.aspx#comments</comments>
      <description>&lt;p&gt;One use of our service is to break words based on n-gram probability info. &amp;nbsp;No linguistic knowledge necessary.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/11/22/wordbreakingisacinchwithdata.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10087751" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/probability/">probability</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/REST/">REST</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/Models/">Models</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/word+break/">word break</category>
    </item>
    <item>
      <title>The fluid language of the Web</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/11/15/the-fluid-language-of-the-web-and-or-the-rise-of-trackers.aspx</link>
      <pubDate>Mon, 15 Nov 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10085084</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>1</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10085084</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/11/15/the-fluid-language-of-the-web-and-or-the-rise-of-trackers.aspx#comments</comments>
      <description>&lt;p&gt;Top 100K words for Apr10 body stream is now available for analysis.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/11/15/the-fluid-language-of-the-web-and-or-the-rise-of-trackers.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10085084" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/lexicon/">lexicon</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/language+modeling/">language modeling</category>
    </item>
    <item>
      <title>Using the MicrosoftNgram Python Module</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/11/08/using-the-microsoftngram-python-module.aspx</link>
      <pubDate>Mon, 08 Nov 2010 14:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10080119</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>1</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10080119</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/11/08/using-the-microsoftngram-python-module.aspx#comments</comments>
      <description>&lt;p&gt;A quick tutorial on the MicrosoftNgram Python library.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/11/08/using-the-microsoftngram-python-module.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10080119" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/ngram/">ngram</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/python/">python</category>
    </item>
    <item>
      <title>Who doesn't like models?</title>
      <link>http://blogs.msdn.com/b/webngram/archive/2010/11/01/who-doesn-t-like-models.aspx</link>
      <pubDate>Mon, 01 Nov 2010 13:00:00 GMT</pubDate>
      <guid isPermaLink="false">91d46819-8472-40ad-a661-2c78acb4018c:10072714</guid>
      <dc:creator>Chris Thrasher</dc:creator>
      <slash:comments>0</slash:comments>
      <wfw:commentRss>http://blogs.msdn.com/b/webngram/rsscomments.aspx?WeblogPostID=10072714</wfw:commentRss>
      <comments>http://blogs.msdn.com/b/webngram/archive/2010/11/01/who-doesn-t-like-models.aspx#comments</comments>
      <description>&lt;p&gt;Different models reflect different writing styles on the web.&lt;/p&gt;...(&lt;a href="http://blogs.msdn.com/b/webngram/archive/2010/11/01/who-doesn-t-like-models.aspx"&gt;read more&lt;/a&gt;)&lt;img src="http://blogs.msdn.com/aggbug.aspx?PostID=10072714" width="1" height="1"&gt;</description>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/language+modeling/">language modeling</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/REST/">REST</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/Models/">Models</category>
      <category domain="http://blogs.msdn.com/b/webngram/archive/tags/SOAP/">SOAP</category>
    </item>
  </channel>
</rss>