<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>LingPipe Blog</title>
	<atom:link href="http://lingpipe-blog.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://lingpipe-blog.com</link>
	<description>Natural Language Processing and Text Analytics</description>
	<lastBuildDate>Fri, 24 May 2013 06:53:13 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='lingpipe-blog.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://s2.wp.com/i/buttonw-com.png</url>
		<title>LingPipe Blog</title>
		<link>http://lingpipe-blog.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://lingpipe-blog.com/osd.xml" title="LingPipe Blog" />
	<atom:link rel='hub' href='http://lingpipe-blog.com/?pushpress=hub'/>
		<item>
		<title>All Bayesian Models are Generative (in Theory)</title>
		<link>http://lingpipe-blog.com/2013/05/23/all-bayesian-models-are-generative-in-theory/</link>
		<comments>http://lingpipe-blog.com/2013/05/23/all-bayesian-models-are-generative-in-theory/#comments</comments>
		<pubDate>Thu, 23 May 2013 18:41:20 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6631</guid>
		<description><![CDATA[[This post is a followup to my previous post, Generative vs. discriminative; Bayesian vs. frequentist.] I had a brief chat with Andrew Gelman about the topic of generative vs. discriminative models. It came up when I was asking him why he didn&#8217;t like the frequentist semicolon notation for variables that are not random. He said [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6631&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/05/23/all-bayesian-models-are-generative-in-theory/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>The Latin1 Transcoding Trick for Ant</title>
		<link>http://lingpipe-blog.com/2013/04/21/the-latin1-transcoding-trick-for-ant/</link>
		<comments>http://lingpipe-blog.com/2013/04/21/the-latin1-transcoding-trick-for-ant/#comments</comments>
		<pubDate>Sun, 21 Apr 2013 22:31:55 +0000</pubDate>
		<dc:creator>mitzimorris</dc:creator>
				<category><![CDATA[Java]]></category>
		<category><![CDATA[Mitzi's Blog]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6614</guid>
		<description><![CDATA[A while back Bob blogged about The Latin1 Transcoding Trick for Java Servlets, etc. Suppose you have an API that insists on converting an as-yet-unseen stream of bytes to characters for you (e.g. servlets), but lets you set the character encoding if you want. Because Latin1 (officially, ISO-8859-1) maps bytes one-to-one to Unicode code points, [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6614&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/04/21/the-latin1-transcoding-trick-for-ant/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://2.gravatar.com/avatar/5148afd2ad595dd1a9a791e06a9af07a?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">mitzimorris</media:title>
		</media:content>
	</item>
		<item>
		<title>Generative vs. Discriminative; Bayesian vs. Frequentist</title>
		<link>http://lingpipe-blog.com/2013/04/12/generative-vs-discriminative-bayesian-vs-frequentist/</link>
		<comments>http://lingpipe-blog.com/2013/04/12/generative-vs-discriminative-bayesian-vs-frequentist/#comments</comments>
		<pubDate>Fri, 12 Apr 2013 20:19:49 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6601</guid>
		<description><![CDATA[[There's now a followup post, All Bayesian models are generative (in theory).] I was helping Boyi Xie get ready for his Ph.D. qualifying exams in computer science at Columbia and at one point I wrote the following diagram on the board to lay out the generative/discriminative and Bayesian/frequentist distinctions in what gets modeled. To keep [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6601&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/04/12/generative-vs-discriminative-bayesian-vs-frequentist/feed/</wfw:commentRss>
		<slash:comments>21</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Mean-Field Variational Inference Made Easy</title>
		<link>http://lingpipe-blog.com/2013/03/25/mean-field-variational-inference-made-easy/</link>
		<comments>http://lingpipe-blog.com/2013/03/25/mean-field-variational-inference-made-easy/#comments</comments>
		<pubDate>Mon, 25 Mar 2013 18:14:37 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6514</guid>
		<description><![CDATA[I had the hardest time trying to understand variational inference. All of the presentations I&#8217;ve seen (MacKay, Bishop, Wikipedia, Gelman&#8217;s draft for the third edition of Bayesian Data Analysis) are deeply tied up with the details of a particular model being fit. I wanted to see the algorithm and get the big picture before being [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6514&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/03/25/mean-field-variational-inference-made-easy/feed/</wfw:commentRss>
		<slash:comments>7</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Anyone Want to Write an O&#8217;Reilly Book on NLP with Java?</title>
		<link>http://lingpipe-blog.com/2013/02/21/want-write-oreilly-book-nlp-java/</link>
		<comments>http://lingpipe-blog.com/2013/02/21/want-write-oreilly-book-nlp-java/#comments</comments>
		<pubDate>Thu, 21 Feb 2013 19:52:58 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Java]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6476</guid>
		<description><![CDATA[Mitzi and I pitched O&#8217;Reilly books a revision of the Text Processing in Java book that she&#8217;s been finishing off. The response from their editor was that they&#8217;d love to have an NLP book based on Java, but what we provided looked like everything-but-the-NLP you&#8217;d need for such a book. Insightful, these editors. That&#8217;s exactly [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6476&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/02/21/want-write-oreilly-book-nlp-java/feed/</wfw:commentRss>
		<slash:comments>5</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Bayesian Inference for LDA is Intractable</title>
		<link>http://lingpipe-blog.com/2013/02/18/bayesian-inference-for-lda-is-intractable/</link>
		<comments>http://lingpipe-blog.com/2013/02/18/bayesian-inference-for-lda-is-intractable/#comments</comments>
		<pubDate>Mon, 18 Feb 2013 22:42:38 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[LingPipe in Use]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6422</guid>
		<description><![CDATA[Bayesian inference for LDA is intractable. And I mean really really deeply intractable in a way that nobody has figured or is ever likely to figure out how to solve. Before sending me a &#8220;but, but, but, &#8230;&#8221; reply, you might want to bone up on the technical definition of Bayesian inference, which is a [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6422&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2013/02/18/bayesian-inference-for-lda-is-intractable/feed/</wfw:commentRss>
		<slash:comments>9</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Another Linguistic Corpus Collection Game</title>
		<link>http://lingpipe-blog.com/2012/11/12/another-linguistic-corpus-collection-game/</link>
		<comments>http://lingpipe-blog.com/2012/11/12/another-linguistic-corpus-collection-game/#comments</comments>
		<pubDate>Mon, 12 Nov 2012 22:45:01 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Data Annotation]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6192</guid>
		<description><![CDATA[Johan Bos and his crew at University of Groningen have a new suite of games aimed at linguistic data data collection. You can find them at: http://www.wordrobe.org/ Wordrobe is currently hosting four games. Twins is aimed at part-of-speech tagging, Senses is for word sense annotation, Pointers for coref data, and Names for proper name classification. [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6192&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2012/11/12/another-linguistic-corpus-collection-game/feed/</wfw:commentRss>
		<slash:comments>3</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Upgrading from Beta-Binomial to Logistic Regression</title>
		<link>http://lingpipe-blog.com/2012/10/30/upgrading-from-beta-binomial-to-logistic-regression/</link>
		<comments>http://lingpipe-blog.com/2012/10/30/upgrading-from-beta-binomial-to-logistic-regression/#comments</comments>
		<pubDate>Tue, 30 Oct 2012 18:00:02 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6173</guid>
		<description><![CDATA[Bernoulli Model Consider the following very simple model of drawing the components of a binary random N-vector y i.i.d. from a Bernoulli distribution with chance of success theta. data { int N; // number of items int y[N]; // binary outcome for item i } parameters { real theta; // Prob(y[n]=1) = theta } model [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6173&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2012/10/30/upgrading-from-beta-binomial-to-logistic-regression/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>
	</item>
		<item>
		<title>Mystery Novel with Natural Language Processing</title>
		<link>http://lingpipe-blog.com/2012/10/24/mystery-novel-with-natural-language-processing/</link>
		<comments>http://lingpipe-blog.com/2012/10/24/mystery-novel-with-natural-language-processing/#comments</comments>
		<pubDate>Wed, 24 Oct 2012 19:30:56 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Reviews]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6108</guid>
		<description><![CDATA[For those of you who like mystery novels, Mitzi&#8217;s just written one. The added bonus for readers of this blog is that there&#8217;s natural language processing involved in the detective work (I don&#8217;t want to give too much away, so I can&#8217;t tell you how). Poetic Justice is in the cozy mystery sub-genre, where the [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6108&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2012/10/24/mystery-novel-with-natural-language-processing/feed/</wfw:commentRss>
		<slash:comments>5</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>

		<media:content url="http://colloquial.com/images/pj_cover.jpg" medium="image">
			<media:title type="html">Mitzi Morris, Poetic Justice Cover</media:title>
		</media:content>
	</item>
		<item>
		<title>High Kappa Values are not Necessary for High Quality Corpora</title>
		<link>http://lingpipe-blog.com/2012/10/02/high-kappa-not-necessary-high-quality-corpora/</link>
		<comments>http://lingpipe-blog.com/2012/10/02/high-kappa-not-necessary-high-quality-corpora/#comments</comments>
		<pubDate>Tue, 02 Oct 2012 22:34:45 +0000</pubDate>
		<dc:creator>Bob Carpenter</dc:creator>
				<category><![CDATA[Carp's Blog]]></category>
		<category><![CDATA[Data Annotation]]></category>
		<category><![CDATA[Statistics]]></category>

		<guid isPermaLink="false">http://lingpipe-blog.com/?p=6131</guid>
		<description><![CDATA[I&#8217;m not a big fan of kappa statistics, to say the least. I point out several problems with kappa statistics right after the initial studies in this talk on annotation modeling. I just got back from another talk on annotation where I was ranting again about the uselessness of kappa. In particular, this blog post [&#8230;]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=lingpipe-blog.com&#038;blog=2555819&#038;post=6131&#038;subd=lingpipe&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
		<wfw:commentRss>http://lingpipe-blog.com/2012/10/02/high-kappa-not-necessary-high-quality-corpora/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/77f083909d955b715846250a33340a14?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">lingpipe</media:title>
		</media:content>

		<media:content url="http://lingpipe.files.wordpress.com/2012/10/prev_vs_accuracy_kappa.png" medium="image">
			<media:title type="html">Kappa for varying prevalences and accuracies</media:title>
		</media:content>

		<media:content url="http://lingpipe.files.wordpress.com/2012/10/kappa_plot_whole.png" medium="image">
			<media:title type="html">Kappa for varying prevalences and accuracies</media:title>
		</media:content>
	</item>
	</channel>
</rss>
