<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>Cornelius Puschmann&#039;s Blog &#187; Things I want to look up later</title>
	<atom:link href="http://blog.ynada.com/category/things-i-want-to-look-up-later/feed" rel="self" type="application/rss+xml" />
	<link>http://blog.ynada.com</link>
	<description>My new blog on Linguistics, Digital Humanities and Scholarly Communication on the Internet</description>
	<lastBuildDate>Wed, 18 Jan 2012 17:54:42 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.3.1</generator>
		<item>
		<title>NLTK corpora</title>
		<link>http://blog.ynada.com/95</link>
		<comments>http://blog.ynada.com/95#comments</comments>
		<pubDate>Sat, 11 Jul 2009 13:26:11 +0000</pubDate>
		<dc:creator>cornelius</dc:creator>
				<category><![CDATA[Things I want to look up later]]></category>
		<category><![CDATA[nltk]]></category>

		<guid isPermaLink="false">http://blog.ynada.com/?p=95</guid>
		<description><![CDATA[[*] alpino&#8230;&#8230;&#8230;&#8230;.. Alpino Dutch Treebank [*] nombank.1.0&#8230;&#8230;&#8230; NomBank Corpus 1.0 [*] abc&#8230;&#8230;&#8230;&#8230;&#8230;.. Australian Broadcasting Commission 2006 [*] maxent_ne_chunker&#8230; ACE Named Entity Chunker (Maximum entropy) [*] conll2000&#8230;&#8230;&#8230;.. CONLL 2000 Chunking Corpus [*] chat80&#8230;&#8230;&#8230;&#8230;.. Chat-80 Data Files [*] brown&#8230;&#8230;&#8230;&#8230;&#8230; Brown Corpus [*] brown_tei&#8230;&#8230;&#8230;.. Brown Corpus (TEI XML Version) [*] cmudict&#8230;&#8230;&#8230;&#8230;. The Carnegie Mellon Pronouncing Dictionary (0.6) [*] [...]]]></description>
			<content:encoded><![CDATA[<p>[*] alpino&#8230;&#8230;&#8230;&#8230;.. Alpino Dutch Treebank<br />
[*] nombank.1.0&#8230;&#8230;&#8230; NomBank Corpus 1.0<br />
[*] abc&#8230;&#8230;&#8230;&#8230;&#8230;.. Australian Broadcasting Commission 2006<br />
[*] maxent_ne_chunker&#8230; ACE Named Entity Chunker (Maximum entropy)<br />
[*] conll2000&#8230;&#8230;&#8230;.. CONLL 2000 Chunking Corpus<br />
[*] chat80&#8230;&#8230;&#8230;&#8230;.. Chat-80 Data Files<br />
[*] brown&#8230;&#8230;&#8230;&#8230;&#8230; Brown Corpus<br />
[*] brown_tei&#8230;&#8230;&#8230;.. Brown Corpus (TEI XML Version)<br />
[*] cmudict&#8230;&#8230;&#8230;&#8230;. The Carnegie Mellon Pronouncing Dictionary (0.6)<br />
[*] biocreative_ppi&#8230;.. BioCreAtIvE (Critical Assessment of Information<br />
Extraction Systems in Biology)<br />
[*] cess_cat&#8230;&#8230;&#8230;&#8230; CESS-CAT Treebank<br />
[*] conll2002&#8230;&#8230;&#8230;.. CONLL 2002 Named Entity Recognition Corpus<br />
[*] conll2007&#8230;&#8230;&#8230;.. Dependency Treebanks from CoNLL 2007 (Catalan<br />
and Basque Subset)<br />
[*] city_database&#8230;&#8230;. City Database<br />
[*] indian&#8230;&#8230;&#8230;&#8230;.. Indian Language POS-Tagged Corpus<br />
[*] shakespeare&#8230;&#8230;&#8230; Shakespeare XML Corpus Sample<br />
[*] dependency_treebank. Dependency Parsed Treebank<br />
[*] inaugural&#8230;&#8230;&#8230;.. C-Span Inaugural Address Corpus<br />
[*] ieer&#8230;&#8230;&#8230;&#8230;&#8230;. NIST IE-ER DATA SAMPLE<br />
[*] gutenberg&#8230;&#8230;&#8230;.. Project Gutenberg Selections<br />
[*] gazetteers&#8230;&#8230;&#8230;. Gazetteer Lists<br />
[*] names&#8230;&#8230;&#8230;&#8230;&#8230; Names Corpus, Version 1.3 (1994-03-29)<br />
[*] mac_morpho&#8230;&#8230;&#8230;. MAC-MORPHO: Brazilian Portuguese news text with<br />
part-of-speech tags<br />
[*] movie_reviews&#8230;&#8230;. Sentiment Polarity Dataset Version 2.0<br />
[*] cess_esp&#8230;&#8230;&#8230;&#8230; CESS-ESP Treebank<br />
[*] genesis&#8230;&#8230;&#8230;&#8230;. Genesis Corpus<br />
[*] kimmo&#8230;&#8230;&#8230;&#8230;&#8230; PC-KIMMO Data Files<br />
[*] floresta&#8230;&#8230;&#8230;&#8230; Portuguese Treebank<br />
[*] qc&#8230;&#8230;&#8230;&#8230;&#8230;&#8230; Experimental Data for Question Classification<br />
[*] nps_chat&#8230;&#8230;&#8230;&#8230; NPS Chat<br />
[*] paradigms&#8230;&#8230;&#8230;.. Paradigm Corpus<br />
[*] pil&#8230;&#8230;&#8230;&#8230;&#8230;.. The Patient Information Leaflet (PIL) Corpus<br />
[*] stopwords&#8230;&#8230;&#8230;.. Stopwords Corpus<br />
[*] propbank&#8230;&#8230;&#8230;&#8230; Proposition Bank Corpus 1.0<br />
[ ] pe08&#8230;&#8230;&#8230;&#8230;&#8230;. Cross-Framework and Cross-Domain Parser<br />
Evaluation Shared Task<br />
[*] state_union&#8230;&#8230;&#8230; C-Span State of the Union Address Corpus<br />
[*] sinica_treebank&#8230;.. Sinica Treebank Corpus Sample<br />
[*] ppattach&#8230;&#8230;&#8230;&#8230; Prepositional Phrase Attachment Corpus<br />
[*] senseval&#8230;&#8230;&#8230;&#8230; SENSEVAL 2 Corpus: Sense Tagged Text<br />
[*] problem_reports&#8230;.. Problem Report Corpus<br />
[*] reuters&#8230;&#8230;&#8230;&#8230;. The Reuters-21578 benchmark corpus, ApteMod<br />
version<br />
[*] swadesh&#8230;&#8230;&#8230;&#8230;. Swadesh Wordlists<br />
[*] rte&#8230;&#8230;&#8230;&#8230;&#8230;.. PASCAL RTE Challenges 1, 2, and 3<br />
[*] udhr&#8230;&#8230;&#8230;&#8230;&#8230;. Universal Declaration of Human Rights Corpus<br />
[*] treebank&#8230;&#8230;&#8230;&#8230; Penn Treebank Sample<br />
[*] unicode_samples&#8230;.. Unicode Samples<br />
[*] verbnet&#8230;&#8230;&#8230;&#8230;. VerbNet Lexicon, Version 2.1<br />
[*] wordnet_ic&#8230;&#8230;&#8230;. WordNet-InfoContent<br />
[*] book_grammars&#8230;&#8230;. Grammars from NLTK Book<br />
[*] words&#8230;&#8230;&#8230;&#8230;&#8230; Word Lists<br />
[*] punkt&#8230;&#8230;&#8230;&#8230;&#8230; Punkt Tokenizer Models<br />
[*] wordnet&#8230;&#8230;&#8230;&#8230;. WordNet<br />
[*] large_grammars&#8230;&#8230; Large context-free grammars for parser<br />
comparison<br />
[*] ycoe&#8230;&#8230;&#8230;&#8230;&#8230;. York-Toronto-Helsinki Parsed Corpus of Old<br />
English Prose<br />
[*] spanish_grammars&#8230;. Grammars for Spanish<br />
[*] rslp&#8230;&#8230;&#8230;&#8230;&#8230;. RSLP Stemmer (Removedor de Sufixos da Lingua<br />
Portuguesa)<br />
[*] tagsets&#8230;&#8230;&#8230;&#8230;. Help on Tagsets<br />
[*] sample_grammars&#8230;.. Sample Grammars<br />
[*] timit&#8230;&#8230;&#8230;&#8230;&#8230; TIMIT Corpus Sample<br />
[*] maxent_treebank_pos_tagger Treebank Part of Speech Tagger (Maximum entropy)<br />
[*] toolbox&#8230;&#8230;&#8230;&#8230;. Toolbox Sample Files<br />
[*] basque_grammars&#8230;.. Grammars for Basque<br />
[*] hmm_treebank_pos_tagger Treebank Part of Speech Tagger (HMM)<br />
[*] webtext&#8230;&#8230;&#8230;&#8230;. Web Text Corpus<br />
[*] switchboard&#8230;&#8230;&#8230; Switchboard Corpus Sample</p>
]]></content:encoded>
			<wfw:commentRss>http://blog.ynada.com/95/feed</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>NLTK modules and their functions</title>
		<link>http://blog.ynada.com/92</link>
		<comments>http://blog.ynada.com/92#comments</comments>
		<pubDate>Sat, 11 Jul 2009 12:09:19 +0000</pubDate>
		<dc:creator>cornelius</dc:creator>
				<category><![CDATA[Things I want to look up later]]></category>
		<category><![CDATA[nltk]]></category>

		<guid isPermaLink="false">http://blog.ynada.com/?p=92</guid>
		<description><![CDATA[Accessing corpora: nltk.corpus String processing: nltk.tokenize, nltk.stem Collocation discovery: nltk.collocations Part-of-speech tagging: nltk.tag Classification: nltk.classify, nltk.cluster Chunking: nltk.chunk Parsing: nltk.parse Semantic interpretation: nltk.sem, nltk.inference Evaluation metrics: nltk.metrics Probability and estimation: nltk.probability Applications: nltk.app, nltk.chat]]></description>
			<content:encoded><![CDATA[<p>Accessing corpora: nltk.corpus<br />
String processing: nltk.tokenize, nltk.stem<br />
Collocation discovery: nltk.collocations<br />
Part-of-speech tagging: nltk.tag<br />
Classification: nltk.classify, nltk.cluster<br />
Chunking: nltk.chunk<br />
Parsing: nltk.parse<br />
Semantic interpretation: nltk.sem, nltk.inference<br />
Evaluation metrics: nltk.metrics<br />
Probability and estimation: nltk.probability<br />
Applications: nltk.app, nltk.chat</p>
]]></content:encoded>
			<wfw:commentRss>http://blog.ynada.com/92/feed</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
	</channel>
</rss>

