<?xml version="1.0"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
	<id>https://www.aclweb.org/aclwiki/api.php?action=feedcontributions&amp;feedformat=atom&amp;user=Sean+Bethard</id>
	<title>ACL Wiki - User contributions [en]</title>
	<link rel="self" type="application/atom+xml" href="https://www.aclweb.org/aclwiki/api.php?action=feedcontributions&amp;feedformat=atom&amp;user=Sean+Bethard"/>
	<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/Special:Contributions/Sean_Bethard"/>
	<updated>2026-05-01T20:54:36Z</updated>
	<subtitle>User contributions</subtitle>
	<generator>MediaWiki 1.43.6</generator>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=13253</id>
		<title>User:Sean Bethard</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=13253"/>
		<updated>2021-11-16T21:17:54Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: &lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;UMass Linguistics. Brandeis CS.&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=13205</id>
		<title>User:Sean Bethard</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=13205"/>
		<updated>2021-07-11T16:12:04Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Update user page&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;UMass Linguistics. Brandeis Lab for Linguistics and Computation. Tulsa Language Technology Group.&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Multilingual_resources&amp;diff=12671</id>
		<title>Multilingual resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Multilingual_resources&amp;diff=12671"/>
		<updated>2019-09-12T09:03:49Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Change *[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)] to *[http://nltk.net Natural Language Toolkit (NLTK)], move to Multilingual resources, Collaborative projects.&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;For individual languages, see [[List of resources by language]].&lt;br /&gt;
&lt;br /&gt;
* [[Multilingual Dictionaries]] - including Bilingual Dictionaries&lt;br /&gt;
* [[Multilingual Corpora]] - including Bilingual Corpora&lt;br /&gt;
* [[Multilingual Tools and Software]] - including Bilingual Tools and Software&lt;br /&gt;
&lt;br /&gt;
== Collaborative projects ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[http://www.language-archives.org/ OLAC: Open Language Archives Community]&lt;br /&gt;
:An international partnership of institutions and individuals who are creating a worldwide virtual library of language resources&lt;br /&gt;
;[http://www.omegawiki.org/ OmegaWiki]&lt;br /&gt;
:A collaborative project to produce a free (as in free software) multilingual resource in every language, with lexicological, terminological and thesaurus information&lt;br /&gt;
;[http://nltk.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
:An amazing library to play with natural language&lt;br /&gt;
&lt;br /&gt;
== Lexical databases ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[https://www.mpi-inf.mpg.de/yago-naga/uwn/ UWN]: Multilingual wordnet covering over 200 languages, freely available as a TSV file&lt;br /&gt;
&lt;br /&gt;
== Weblogs ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[http://www.dunglish.nl/ Dunglish (Dutch &amp;amp; English)]&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Multilingual]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12670</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12670"/>
		<updated>2019-09-12T09:00:35Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Change *[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)] to *[http://nltk.net Natural Language Toolkit (NLTK)], move to Multilingual resources, Collaborative projects.&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
* Missing items are denoted with †.&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser]† &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts]† &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases]†  &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more]† &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval]†  &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet]†&lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names]† &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database]† &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3]&lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository]†&lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus]†&lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial]†&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.]†&lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]†&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]†&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 2000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]†&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]†&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramon Piero Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12669</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12669"/>
		<updated>2019-09-12T08:52:31Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Update missing items; last item checked: Telemakus.&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
* Missing items are denoted with †.&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser]† &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts]† &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases]†  &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more]† &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval]†  &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet]†&lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names]† &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database]† &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3]&lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository]†&lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus]†&lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial]†&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.]†&lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]†&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]†&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]†&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]†&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=12668</id>
		<title>User:Sean Bethard</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=User:Sean_Bethard&amp;diff=12668"/>
		<updated>2019-09-12T08:33:11Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: &lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;UMass Linguistics. Brandeis CS.&lt;br /&gt;
NLP at Insight Engines, IBM Watson, Brigham and Women&#039;s Hospital.&lt;br /&gt;
Working on NLU, dialogue, question answering.&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12667</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12667"/>
		<updated>2019-09-12T08:29:26Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Update missing items; last item checked: MultiWordNet.&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
* Missing items are denoted with †.&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser]† &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts]† &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases]†  &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more]† &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval]†  &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet]†&lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names]† &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database]† &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3]&lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet]† &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]†&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]†&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]†&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]†&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12664</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12664"/>
		<updated>2019-09-09T04:49:45Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Items that start with the letter &amp;quot;A&amp;quot;: 24. Items that start with the letter &amp;quot;A&amp;quot; and are missing: 21.&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
* Missing items are denoted with †.&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator]†  &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]†&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]†&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]†&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]†&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]†&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]†&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]†&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Dutch&amp;diff=12663</id>
		<title>Resources for Dutch</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Dutch&amp;diff=12663"/>
		<updated>2019-09-06T02:04:49Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] from Uncategorized resources to Resources for Dutch&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;== Corpora ==&lt;br /&gt;
* [http://ucts.uniba.sk/aranea_about/ Araneum Nederlandicum], Gigaword Dutch web corpus&lt;br /&gt;
* [http://corpora.informatik.uni-leipzig.de/ Dutch Plain text and Co-occurrences at LCC]&lt;br /&gt;
* [http://www.statmt.org/europarl Europarl corpus] - sentence-aligned with English&lt;br /&gt;
* [http://www.clips.uantwerpen.be/datasets/csi-corpus CLiPS Stylometry Investigation (CSI) corpus] - multi-purpose text corpus, main use in stylometry&lt;br /&gt;
* [http://ufal.mff.cuni.cz/hamledt HamleDT], harmonized dependency treebanks of many languages, common annotation style.&lt;br /&gt;
&lt;br /&gt;
== Tools ==&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/alp/Alpino/ Dutch HPSG-based parser] Includes the Alpino treebank (7137 sentences, newspaper, manually corrected)&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
== Grammars ==&lt;br /&gt;
* [[Generation grammars|KPML generation grammar]]&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Dutch]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12662</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12662"/>
		<updated>2019-09-06T02:04:09Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] from Uncategorized resources to Resources for Dutch&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramon Piero Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Korean&amp;diff=12661</id>
		<title>Resources for Korean</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Korean&amp;diff=12661"/>
		<updated>2019-09-05T14:28:25Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] (broken link) and *[http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean] from Uncategorized resources to Resources for Korean&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;;[http://corpora.informatik.uni-leipzig.de/ Korean plain text and Co-occurrences at LCC]&lt;br /&gt;
;[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator]&lt;br /&gt;
;[http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12660</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12660"/>
		<updated>2019-09-05T14:28:16Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] (broken link) and *[http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean] from Uncategorized resources to Resources for Korean&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 2000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Multilingual_resources&amp;diff=12659</id>
		<title>Multilingual resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Multilingual_resources&amp;diff=12659"/>
		<updated>2019-09-05T13:37:24Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://www.language-archives.org/ OLAC: Open Language Archives Community] from Uncategorized resources to Multilingual resources; remove Related resources section; add sections for collaborative projects, lexical databases and weblogs&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;For individual languages, see [[List of resources by language]].&lt;br /&gt;
&lt;br /&gt;
* [[Multilingual Dictionaries]] - including Bilingual Dictionaries&lt;br /&gt;
* [[Multilingual Corpora]] - including Bilingual Corpora&lt;br /&gt;
* [[Multilingual Tools and Software]] - including Bilingual Tools and Software&lt;br /&gt;
&lt;br /&gt;
== Collaborative projects ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[http://www.language-archives.org/ OLAC: Open Language Archives Community]&lt;br /&gt;
:An international partnership of institutions and individuals who are creating a worldwide virtual library of language resources&lt;br /&gt;
;[http://www.omegawiki.org/ OmegaWiki]&lt;br /&gt;
:A collaborative project to produce a free (as in free software) multilingual resource in every language, with lexicological, terminological and thesaurus information&lt;br /&gt;
&lt;br /&gt;
== Lexical databases ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[https://www.mpi-inf.mpg.de/yago-naga/uwn/ UWN]: Multilingual wordnet covering over 200 languages, freely available as a TSV file&lt;br /&gt;
&lt;br /&gt;
== Weblogs ==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
;[http://www.dunglish.nl/ Dunglish (Dutch &amp;amp; English)]&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Multilingual]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12658</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12658"/>
		<updated>2019-09-05T13:30:16Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Change *[http://www.ldc.upenn.edu/exploration/survey.html A Survey of Open Language Archives] (broken link) to *[http://www.language-archives.org/ OLAC: Open Language Archives Community] and move to Multilingual resources&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Multilingual_Corpora&amp;diff=12641</id>
		<title>Multilingual Corpora</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Multilingual_Corpora&amp;diff=12641"/>
		<updated>2019-09-03T01:25:01Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Add TalkBank&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;This page lists &#039;&#039;multilingual&#039;&#039; corpora. For &#039;&#039;monolingual&#039;&#039; corpora, see [[List of resources by language]].&lt;br /&gt;
&lt;br /&gt;
See also [[Multilingual resources]].&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
*[http://wt.jrc.it/lt/Acquis/ ACQUIS COMMUNAUTAIRE Multilingual Corpus]&lt;br /&gt;
*[http://www.kun.nl/celex CELEX - The Dutch Center for Lexical Information]&lt;br /&gt;
*[https://childes.talkbank.org/ CHILDES - Child Language Data Exchange System] (component of [https://talkbank.org TalkBank])&lt;br /&gt;
*[http://sli.uvigo.es/CLUVI/ CLUVI Corpus (Galician-English-Spanish-French parallel corpus)]&lt;br /&gt;
*[http://www.cdc.gov/ncidod/sars/languages.htm Centre for Disease Control - Chinese, French, Japanese, Spanish info on SARS]&lt;br /&gt;
*[http://www.linguateca.pt/COMPARA/ COMPARA corpus]&lt;br /&gt;
*[http://www.debian.org/international/ Debian free software community]&lt;br /&gt;
*[http://www.ling.lancs.ac.uk/corplang/emille EMILLE corpus]&lt;br /&gt;
*[http://www.statmt.org/europarl/ European Parliament Proceedings Parallel Corpus 1996-2003]&lt;br /&gt;
*[http://www.illc.uva.nl/EuroWordNet EuroWordNet]&lt;br /&gt;
*[http://glossa.fltr.ucl.ac.be/ GlossaNet]&lt;br /&gt;
*[http://ufal.mff.cuni.cz/hamledt HamleDT], harmonized dependency treebanks of many languages, common annotation style.&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/CatalogEntry.jsp?catalogId=LDC95T20 Hansard French-English parallel corpus]&lt;br /&gt;
*[http://www.tu-chemnitz.de/phil/InternetGrammar/ Learner Behaviour on the Internet]&lt;br /&gt;
*[http://corpora.informatik.uni-leipzig.de Leipzig Corpora Collection: Large monolingual raw corpora for 17+ languages, free downloads]&lt;br /&gt;
*[http://www.coli.uni-saarland.de/~gparis/LMD-TAZ_corpus/ Le Monde Diplomatique-Die Tageszeitung Translation Corpus] - French-German, aligned (parallel)&lt;br /&gt;
*[http://muchmore.dfki.de/resources1.htm MuchMore Springer Bilingual Corpus]&lt;br /&gt;
*[http://nl.ijs.si/ME/ MULTEXT-East: Multilingual Corpora for Eastern and Central European Languages]&lt;br /&gt;
*[http://tcc.itc.it/people/forner/multilingualcorpora.html Multilingual Corpora: Available Resources]&lt;br /&gt;
* [http://www.csse.monash.edu.au/~jwb/tanakacorpus.html Tanaka Corpus: Japanese-English sentence pairs]&lt;br /&gt;
*[http://multisemcor.itc.it MultiSemCor]&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/Newspapers.html Newspapers on the Internet]&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS - an open source parallel corpus]&lt;br /&gt;
*[http://langbank.engl.polyu.edu.hk/indexl.html PolyU Language Bank]&lt;br /&gt;
*[http://register.consilium.eu.int/ Public registry of the Council of the EU]&lt;br /&gt;
*[http://www.multilingual.com/allen51.htm The Bible as a Resource for Translation Software]&lt;br /&gt;
*[http://www.cogsci.ed.ac.uk/elsnet/eci.html The ECI Multilingual corpus]&lt;br /&gt;
*[http://www.fida.net/ Slovenian Corpus FIDA] and [http://www.fidaplus.net/ FIDA+]&lt;br /&gt;
*[http://www.ling.su.se/DaLi/research/smultron/index.htm SMULTRON Corpus] parallel treebank of English, German and Swedish&lt;br /&gt;
*[https://talkbank.org The TalkBank System]&lt;br /&gt;
*[http://www.unhchr.ch/udhr/index.htm UN declaration of human rights in multiple languages]&lt;br /&gt;
*[http://conferences.unite.un.org/UNCorpus/ UN parallel corpora]&lt;br /&gt;
*[http://www.euromatrixplus.net/multi-un/ UN parallel corpora]&lt;br /&gt;
*[http://www-igm.univ-mlv.fr/~unitex/ UNITEX]&lt;br /&gt;
*[http://www.u-grenoble3.fr/kraif/liens.htm Useful links about parallel corpora, by Olivier Kraif]&lt;br /&gt;
*[http://wacky.sslmit.unibo.it/ WaCky Project]&lt;br /&gt;
*[http://www.wortschatz.uni-leipzig.de/html/wliste.html Wortlisten: spoken German, English, French, and Dutch]&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Multilingual]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Multilingual_Corpora&amp;diff=12640</id>
		<title>Multilingual Corpora</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Multilingual_Corpora&amp;diff=12640"/>
		<updated>2019-09-03T01:17:59Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Change *[http://childes.psy.cmu.edu/ The Childes Corpus - Children&amp;#039;s language] to *[https://childes.talkbank.org/ CHILDES - Child Language Data Exchange System] and move to Multilingual resources, Multilingual corpora&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;This page lists &#039;&#039;multilingual&#039;&#039; corpora. For &#039;&#039;monolingual&#039;&#039; corpora, see [[List of resources by language]].&lt;br /&gt;
&lt;br /&gt;
See also [[Multilingual resources]].&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
*[http://wt.jrc.it/lt/Acquis/ ACQUIS COMMUNAUTAIRE Multilingual Corpus]&lt;br /&gt;
*[http://www.kun.nl/celex CELEX - The Dutch Center for Lexical Information]&lt;br /&gt;
*[https://childes.talkbank.org/ CHILDES - Child Language Data Exchange System]&lt;br /&gt;
*[http://sli.uvigo.es/CLUVI/ CLUVI Corpus (Galician-English-Spanish-French parallel corpus)]&lt;br /&gt;
*[http://www.cdc.gov/ncidod/sars/languages.htm Centre for Disease Control - Chinese, French, Japanese, Spanish info on SARS]&lt;br /&gt;
*[http://www.linguateca.pt/COMPARA/ COMPARA corpus]&lt;br /&gt;
*[http://www.debian.org/international/ Debian free software community]&lt;br /&gt;
*[http://www.ling.lancs.ac.uk/corplang/emille EMILLE corpus]&lt;br /&gt;
*[http://www.statmt.org/europarl/ European Parliament Proceedings Parallel Corpus 1996-2003]&lt;br /&gt;
*[http://www.illc.uva.nl/EuroWordNet EuroWordNet]&lt;br /&gt;
*[http://glossa.fltr.ucl.ac.be/ GlossaNet]&lt;br /&gt;
*[http://ufal.mff.cuni.cz/hamledt HamleDT], harmonized dependency treebanks of many languages, common annotation style.&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/CatalogEntry.jsp?catalogId=LDC95T20 Hansard French-English parallel corpus]&lt;br /&gt;
*[http://www.tu-chemnitz.de/phil/InternetGrammar/ Learner Behaviour on the Internet]&lt;br /&gt;
*[http://corpora.informatik.uni-leipzig.de Leipzig Corpora Collection: Large monolingual raw corpora for 17+ languages, free downloads]&lt;br /&gt;
*[http://www.coli.uni-saarland.de/~gparis/LMD-TAZ_corpus/ Le Monde Diplomatique-Die Tageszeitung Translation Corpus] - French-German, aligned (parallel)&lt;br /&gt;
*[http://muchmore.dfki.de/resources1.htm MuchMore Springer Bilingual Corpus]&lt;br /&gt;
*[http://nl.ijs.si/ME/ MULTEXT-East: Multilingual Corpora for Eastern and Central European Languages]&lt;br /&gt;
*[http://tcc.itc.it/people/forner/multilingualcorpora.html Multilingual Corpora: Available Resources]&lt;br /&gt;
* [http://www.csse.monash.edu.au/~jwb/tanakacorpus.html Tanaka Corpus: Japanese-English sentence pairs]&lt;br /&gt;
*[http://multisemcor.itc.it MultiSemCor]&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/Newspapers.html Newspapers on the Internet]&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS - an open source parallel corpus]&lt;br /&gt;
*[http://langbank.engl.polyu.edu.hk/indexl.html PolyU Language Bank]&lt;br /&gt;
*[http://register.consilium.eu.int/ Public registry of the Council of the EU]&lt;br /&gt;
*[http://www.multilingual.com/allen51.htm The Bible as a Resource for Translation Software]&lt;br /&gt;
*[http://www.cogsci.ed.ac.uk/elsnet/eci.html The ECI Multilingual corpus]&lt;br /&gt;
*[http://www.fida.net/ Slovenian Corpus FIDA] and [http://www.fidaplus.net/ FIDA+]&lt;br /&gt;
*[http://www.ling.su.se/DaLi/research/smultron/index.htm SMULTRON Corpus] parallel treebank of English, German and Swedish&lt;br /&gt;
*[http://www.unhchr.ch/udhr/index.htm UN declaration of human rights in multiple languages]&lt;br /&gt;
*[http://conferences.unite.un.org/UNCorpus/ UN parallel corpora]&lt;br /&gt;
*[http://www.euromatrixplus.net/multi-un/ UN parallel corpora]&lt;br /&gt;
*[http://www-igm.univ-mlv.fr/~unitex/ UNITEX]&lt;br /&gt;
*[http://www.u-grenoble3.fr/kraif/liens.htm Useful links about parallel corpora, by Olivier Kraif]&lt;br /&gt;
*[http://wacky.sslmit.unibo.it/ WaCky Project]&lt;br /&gt;
*[http://www.wortschatz.uni-leipzig.de/html/wliste.html Wortlisten: spoken German, English, French, and Dutch]&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Multilingual]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12639</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12639"/>
		<updated>2019-09-03T01:15:47Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Change *[http://childes.psy.cmu.edu/ The Childes Corpus - Children&amp;#039;s language] to *[https://childes.talkbank.org/ Child Language Data Exchange System] and move to Multilingual resources, Multilingual corpora&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/survey.html A Survey of Open Language Archives] &lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Corpora_for_English&amp;diff=12638</id>
		<title>Corpora for English</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Corpora_for_English&amp;diff=12638"/>
		<updated>2019-09-03T00:58:05Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://www.grsampson.net/RSue.html SUSANNE Analytic Scheme] from Uncategorized resource to Resources for English, Corpora for English, Free and Downloadable&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;For languages other than English, see [[List of resources by language]].&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
&lt;br /&gt;
===Free and Downloadable===&lt;br /&gt;
*[http://americannationalcorpus.org/ American National Corpus (ANC)]&lt;br /&gt;
*[http://www.cs.cornell.edu/home/llee/data/convote.html Congressional floor-debate transcripts, with support/oppose labels]&lt;br /&gt;
*[http://www-rcf.usc.edu/~billmann/diversity/DDivers-site.htm Dialogue Diversity Corpus]&lt;br /&gt;
*[http://www-2.cs.cmu.edu/afs/cs.cmu.edu/project/theo-11/www/naive-bayes/bow-0.8/stopwords.c English stop words (from SMART)]&lt;br /&gt;
*[http://gmb.let.rug.nl Groningen Meaning Bank] semantically annotated corpus&lt;br /&gt;
*[https://corpling.uis.georgetown.edu/gum/ GUM - Georgetown University Multilayer corpus], multiple parses, coreference, entities, sentence types and RST&lt;br /&gt;
*[https://www.gutenberg.org Project Gutenberg]&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ice/avail.htm International Corpus of English]&lt;br /&gt;
*[http://ufal.mff.cuni.cz/hamledt HamleDT], harmonized dependency treebanks of many languages, common annotation style.&lt;br /&gt;
*[http://prize.hutter1.net/ Hutter Prize for Lossless Compression of Human Knowledge 100M sample of Wikipedia]&lt;br /&gt;
*[http://www.cs.fit.edu/~mmahoney/compression/text.html Large Text Compression Benchmark&#039;s 1G sample of Wikipedia]&lt;br /&gt;
*[http://www.cs.cornell.edu/People/pabo/movie-review-data/ Movie Review Data]&lt;br /&gt;
*[http://mwe.stanford.edu/resources/ Multiword Expression Resources]&lt;br /&gt;
*[http://www-2.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/corpora/susanne/0.html Susanne: Annotated American English Corpus]&lt;br /&gt;
*[http://www.grsampson.net/RSue.html SUSANNE Analytic Scheme]&lt;br /&gt;
*[http://www-users.york.ac.uk/~sp20/corpus.html The Brooklyn-Geneva-Amsterdam-Helsinki Parsed Corpus of Old English]&lt;br /&gt;
*[http://www.grsampson.net/LucyDoc.html The LUCY Corpus - Documentation]&lt;br /&gt;
*[http://www.cs.rochester.edu/research/cisd/resources/trains.html TRAINS Dialogue Corpus]&lt;br /&gt;
*[http://ebiquity.umbc.edu/resource/html/id/351 UMBC Webbase Corpus]&lt;br /&gt;
*[http://www.euromatrixplus.net/multi-un/ UN parallel corpora]&lt;br /&gt;
*[http://www.let.rug.nl/~bos/vpe/ VP Ellipsis corpus]&lt;br /&gt;
* [http://www.statmt.org/wmt15/translation-task.html#download WMT corpora], including [http://en.wikipedia.org/wiki/Europarl_corpus Europarl], News Commentary, and News Crawl&lt;br /&gt;
&lt;br /&gt;
===Proprietary or Require Prior Permission===&lt;br /&gt;
*[http://ucts.uniba.sk/aranea_about/ Araneum Anglicum], Gigaword English web corpus&lt;br /&gt;
*[http://ucts.uniba.sk/aranea_about/ Araneum Anglicum Asiaticum], Gigaword Asian English web corpus&lt;br /&gt;
*[http://www.natcorp.ox.ac.uk/ British National Corpus (BNC)]&lt;br /&gt;
*[http://boston.lti.cs.cmu.edu/Data/clueweb09/ ClueWeb]&lt;br /&gt;
*[http://www.athel.com/cpsa.html Corpus of Spoken Professional English]&lt;br /&gt;
*[http://www.phon.ox.ac.uk/~esther/ivyweb/ English Intonation in the British Isles -The IViE Corpus]&lt;br /&gt;
*[http://www-personal.umich.edu/~jlawler/levin.html English Verb Classes And Alternations: A Preliminary Investigation (Index)]&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/test_collections/gov2-summary.htm GOV2 Corpus] - 426 gigabytes of text&lt;br /&gt;
*[http://mpqa.cs.pitt.edu Multi-Perspective Question Answering (MPQA)]&lt;br /&gt;
*[http://www.askoxford.com/oec/mainpage/?view=uk Oxford English Corpus]&lt;br /&gt;
*[http://www.sketchengine.co.uk/ Sketch Engine]&lt;br /&gt;
*[http://wacky.sslmit.unibo.it/ WaCky]&lt;br /&gt;
*[http://www.webcorp.org.uk/guide/ WebCorp]&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&amp;lt;!-- Dead links&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/time/ 1963 Time Magazine corpus]&lt;br /&gt;
*[http://www.elda.fr/catalogue/en/speech/S0115.html American English SpeechDat-Car]&lt;br /&gt;
*[http://compbio.uchsc.edu/ccp/corpora/index.shtml Biomedical corpora]&lt;br /&gt;
*[http://homepage.mac.com/bncweb/ BNCweb a web-based interface to the British National Corpus]&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/computing/research/ucrel/bnc.html British National Corpus project page (from UCREL)]&lt;br /&gt;
*[http://clwww.essex.ac.uk/w3c/corpus_ling/content/corpora/list/private/brown/brown.html Brown Corpus]&lt;br /&gt;
*[http://computing.open.ac.uk/coda/data.html CODA Parallel Annotated Monologue-Dialogue Corpus]&lt;br /&gt;
*[http://www.collins.co.uk/books.aspx?group=154 Collins Wordbanks]&lt;br /&gt;
*[http://etext.lib.virginia.edu/ Electronic Text Center -- University of Virginia]&lt;br /&gt;
*[http://usna.edu/LangStudy/BNC/ Exploring Words and Phrases from the British National Corpus]&lt;br /&gt;
*[http://nora.hd.uib.no/icame.html ICAME]&lt;br /&gt;
*[http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
*[http://homepages.feis.herts.ac.uk/~comrcml/Lyon-thesis.ps Restricted English Corpus from Dr. Caroline Lyon for PhD]&lt;br /&gt;
*[http://clix.to/davidlee00 The BNC Index (for the BNCWorld Edition)]&lt;br /&gt;
--&amp;gt;&lt;br /&gt;
&lt;br /&gt;
==Link collections==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.dcs.gla.ac.uk/idom/ir_resources/ Collections of texts and corpora]&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
*[http://www.sultry.arts.usyd.edu.au/links/statnlp.html Annotated list of resources on statistical NLP and corpus-based CL]&lt;br /&gt;
&lt;br /&gt;
==Corpora tools==&lt;br /&gt;
&amp;lt;!-- Please keep this list in alphabetical order --&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://corpus-tools.org/annis/ ANNIS] - open source search tool for complex multilayer corpora&lt;br /&gt;
*[http://www.dcs.gla.ac.uk/idom/ir_resources/linguistic_utils/stop_words List of stop words]&lt;br /&gt;
*[http://korpus.pl/index.php?page=poliqarp Poliqarp] - open source XML-aware indexer, search engine and concordancer&lt;br /&gt;
*[http://www.sketchengine.co.uk/ The Sketch Engine]&lt;br /&gt;
*[http://www.cis.upenn.edu/~treebank/tokenization.html Treebank tokenization scheme]&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
[[Category:Corpora|*]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12637</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12637"/>
		<updated>2019-09-03T00:56:27Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move *[http://www.grsampson.net/RSue.html SUSANNE Analytic Scheme] from Uncategorized resource to Resources for English, Corpora for English, Free and Downloadable&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/survey.html A Survey of Open Language Archives] &lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramon Piero Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://childes.psy.cmu.edu/ The Childes Corpus - Children&#039;s language]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Chinese&amp;diff=12636</id>
		<title>Resources for Chinese</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Resources_for_Chinese&amp;diff=12636"/>
		<updated>2019-09-03T00:42:40Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move * [http://pears.lib.ohio-state.edu/China/linguist.html Chinese Linguistics] (broken link) from Uncategorized resource to Resources for Chinese&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;==Tools==&lt;br /&gt;
===Free software===&lt;br /&gt;
* [https://github.com/yzhang/rseg rseg] word segmentation; written in ruby (no compilation, no hard dependencies apart from ruby), comes with a model (MIT license)&lt;br /&gt;
* [https://code.google.com/p/ctbparser/ ctbparser] word segmentation, POS tagging, NER, dependency parsing, all using Conditional Random Fields; written in C++ (LGPL license)&lt;br /&gt;
* [http://www.cl.cam.ac.uk/~yz360/zpar.html ZPar] word segmentation, POS tagging, CFG/dep/CCG parsing of Chinese and English; written in C++ (GPL3 license)&lt;br /&gt;
* [http://code.google.com/p/duduplus/ DuDuPlus: a graph-based dependency parser for English and Chinese] (&amp;quot;Other Open Source&amp;quot; license?)&lt;br /&gt;
** where is the source code?&lt;br /&gt;
&lt;br /&gt;
==Corpora==&lt;br /&gt;
===Free license===&lt;br /&gt;
* [http://corpora.heliohost.org/ HC Corpora] 1606811 lines of [http://en.wikipedia.org/wiki/Fair_use Fair Use] excerpts from news, blogs, twitter&lt;br /&gt;
* [http://www.euromatrixplus.net/multi-un/ UN parallel corpora]&lt;br /&gt;
&lt;br /&gt;
===Nonfree or Unknown license===&lt;br /&gt;
* [http://ucts.uniba.sk/aranea_about/ Araneum Sinicum], Gigaword Chinese web corpus&lt;br /&gt;
* [http://www.chinesecomputing.com Chinese Computing] &lt;br /&gt;
* [http://www.icl.pku.edu.cn/icl_groups/corpus/dwldform1.asp Word Segmented and POS tagged People Daily Corpus at ICL of Peking University]&lt;br /&gt;
* [http://corpus.leeds.ac.uk/frqc/i-zh-char.num.html Frequency list of characters in the Internet corpus]&lt;br /&gt;
* [http://corpus.leeds.ac.uk/frqc/internet-zh.num Frequency list of lexical items in the Internet corpus]&lt;br /&gt;
* [http://www.ling.lancs.ac.uk/corplang/lcmc/ Lancaster Corpus of Mandarin Chinese]&lt;br /&gt;
* [http://corpus.leeds.ac.uk/query-zh.html A collection of Chinese corpora and frequency lists]  Online query with three corpora&lt;br /&gt;
* [http://pears.lib.ohio-state.edu/China/linguist.html Chinese Linguistics]&lt;br /&gt;
&lt;br /&gt;
[[Category:Resources by language|Chinese]]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
	<entry>
		<id>https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12635</id>
		<title>Uncategorized resources</title>
		<link rel="alternate" type="text/html" href="https://www.aclweb.org/aclwiki/index.php?title=Uncategorized_resources&amp;diff=12635"/>
		<updated>2019-09-03T00:42:14Z</updated>

		<summary type="html">&lt;p&gt;Sean Bethard: Move * [http://pears.lib.ohio-state.edu/China/linguist.html Chinese Linguistics] (broken link) from Uncategorized resource to Resources for Chinese&lt;/p&gt;
&lt;hr /&gt;
&lt;div&gt;&amp;lt;div class=&amp;quot;usermessage&amp;quot;&amp;gt;&lt;br /&gt;
* Please &#039;&#039;do not add anything new to this list&#039;&#039;; we would like to eventually eliminate this list.&lt;br /&gt;
* Please add new items to the [[List of resources by language]].&lt;br /&gt;
* Please help us move items below into the [[List of resources by language]].&lt;br /&gt;
&amp;lt;/div&amp;gt;&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/survey.html A Survey of Open Language Archives] &lt;br /&gt;
&lt;br /&gt;
*[http://www.siggen.org/resources/ ACL SIGGEN Resources Wiki] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.kun.nl/agfl/ AGFL Parser Generator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~vannoord/alp/ Algorithms for Linguistic Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.a-i.com/ Artificial Intelligence NV (Ai)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eprints.org/ Author/Institution Self-Archiving] &lt;br /&gt;
&lt;br /&gt;
*[http://www.copernic.com/ COPERNIC 2000] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~dbikel/#stat-parser Dan Bikel&#039;s Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://java.sun.com/docs/books/tutorial/i18n/text/boundaryintro.html Detecting Text Boundaries] &lt;br /&gt;
&lt;br /&gt;
*[http://www.catchword.com/era Educational Research Abstracts] &lt;br /&gt;
&lt;br /&gt;
*[http://emotion-research.net/wiki/Databases Emotional Databases] &lt;br /&gt;
&lt;br /&gt;
*[http://lingo.stanford.edu/erg.html English Resource Grammar] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cjk.org/cjk/samples/chincomc.htm English-Chinese Chinese-English Dictionary of Computer Terms] &lt;br /&gt;
&lt;br /&gt;
*[http://www.freelangonline.com/ Freelangonline - many on-line dictionaries + more] &lt;br /&gt;
&lt;br /&gt;
*[http://dmoz.org/Computers/Software/Information_Retrieval/ Information Retrieval] &lt;br /&gt;
&lt;br /&gt;
*[http://ir.dcs.gla.ac.uk/resources.html IR resources] &lt;br /&gt;
&lt;br /&gt;
*[http://odin.prohosting.com/hkkim/cgi-bin/kaeps/ Korean Accented English Pronunciation Simulator] &lt;br /&gt;
&lt;br /&gt;
*[http://www.kwicfinder.com/KWiCFinder.html KwicFinder Web Concordancer and Online Research Tool] &lt;br /&gt;
&lt;br /&gt;
*[http://www.academiaisla.com/acadi/gen/0_en.html LANGUAGE LINKS] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/lexfn/ Lexical FreeNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www-lfg.stanford.edu/lfg/ilfga LFG Database: List of Names] &lt;br /&gt;
&lt;br /&gt;
*[http://lse.umiacs.umd.edu/ Linguist&#039;s Search Engine] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TIGER/ Linguistic Interpretation of a German Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://www.link.cs.cmu.edu/ LINK GRAMMAR PARSER] &lt;br /&gt;
&lt;br /&gt;
*[http://www.eturner.net/linkgrammar-wn/ LinkGrammar-WN project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.psy.uwa.edu.au/MRCDataBase/uwa_mrc.htm MRC Psycholinguistic Database] &lt;br /&gt;
&lt;br /&gt;
*[http://nl.ijs.si/ME/V3/ Multext East Resources, Version 3] &lt;br /&gt;
&lt;br /&gt;
*[http://multiwordnet.itc.it/english/home.php MultiWordNet] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.nus.edu.sg/~rpnlpir/ Natural Language Processing / Information Retrieval Software Repository] &lt;br /&gt;
&lt;br /&gt;
*[http://nlsh.sourceforge.net/ NLSH: Natural Language Shell] &lt;br /&gt;
&lt;br /&gt;
*[http://www.irisa.fr/Omphalos/ Omphalos Context-Free Language Learning Competition] &lt;br /&gt;
&lt;br /&gt;
*[http://ysomeya.hp.infoseek.co.jp/ Online Business Letter Corpus KWIC Concordancer] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RLeafAnc.html Parse Evaluation] &lt;br /&gt;
&lt;br /&gt;
*[http://pie.usna.edu Phrases in English and the British National Corpus] &lt;br /&gt;
&lt;br /&gt;
*[http://pygoogle.sourceforge.net/ PyGoogle: A Python Interface to the Google API] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ai.uga.edu/mc/PythonForNewbieLinguists.html Python Programming Tutorial] &lt;br /&gt;
&lt;br /&gt;
*[http://corpus.leeds.ac.uk/internet.html Query to Internet Corpora] &lt;br /&gt;
&lt;br /&gt;
*[http://www.lexmasterclass.com/exercises/regex/index.html Regular Expression Exercises] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sims.berkeley.edu/~hjiang1/eng_chi_resources.html Resources for English-Chinese CLIR] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.technion.ac.il/~gabr/resources/resources.html Resources for Text, Speech and Language Processing] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sfu.ca/rst/ Rhetorical Structure Theory (RST)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensSemRoles.html Senseval-3 Task: Automatic Labeling of Semantic Roles] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clres.com/SensWNDisamb.html Senseval-3 Task: Word-Sense Disambiguation of WordNet Glosses] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.unt.edu/~rada/wa/ Sentence Alignment and Word Alignment: Projects, Papers, Evaluation, Etc.] &lt;br /&gt;
&lt;br /&gt;
*[http://ontoweb-lt.dfki.de/knowledge_index.htm SIG5 OntoWeb] &lt;br /&gt;
&lt;br /&gt;
*[http://sara.natcorp.ox.ac.uk/lookup.html Simple Search of BNC-World] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sigsem.org/ Special Interest Group on Computational Semantics] &lt;br /&gt;
&lt;br /&gt;
*[http://www.grsampson.net/RSue.html SUSANNE Analytic Scheme] &lt;br /&gt;
&lt;br /&gt;
*[http://www.telemakus.net/ Telemakus: Mining and Mapping Research Findings to Promote Knowledge Discovery] &lt;br /&gt;
&lt;br /&gt;
*[http://www.clef-campaign.org/ The Cross-Language Evaluation Forum] &lt;br /&gt;
&lt;br /&gt;
*[http://www.robotwisdom.com/web/biography.html The Internet Timelines Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.fb10.uni-bremen.de/anglistik/langpro/NLG-table/NLG-table-root.htm The John Bateman and Michael Zock&#039;s list of Natural Language Generation Systems] &lt;br /&gt;
&lt;br /&gt;
*[http://www.RosettaProject.org/ The Rosetta Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~xtag The XTAG Project] &lt;br /&gt;
&lt;br /&gt;
*[http://www.TSrali.com/ TransSearch] &lt;br /&gt;
&lt;br /&gt;
*[http://www-nlpir.nist.gov/projects/trecvid/ TREC Video Retrieval Evaluation Page] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html TreeTagger - a language independent part-of-speech tagger] &lt;br /&gt;
&lt;br /&gt;
*[http://www.biomedcentral.com/info/about/datamining= Using BioMed Central&#039;s Open Access Full Text Corpus for Data Mining Research] &lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu/ VIEW: Variation in English Words and Phrases] &lt;br /&gt;
&lt;br /&gt;
*[http://beta.visl.sdu.dk VISL Tagger and Parser] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webir.org/ Web IR &amp;amp; IE] &lt;br /&gt;
&lt;br /&gt;
*[http://elib.cs.berkeley.edu/docfreq/ Web Term Document Frequency Form (Berkeley)] &lt;br /&gt;
&lt;br /&gt;
*[http://www.niederlandistik.fu-berlin.de/cgi-bin/web-conc.cgi WEB-CONC] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webcorp.org.uk/ WEBCORP] &lt;br /&gt;
&lt;br /&gt;
*[http://www.webexp.info/ WebExp2 Experimental Software] &lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.lancs.ac.uk/ucrel/bncfreq/ Word Frequencies in Written and Spoken English (Based on the British National Corpus)] &lt;br /&gt;
&lt;br /&gt;
*[http://tcc.itc.it/research/textec/topics/disambiguation/wordnetdomains.html WordNet Domains] &lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/exploration/expl2000/papers/ Workshop on Web-Based Language Documentation and Description Papers] &lt;br /&gt;
&lt;br /&gt;
*[http://www.gmi.org/wlms/ World Language Mapping System]&lt;br /&gt;
&lt;br /&gt;
*[http://www.comp.leeds.ac.uk/eric/iwcs.ps A Domain-Independent Semantic Tagger for the Study of Meaning Associations in English Text]&lt;br /&gt;
&lt;br /&gt;
*[http://www3.interscience.wiley.com/cgi-bin/abstract/104525215/ABSTRACT Automatic Construction of English/Chinese Parallel Corpora]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.icsi.berkeley.edu/pub/techreports/ Berkeley - Technical Reports]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/publications/lrec2004/bootcat_lrec_2004.pdf BootCaT: Bootstrapping Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://acl.ldc.upenn.edu/I/I05/I05-2015.pdf Building an Annotated Japanese-Chinese Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/diachronic/index.htm DCPSE: Creating a Parsed and Searchable Diachronic Corpus of  Present-Day Spoken English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/info/EPapers.html Electronically available papers (list at Univ. of Stuttgart)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cis.upenn.edu/~cliff-group/94/reports.html Linc Lab (U. Penn) technical reports (not on-line)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.let.rug.nl/~tanja/ Linguistic Knowledge and Word Sense Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://ir.shef.ac.uk/cloughie/papers.html Measuring Text Reuse]&lt;br /&gt;
&lt;br /&gt;
*[http://www.linguistics.rub.de/~kiss/publications/publications.html#boundaries Paper on Sentence Boundary Disambiguation]&lt;br /&gt;
&lt;br /&gt;
*[http://www.dfki.de/lt/papers/cl-abstracts.html Papers of the DFKI CL Department]&lt;br /&gt;
&lt;br /&gt;
*[http://www1.cs.columbia.edu/nlp/theses.html PhD Theses (Columbia Natural Language Processing Group)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.itri.brighton.ac.uk/ucnlg/Proceedings/index.html Proceedings of the Corpus Linguistics 2005 Workshop on Using Corpora for Natural Language Generation]&lt;br /&gt;
&lt;br /&gt;
*[http://sslmit.unibo.it/~baroni/bootcat.html BootCaT Toolkit: Simple Utilities to Bootstrap Corpora and Terms from the Web]&lt;br /&gt;
&lt;br /&gt;
*[http://chasen.aist-nara.ac.jp/hiki/ChaSen/ ChaSen]&lt;br /&gt;
&lt;br /&gt;
*[http://nlp.cs.jhu.edu/~gsm/pd_demo Dendrogram Demo]&lt;br /&gt;
&lt;br /&gt;
*[http://www.olst.umontreal.ca/dicoeng.html DiCo Lexical Database OLST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.wolfson.ox.ac.uk/~peet/eatshow.htm Edinburgh Associative Thesaurus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.smi.ucd.ie/hyppia/ HYPPIA]&lt;br /&gt;
&lt;br /&gt;
*[http://xlex.uni-muenster.de/ M&amp;amp;uuml;nster Tagging Project]&lt;br /&gt;
&lt;br /&gt;
*[http://nltk.sourceforge.net Natural Language Toolkit (NLTK)]&lt;br /&gt;
&lt;br /&gt;
*[http://perso.wanadoo.fr/rosavram/ NooJ]&lt;br /&gt;
&lt;br /&gt;
*[http://www.informatics.susx.ac.uk/research/nlp/rasp/ Robust Accurate Statistical Parsing (RASP)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.searchtools.com/ Search Tools for Web Sites and Intranets]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lsi.upc.edu/~surdeanu/swirl.html SwiRL Semantic Role Labeler]&lt;br /&gt;
&lt;br /&gt;
*[http://view.byu.edu VIEW (Variation in English Words and Phrases)]&lt;br /&gt;
&lt;br /&gt;
*[http://www40.brinkster.com/dictionarium/index.html dictionarium]&lt;br /&gt;
&lt;br /&gt;
*[http://www.mat.upm.es/~aries ARIES Natural Language Tools]&lt;br /&gt;
&lt;br /&gt;
*[http://www.york.ac.uk/services/library/subjects/langint.htm Language and Linguistic Science information sources] &lt;br /&gt;
&lt;br /&gt;
*[http://www.de.elra.research.ec.org/ The RELATOR language resources server]&lt;br /&gt;
&lt;br /&gt;
*[ftp://parcftp.xerox.com/pub/ Xerox PARC FTP site.]&lt;br /&gt;
&lt;br /&gt;
*[http://actarus.atilf.fr/morphalou/ Lexique Morphalou] &lt;br /&gt;
&lt;br /&gt;
*[http://orleans.lti.cs.cmu.edu/Reap/ REAP Project: Reader-Specific Lexical Practice for Improved Reading Comprehension] &lt;br /&gt;
&lt;br /&gt;
*[http://people.cs.uchicago.edu/~dinoj/icsi97syl.disc.gz Syllable-Level Conversational English Transcriptions] &lt;br /&gt;
&lt;br /&gt;
*[http://www.sil.org/mexico/pub/vimsa.htm The Mariano Silva y Aceves Series] &lt;br /&gt;
&lt;br /&gt;
*[http://www.unine.ch/info/clef/ UniNE stopword list for Portuguese] &lt;br /&gt;
&lt;br /&gt;
*[http://www.valencianlanguage.com/ Valencianlanguage.com]&lt;br /&gt;
&lt;br /&gt;
* [http://www.answerbus.com AnswerBus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.axontologic.com Axontologic]&lt;br /&gt;
&lt;br /&gt;
* [http://www.bionlp.org Natural language processing of biology text]&lt;br /&gt;
&lt;br /&gt;
* [http://textalyser.net Text analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.20000-names.com/ 20000 names from around the world]&lt;br /&gt;
&lt;br /&gt;
* [http://www.facstaff.bucknell.edu/rbeard/diction.html A web of online dictionaries]&lt;br /&gt;
&lt;br /&gt;
* [http://abu.cnam.fr/ ABU : la Bibliothèque Universelle]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/tagsets/tagmenu.html AMALGAM English PoS tagsets]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-tagged.html AMALGAM Multi-Tagged Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/multi-parsed.html AMALGAM Multi-Treebank]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/amalgam/amalgam/amalgtag3.html AMALGAM email Part-of-Speech tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/arcade/ ARCADE: Evaluation of text alignment tools]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aspseek.org/ ASPSEEK search engine]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ucc.ie/info/net/acronyms/acro.html Acronym Server]&lt;br /&gt;
&lt;br /&gt;
* [http://tcc.itc.it/people/lavelli/ Alberto Lavelli, ITC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.wtsn.binghamton.edu/ANS/ American Name Society]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mat.upm.es/~aries/description.html Aries natural language tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/~ask-ling Ask a Linguist]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webspawner.com/users/samplex/ Build a program immediately from data processing examples: NLP]&lt;br /&gt;
&lt;br /&gt;
* [http://www.link.cs.cmu.edu/link/submit-sentence-4.html CMU Sentence Parser]&lt;br /&gt;
&lt;br /&gt;
* [http://corpora.ids-mannheim.de/~cosmas COSMAS - Corpus Storage, Maintenance and Access System]&lt;br /&gt;
&lt;br /&gt;
* [http://www.uni-paderborn.de/fachbereich/AG/agmadh/WWW/english/scripts.html Collection of Lecture Notes, Surveys, and Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://searchenginewatch.internet.com/facts/searches.html Corpora of user queries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.vassar.edu/CES/ Corpus Encoding Standard]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ Corpus Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://www.robotwisdom.com/ai/cycresources.html Cyc resources]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ict.usc.edu/~traum David Traum, USC]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elcom.de/ ELCOM - Tuersprechanlagen, Produzent fuer Tuersprechanlagen... Hauskommunikation fuer Ihre Sicherheit.]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.leeds.ac.uk/eric/ Eric Atwell, University of Leeds]&lt;br /&gt;
&lt;br /&gt;
* [http://www.pg.gda.pl/~jandac/fsa.html Finite-State Utilities for morphological analysis (known and unknown words), spelling correction, perfect hashing, diacritics restoration]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xrce.xerox.com/cgi-bin/mltt/nodict-fsc-teach-int French conjugation test]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.utk.edu/~cs460.is&amp;amp;r/glossary.html Glossary for the Book Information Storage and Retrieval by R. Korfhage]&lt;br /&gt;
&lt;br /&gt;
* [http://www.kinet-tv.ne.jp/~sat/data/publications/2001/c36.html Hatayama parser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.ust.hk Human Language Technology Center, UST, Hong Kong]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ihear.com/ IHear]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ribbitsoft.com/ist/ist.html Information Search and Transformation Technologies]&lt;br /&gt;
&lt;br /&gt;
* [http://www.illc.uva.nl/~christof Institute for Logic, Language and Computation (ILLC) - University of Amsterdam]&lt;br /&gt;
&lt;br /&gt;
* [http://www.germanistik.fu-berlin.de/il/ Integrational Linguistics]&lt;br /&gt;
&lt;br /&gt;
* [http://www.xs4all.nl/~bsarempt/linguistics/index.html Kura]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lrec-conf.org/lrec2004/doc/ws/CPSLC.pdf LREC 2004 Workshop: Compiling and processing spoken language corpora]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/computing/research/ucrel/claws/trial.html Lancaster CLAWS PoS tagger]&lt;br /&gt;
&lt;br /&gt;
* [http://www.asel.udel.edu/natlang/nlp/lrd.html Language Representation Database]&lt;br /&gt;
&lt;br /&gt;
* [http://lsa.colorado.edu/content.html Latent Semantic Analysis]&lt;br /&gt;
&lt;br /&gt;
* [http://www.blackwellpublishers.co.uk/labs Linguistics Abstracts]&lt;br /&gt;
&lt;br /&gt;
* [http://www.phil.uni-passau.de/linguistik/linguistik_urls/ Linguistics Links Database, University of Passau]&lt;br /&gt;
&lt;br /&gt;
* [http://www.surrey.ac.uk/ELI/thesis.html MA dissertations at Univ. of Surrey, English Language Institute]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ai.mit.edu/projects/infolab MIT AI Lab NLP Demos]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cmu.edu/~aberger/maxent.html MaxEnt and Exponential Models, Tutorials by Adam Berger, CMU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.scn.org/~mentifex/ Mentifex AI]&lt;br /&gt;
&lt;br /&gt;
* [http://meilleursprenoms.com/ Most frequent French names]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cee.hw.ac.uk/~alison/nl/details.html Natural Language Processing Course]&lt;br /&gt;
&lt;br /&gt;
* [http://nlpers.blogspot.com/ Natural Language Processing Research Blog]&lt;br /&gt;
&lt;br /&gt;
* [http://www.elsnet.org/publications/survey/ Natural Language Processing in Eastern Europe]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.dal.ca/~vlado/csci6509/ Natural Language Processing, CSCI6509 (Dalhousie University)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.canoo.net/ Ontology-Based Modelling in the Humanities]&lt;br /&gt;
&lt;br /&gt;
* [http://nlp.postech.ac.kr/ Part of Speech Tagger for Korean]&lt;br /&gt;
&lt;br /&gt;
* [http://sunsite.unc.edu/patents/intropat.html Patent Information (includes patents in IR, Acoustics...)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cis.upenn.edu/~treebank/home.html Penn Treebank Corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://pie.usna.edu/ Phrases in English]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.monash.edu.au/cgi-bin/postmodern Postmodernist Journal Paper Generator]&lt;br /&gt;
&lt;br /&gt;
* [http://acl.ldc.upenn.edu/W/W05/ Proceedings of ENLG-05]&lt;br /&gt;
&lt;br /&gt;
* [http://www.aus.xanadu.com/ Project Xanadu]&lt;br /&gt;
&lt;br /&gt;
* [http://www.riexinger.com/ RIEXINGER Tuerenwerke]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ualberta.ca/~dmiall/reading/index.htm Reader Response: Empirical Studies of Literary Reading]&lt;br /&gt;
&lt;br /&gt;
* [http://www.iol.ie/~mazzoldi/lang/index.html Resources for translators]&lt;br /&gt;
&lt;br /&gt;
* [http://www.lpl.univ-aix.fr/projects/romanseval/ Romanseval : Word sense disambiguation for Romance languages]&lt;br /&gt;
&lt;br /&gt;
* [http://www.dfki.de/lt/diss/ Saarbruecken Dissertations in Computational Linguistics and Language Technology]&lt;br /&gt;
&lt;br /&gt;
* [http://www.ccs.neu.edu/home/futrelle/bionlp/search.html Search Bionlp.org]&lt;br /&gt;
&lt;br /&gt;
* [http://www.itri.brighton.ac.uk/events/senseval/ Senseval 2 : Evaluating Word Sense Disambiguation Systems]&lt;br /&gt;
&lt;br /&gt;
* [http://www.startext.co.uk/ Startext: small, private language &amp;amp; document engineering practice]&lt;br /&gt;
&lt;br /&gt;
* [http://www.cs.cornell.edu/courses/cs775/2001sp/default.html Statistical Natural Language Processing: Models and Methods (Cornell U. COMS 775)]&lt;br /&gt;
&lt;br /&gt;
* [http://www.w3.org/TR/2001/WD-ngram-spec-20010103/ Stochastic Language Models (N-Gram) Specification W3C Working Draft (January 3, 2001)]&lt;br /&gt;
&lt;br /&gt;
* [http://crl.nmsu.edu/summerschool Summer School at NMSU]&lt;br /&gt;
&lt;br /&gt;
* [http://www.let.rug.nl/~vannoord/TextCat/Demo/ TextCat Language Guesser]&lt;br /&gt;
&lt;br /&gt;
* [http://www.mitre.org/technology/alembic-workbench/ The Alembic Workbench]&lt;br /&gt;
&lt;br /&gt;
* [http://egnatia.ee.auth.gr/~yhat/yiannis The LexiGraf web page]&lt;br /&gt;
&lt;br /&gt;
* [http://linguistlist.org/ The Linguist List]&lt;br /&gt;
&lt;br /&gt;
* [http://www.sil.org/computing/shoebox/ The Linguist&#039;s Shoebox]&lt;br /&gt;
&lt;br /&gt;
* [http://www.logos.it/magazine/ The Magazine for the Language Industries]&lt;br /&gt;
&lt;br /&gt;
* [http://www.coli.uni-sb.de/sfb378/negra-corpus/negra-corpus.html The Negra Corpus - German Syntax annotated]&lt;br /&gt;
&lt;br /&gt;
* [http://www.csun.edu/~vcoao0el/de361/de361s53_folder/english.html The Trouble with English Spelling]&lt;br /&gt;
&lt;br /&gt;
* [http://www.webcorp.org.uk/ The WebCorp project]&lt;br /&gt;
&lt;br /&gt;
* [http://timexportal.info TimexPortal - Temporal Expression Recognition and Normalisation]&lt;br /&gt;
&lt;br /&gt;
* [http://www.comp.lancs.ac.uk/ucrel/tech_papers.html UCREL Technical Papers]&lt;br /&gt;
&lt;br /&gt;
* [http://www.czyborra.com/unifont/ Unifont, the Unicode font]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/ Web based language analysis, keyword searching of Project Gutenberg texts]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/wordfind.pl Word Finder - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://rreck.sealsoft.com/cgi-bin/apps/wordfind/freqgen.pl Word Frequency Analyzer - uses Project Gutenberg corpus]&lt;br /&gt;
&lt;br /&gt;
* [http://wndomains.itc.it/ Word Sense Disambiguation and Categorization at IRST]&lt;br /&gt;
&lt;br /&gt;
* [http://www.liv.ac.uk/~ms2928/wordsmith/index.htm WordSmith Tools]&lt;br /&gt;
&lt;br /&gt;
* [http://linkage.rockefeller.edu/wli/zipf/ Zipf&#039;s Law]&lt;br /&gt;
&lt;br /&gt;
* [http://www.entmp.org/linguistics/phonGIF/ phonGIF - bitmapped IPA characters (based on the wsuipa METAFONT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html 2000 NIST Speaker Recognition Evaluation Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://ixa.si.ehu.es/Ixa/resources/sensecorpus A Web Corpus and Topic Signatures for All WordNet 1.6 Nominal Senses (v 1.0)]&lt;br /&gt;
&lt;br /&gt;
*[http://odur.let.rug.nl/~vannoord/trees/ Alpino Treebank]&lt;br /&gt;
&lt;br /&gt;
*[http://www.aot.ru/search1.html AOT]&lt;br /&gt;
&lt;br /&gt;
*[http://pioneer.chula.ac.th/~awirote/ling/corpuslst.htm Corpus Resources (Chulalongkorn University, Thailand)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/cran/ Cranfield collection]&lt;br /&gt;
&lt;br /&gt;
*[http://corpus.rae.es/creanet.html CREA]&lt;br /&gt;
&lt;br /&gt;
*[http://www.eat.rl.ac.uk/ Edinburgh Associative Thesaurus (EAT)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hum.uva.nl/~ewn EuroWordNet]&lt;br /&gt;
&lt;br /&gt;
*[http://rali.iro.umontreal.ca/ Hansards Corpus - Searchable]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hcrc.ed.ac.uk/maptask/ HCRC Map Task Corpus XML annotations]&lt;br /&gt;
&lt;br /&gt;
*[http://nats-www.informatik.uni-hamburg.de/~ingo/icopost/ ICOPOST]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/TC.html IMS Corpus Toolbox, Univ. of Stuttgart]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ims.uni-stuttgart.de/projekte/CorpusWorkbench/ IMS Corpus Workbench (CWB)]&lt;br /&gt;
&lt;br /&gt;
*[http://cecl.fltr.ucl.ac.be/Cecl-Projects/Icle/icle.htm International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ipds.uni-kiel.de/links/datenmaterial.en.html Kiel University&#039;s Institute on Phonetics and Speech Processing]&lt;br /&gt;
&lt;br /&gt;
*[http://www.nilc.icmc.usp.br/lacioweb Lacio Web Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.vuw.ac.nz/llc/ LANGUAGE LEARNING CENTER - ACADEMIC CORPUS]&lt;br /&gt;
&lt;br /&gt;
*[http://www.bmanuel.org/clr2_mp.html Manuel Barbera: General Corpora and Corpus Linguistics Resources]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.cs.cornell.edu/pub/smart/med/ Medlars collection]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.ox.ac.uk/pub/wordlists/ Miscellaneous Word Lists from Oxford University]&lt;br /&gt;
&lt;br /&gt;
*[http://www.lpl.univ-aix.fr/projects/multext/ Multilingual Text Tools and Corpora]&lt;br /&gt;
&lt;br /&gt;
*[http://www.census.gov/genealogy/names Name lists from US census]&lt;br /&gt;
&lt;br /&gt;
*[http://www.di.fc.ul.pt/~ahb/nexing.htm Nexing Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/web/books.html On-line books at CMU]&lt;br /&gt;
&lt;br /&gt;
*[http://logos.uio.no/opus/ OPUS -- An Open Source Parallel Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://elex.amu.edu.pl/~przemka/PICLE_search.php Polish subcorpus of the International Corpus of Learner English]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cirp.es/WXN/wxn/frames/proxectos.html Ramón Piñeiro Center for Research]&lt;br /&gt;
&lt;br /&gt;
*[http://about.reuters.com/researchandstandards/corpus/ Reuters Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S97.html Speech in Noisy Environments 1 (SPINE1 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ldc.upenn.edu/Catalog/LDC2001S99.html Speech in Noisy Environments 2 (SPINE2 CODED) Coded Audio]&lt;br /&gt;
&lt;br /&gt;
*[http://www.cs.cmu.edu/afs/cs/project/ai-repository/ai/areas/nlp/doc/notes/corpora.txt Survey of Electronic Corpora (by Jane A. Edwards, file at CMU)]&lt;br /&gt;
&lt;br /&gt;
*[http://www.ucl.ac.uk/english-usage/ Survey of English Usage, University College, London]&lt;br /&gt;
&lt;br /&gt;
*[http://www.icsi.berkeley.edu/real/stp/index.html Switchboard Transcription Project]&lt;br /&gt;
&lt;br /&gt;
*[http://www.tractor.de/ TELRI Research Archive of Computational Tools and Resources]&lt;br /&gt;
&lt;br /&gt;
*[http://childes.psy.cmu.edu/ The Childes Corpus - Children&#039;s language]&lt;br /&gt;
&lt;br /&gt;
*[http://nora.hd.uib.no/index-e.html The CORPORA DataCenter (Norway)]&lt;br /&gt;
&lt;br /&gt;
*[ftp://ftp.dcs.shef.ac.uk/share/ilash/Moby/ The Moby Corpus]&lt;br /&gt;
&lt;br /&gt;
*[http://www.hf.uio.no/tekstlab/prosjekter/SOFIE.htm The Sofie Treebank - A Parallel Treebank of North European Languages]&lt;/div&gt;</summary>
		<author><name>Sean Bethard</name></author>
	</entry>
</feed>