<html xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" xmlns:w="urn:schemas-microsoft-com:office:word" xmlns="http://www.w3.org/TR/REC-html40">
<head>
<!-- Document metadata: declared encoding, a title taken from the message subject, and the authoring tool. -->
<!-- NOTE(review): the body contains non-ASCII characters (a curly apostrophe and middle-dot bullets); confirm the stored file encoding agrees with this us-ascii declaration. -->
<meta http-equiv="Content-Type" content="text/html; charset=us-ascii">
<title>[Corpora-List] free corpus</title>
<meta name="Generator" content="Microsoft Word 11 (filtered medium)">
<!-- The block below attaches the default VML behavior to v:, o: and w: namespaced elements and to the .shape class. It sits inside an [if !mso] conditional comment, so parsers that do not evaluate conditional comments read it as an ordinary comment. -->
<!--[if !mso]>
<style>
v\:* {behavior:url(#default#VML);}
o\:* {behavior:url(#default#VML);}
w\:* {behavior:url(#default#VML);}
.shape {behavior:url(#default#VML);}
</style>
<![endif]-->
<style>
<!--
/* Font faces declared for this document, each with its PANOSE number */
@font-face {
  font-family: Times;
  panose-1: 2 2 6 3 5 4 5 2 3 4;
}

@font-face {
  font-family: "Comic Sans MS";
  panose-1: 3 15 7 2 3 3 2 2 2 4;
}

@font-face {
  font-family: Tahoma;
  panose-1: 2 11 6 4 3 5 4 4 2 4;
}
/* Element and class styles, followed by the page box used by div.Section1.
   Declarations are kept in their original order: where a property appears
   twice in one rule (margin-bottom), the later value is the one that applies. */
p.MsoNormal,
li.MsoNormal,
div.MsoNormal {
  margin: 0cm;
  margin-bottom: .0001pt;
  font-size: 10.0pt;
  font-family: "Times New Roman";
}

h3 {
  margin-top: 12.0pt;
  margin-right: 0cm;
  margin-bottom: 12.0pt;
  margin-left: 121.05pt;
  text-align: justify;
  text-indent: -36.0pt;
  page-break-after: avoid;
  mso-list: l0 level3 lfo3;
  font-size: 11.0pt;
  font-family: Times;
}

a:link,
span.MsoHyperlink {
  color: blue;
  text-decoration: underline;
}

a:visited,
span.MsoHyperlinkFollowed {
  color: purple;
  text-decoration: underline;
}

p.MsoPlainText,
li.MsoPlainText,
div.MsoPlainText {
  margin: 0cm;
  margin-bottom: .0001pt;
  font-size: 10.0pt;
  font-family: "Courier New";
}

p.example,
li.example,
div.example {
  margin-top: 0cm;
  margin-right: 0cm;
  margin-bottom: 0cm;
  margin-left: 4.0cm;
  margin-bottom: .0001pt;
  font-size: 10.0pt;
  font-family: Times;
}

p.Reference-style,
li.Reference-style,
div.Reference-style {
  margin-top: 0cm;
  margin-right: 0cm;
  margin-bottom: 0cm;
  margin-left: 93.55pt;
  margin-bottom: .0001pt;
  text-align: justify;
  text-indent: -8.5pt;
  font-size: 10.0pt;
  font-family: Times;
}

span.EmailStyle20 {
  mso-style-type: personal-reply;
  font-family: Arial;
  color: navy;
}

@page Section1 {
  size: 595.3pt 841.9pt;
  margin: 72.0pt 90.0pt 72.0pt 90.0pt;
}

div.Section1 {
  page: Section1;
}
/* List definitions: the nine levels of list l0 (referenced by the h3 rule via
   mso-list), followed by the ol/ul bottom margins. Each level sets its number
   text, tab stop, left margin and hanging indent. In level3 the repeated
   text-effect:none and text-decoration:none declarations have been collapsed
   to a single occurrence each; the values are unchanged. */
@list l0 {
  mso-list-id: 1466972362;
  mso-list-template-ids: 262287612;
}

@list l0:level1 {
  mso-level-text: %1;
  mso-level-tab-stop: 106.65pt;
  mso-level-number-position: left;
  margin-left: 106.65pt;
  text-indent: -21.6pt;
}

@list l0:level2 {
  mso-level-text: "%1\.%2";
  mso-level-tab-stop: 113.85pt;
  mso-level-number-position: left;
  margin-left: 113.85pt;
  text-indent: -28.8pt;
}

@list l0:level3 {
  mso-level-style-link: "Heading 3";
  mso-level-text: "\.\.%3";
  mso-level-tab-stop: 121.05pt;
  mso-level-number-position: left;
  margin-left: 121.05pt;
  text-indent: -36.0pt;
  font-variant: normal !important;
  mso-hide: none;
  text-transform: none;
  position: relative;
  top: 0pt;
  mso-text-raise: 0pt;
  letter-spacing: 0pt;
  mso-font-kerning: 0pt;
  text-effect: none;
  text-shadow: none;
  font-emphasize: none;
  mso-ansi-font-style: normal;
  mso-bidi-font-style: normal;
  text-decoration: none;
  text-underline: none;
  text-line-through: none;
  vertical-align: baseline;
}

@list l0:level4 {
  mso-level-text: "%1\.%2\.%3\.%4";
  mso-level-tab-stop: 128.25pt;
  mso-level-number-position: left;
  margin-left: 128.25pt;
  text-indent: -43.2pt;
}

@list l0:level5 {
  mso-level-text: "%1\.%2\.%3\.%4\.%5";
  mso-level-tab-stop: 135.45pt;
  mso-level-number-position: left;
  margin-left: 135.45pt;
  text-indent: -50.4pt;
}

@list l0:level6 {
  mso-level-text: "%1\.%2\.%3\.%4\.%5\.%6";
  mso-level-tab-stop: 142.65pt;
  mso-level-number-position: left;
  margin-left: 142.65pt;
  text-indent: -57.6pt;
}

@list l0:level7 {
  mso-level-text: "%1\.%2\.%3\.%4\.%5\.%6\.%7";
  mso-level-tab-stop: 149.85pt;
  mso-level-number-position: left;
  margin-left: 149.85pt;
  text-indent: -64.8pt;
}

@list l0:level8 {
  mso-level-text: "%1\.%2\.%3\.%4\.%5\.%6\.%7\.%8";
  mso-level-tab-stop: 157.05pt;
  mso-level-number-position: left;
  margin-left: 157.05pt;
  text-indent: -72.0pt;
}

@list l0:level9 {
  mso-level-text: "%1\.%2\.%3\.%4\.%5\.%6\.%7\.%8\.%9";
  mso-level-tab-stop: 164.25pt;
  mso-level-number-position: left;
  margin-left: 164.25pt;
  text-indent: -79.2pt;
}

ol {
  margin-bottom: 0cm;
}

ul {
  margin-bottom: 0cm;
}
-->
</style>
<!-- Office shape settings (o:shapedefaults and o:shapelayout with its o:idmap), each wrapped in an [if gte mso 9] conditional comment; parsers that do not evaluate conditional comments read both blocks as ordinary comments. -->
<!--[if gte mso 9]><xml>
<o:shapedefaults v:ext="edit" spidmax="1026" />
</xml><![endif]--><!--[if gte mso 9]><xml>
<o:shapelayout v:ext="edit">
<o:idmap v:ext="edit" data="1" />
</o:shapelayout></xml><![endif]-->
</head>
<body lang=EN-GB link=blue vlink=purple>
<div class=Section1>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>Hello Peter,<o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>You did not say which languages you were
looking for. The JRC-Acquis is a parallel corpus in 22 EU languages. It is
freely available for research purposes. You can find it at </span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'><a href="http://langtech.jrc.it/JRC-Acquis.html"
title="http://langtech.jrc.it/JRC-Acquis.html"><font color=purple><span
style='color:purple'>http://langtech.jrc.it/JRC-Acquis.html</span></font></a></span></font><font
color=navy face=Arial><span style='font-family:Arial;color:navy'>. You can
download a single language or all, with or without alignment information.</span></font><font
color=navy face=Arial><span style='font-family:Arial;color:navy'><o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>It is not enormous for single languages (about
1 Billion words altogether for the 22 languages), but to our knowledge it is
the biggest parallel corpus, considering the number of languages it covers. I
hope this is useful for your purposes.<o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>All the best,<o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>Ralf <o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>
<div>
<div>
<p class=MsoNormal style='margin-bottom:12.0pt'><b><font size=1 color=gray
face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray;font-weight:bold'>Ralf Steinberger</span></font></b><font size=1
color=gray face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray'> (</span></font><font size=1 color=gray face="Comic Sans MS"><span
lang=DE style='font-size:8.0pt;font-family:"Comic Sans MS";color:gray'><a
href="mailto:Ralf.Steinberger@jrc.it" title="mailto:Ralf.Steinberger@jrc.it"><font
color=gray><span lang=EN-GB style='color:gray'><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it">Ralf.Steinberger@jrc.it</span></span></span></span></span></font></a></span></font><font
size=1 color=gray face="Comic Sans MS"><span style='font-size:7.5pt;font-family:
"Comic Sans MS";color:gray'>) <br>
European Commission - Joint Research Centre (JRC)<br>
IPSC - SeS - Language Technology (</span></font><font size=1
color=gray face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray'><a href="http://langtech.jrc.it/"
title="http://langtech.jrc.it/
http://www.jrc.it/langtech"><font size=1
color=gray><span style='font-size:7.5pt;color:gray'><span
title="http://langtech.jrc.it/
http://www.jrc.it/langtech"><span
title="http://langtech.jrc.it/"><span title="http://langtech.jrc.it/"><span
title="http://langtech.jrc.it/
http://www.jrc.it/langtech">http://langtech.jrc.it</span></span></span></span></span></font></a></span></font><font
size=1 color=gray face="Comic Sans MS"><span style='font-size:7.5pt;font-family:
"Comic Sans MS";color:gray'>) </span></font><font color=maroon face=Arial><span
style='font-family:Arial;color:maroon'><o:p></o:p></span></font></p>
<p class=MsoNormal><b><u><font size=1 color=maroon face=Arial><span
style='font-size:9.0pt;font-family:Arial;color:maroon;font-weight:bold'>JRC-Acquis
Multilingual Parallel Corpus</span></font></u></b><font size=1 color=maroon
face=Arial><span style='font-size:9.0pt;font-family:Arial;color:maroon'>
(Version 3)<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon;font-weight:bold'>Freely available</span></font></b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'> for research purposes.<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon;font-weight:bold'>22 languages</span></font></b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>: Bulgarian, Czech, Danish, German, Greek, English, Spanish,
Estonian, Finnish, French, Hungarian, Italian, Lithuanian, Latvian, Maltese,
Dutch, Polish, Portuguese, Romanian, Slovak, Slovene and Swedish.<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>Altogether<b><span style='font-weight:bold'> over 1 Billion words</span></b>.<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>Sentence <b><span style='font-weight:bold'>alignment for 231
language pairs</span></b>.<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>For more information and <b><span style='font-weight:bold'>download</span></b>,
see <a href="http://langtech.jrc.it/JRC-Acquis.html"
title="http://langtech.jrc.it/JRC-Acquis.html"><font color=purple><span
style='color:purple'>http://langtech.jrc.it/JRC-Acquis.html</span></font></a>.<o:p></o:p></span></font></p>
<p class=MsoNormal><font size=2 color="#993366" face=Arial><span
style='font-size:10.0pt;font-family:Arial;color:#993366'> </span></font><font
color=navy face=Arial><span style='font-family:Arial;color:navy'><o:p></o:p></span></font></p>
<p class=MsoNormal><font size=1 color=maroon face=Arial><span style='font-size:
9.0pt;font-family:Arial;color:maroon'>The <b><u><span style='font-weight:bold'>JRC’s
Language Technology group</span></u></b> specialises in the development of
highly multilingual text analysis tools and in cross-lingual applications. Many
applications are accessible online, e.g.:<o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=navy face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:navy'><a href="http://press.jrc.it/NewsExplorer/"
title="http://press.jrc.it/NewsExplorer/"><font color=purple><span
style='color:purple'>NewsExplorer</span></font></a></span></font><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>: multilingual news aggregation and analysis (19 languages);
allows users to navigate the news over time and across languages; trend analysis;
collects information about people from the news; social network detection.</span></font><font
size=1 color=navy face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:navy'><o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=navy face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:navy'><a href="http://press.jrc.it/" title="http://press.jrc.it/"><font
color=purple><span style='color:purple'>NewsBrief</span></font></a></span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>: breaking news detection and display of the very latest thematic
news from around the world; email alerting (22+ languages).</span></font><font
size=1 color=navy face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:navy'><o:p></o:p></span></font></p>
<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
color=navy face=Symbol><span style='font-size:10.0pt;font-family:Symbol;
color:navy'>·</span></font><font size=1 color=navy><span style='font-size:7.0pt;
color:navy'> </span></font><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'><a href="http://medusa.jrc.it/" title="http://medusa.jrc.it/"><font
color=purple><span style='color:purple'>MedISys</span></font></a> Medical
Information System: latest health-related news from around the world according
to themes and diseases (22+ languages).<o:p></o:p></span></font></p>
<p class=MsoNormal><font size=1 face=Arial><span style='font-size:8.0pt;
font-family:Arial'><o:p> </o:p></span></font></p>
</div>
</div>
<div>
<div class=MsoNormal align=center style='text-align:center'><font size=2
face="Times New Roman"><span lang=EN-US style='font-size:10.0pt'>
<hr size=2 width="100%" align=center tabindex=-1>
</span></font></div>
<p class=MsoNormal><b><font size=2 face=Tahoma><span lang=EN-US
style='font-size:10.0pt;font-family:Tahoma;font-weight:bold'>From:</span></font></b><font
face=Tahoma><span lang=EN-US style='font-family:Tahoma'> corpora-bounces@uib.no
[mailto:corpora-bounces@uib.no] <b><span style='font-weight:bold'>On Behalf Of </span></b>Peter
Isaev<br>
<b><span style='font-weight:bold'>Sent:</span></b> 19 November 2007 12:38<br>
<b><span style='font-weight:bold'>To:</span></b> CORPORA@uib.no<br>
<b><span style='font-weight:bold'>Subject:</span></b> [Corpora-List] free
corpus</span></font><span lang=EN-US><o:p></o:p></span></p>
</div>
<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'><o:p> </o:p></span></font></p>
<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'>Hello.<br>
<br>
I'm looking for free big corpus, consisting of plain text, something like BNC
corpus (it is not free).<br>
<br>
Where can I download it?<br>
<br>
Thank you.<o:p></o:p></span></font></p>
</div>
</body>
</html>