<html xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" xmlns:w="urn:schemas-microsoft-com:office:word" xmlns="http://www.w3.org/TR/REC-html40">

<head>
<meta http-equiv=Content-Type content="text/html; charset=iso-8859-1">
<meta name=Generator content="Microsoft Word 11 (filtered medium)">
<!--[if !mso]>
<style>
v\:* {behavior:url(#default#VML);}
o\:* {behavior:url(#default#VML);}
w\:* {behavior:url(#default#VML);}
.shape {behavior:url(#default#VML);}
</style>
<![endif]-->
<style>
<!--
 /* Font Definitions */
 @font-face
        {font-family:Times;
        panose-1:2 2 6 3 5 4 5 2 3 4;}
@font-face
        {font-family:"Comic Sans MS";
        panose-1:3 15 7 2 3 3 2 2 2 4;}
@font-face
        {font-family:Tahoma;
        panose-1:2 11 6 4 3 5 4 4 2 4;}
 /* Style Definitions */
 p.MsoNormal, li.MsoNormal, div.MsoNormal
        {margin:0cm;
        margin-bottom:.0001pt;
        font-size:10.0pt;
        font-family:"Times New Roman";}
h3
        {margin-top:12.0pt;
        margin-right:0cm;
        margin-bottom:12.0pt;
        margin-left:121.05pt;
        text-align:justify;
        text-indent:-36.0pt;
        page-break-after:avoid;
        mso-list:l0 level3 lfo3;
        font-size:11.0pt;
        font-family:Times;}
a:link, span.MsoHyperlink
        {color:blue;
        text-decoration:underline;}
a:visited, span.MsoHyperlinkFollowed
        {color:blue;
        text-decoration:underline;}
p.MsoPlainText, li.MsoPlainText, div.MsoPlainText
        {margin:0cm;
        margin-bottom:.0001pt;
        font-size:10.0pt;
        font-family:"Courier New";}
p.example, li.example, div.example
        {margin-top:0cm;
        margin-right:0cm;
        margin-bottom:0cm;
        margin-left:4.0cm;
        margin-bottom:.0001pt;
        font-size:10.0pt;
        font-family:Times;}
p.Reference-style, li.Reference-style, div.Reference-style
        {margin-top:0cm;
        margin-right:0cm;
        margin-bottom:0cm;
        margin-left:93.55pt;
        margin-bottom:.0001pt;
        text-align:justify;
        text-indent:-8.5pt;
        font-size:10.0pt;
        font-family:Times;}
span.EmailStyle20
        {mso-style-type:personal-reply;
        font-family:Arial;
        color:navy;}
@page Section1
        {size:595.3pt 841.9pt;
        margin:72.0pt 90.0pt 72.0pt 90.0pt;}
div.Section1
        {page:Section1;}
 /* List Definitions */
 @list l0
        {mso-list-id:1466972362;
        mso-list-template-ids:262287612;}
@list l0:level1
        {mso-level-text:%1;
        mso-level-tab-stop:106.65pt;
        mso-level-number-position:left;
        margin-left:106.65pt;
        text-indent:-21.6pt;}
@list l0:level2
        {mso-level-text:"%1\.%2";
        mso-level-tab-stop:113.85pt;
        mso-level-number-position:left;
        margin-left:113.85pt;
        text-indent:-28.8pt;}
@list l0:level3
        {mso-level-style-link:"Heading 3";
        mso-level-text:"\.\.%3";
        mso-level-tab-stop:121.05pt;
        mso-level-number-position:left;
        margin-left:121.05pt;
        text-indent:-36.0pt;
        font-variant:normal !important;
        mso-hide:none;
        text-transform:none;
        position:relative;
        top:0pt;
        mso-text-raise:0pt;
        letter-spacing:0pt;
        mso-font-kerning:0pt;
        text-effect:none;
        text-shadow:none;
        text-effect:none;
        text-effect:none;
        font-emphasize:none;
        mso-ansi-font-style:normal;
        mso-bidi-font-style:normal;
        text-decoration:none;
        text-underline:none;
        text-decoration:none;
        text-line-through:none;
        vertical-align:baseline;}
@list l0:level4
        {mso-level-text:"%1\.%2\.%3\.%4";
        mso-level-tab-stop:128.25pt;
        mso-level-number-position:left;
        margin-left:128.25pt;
        text-indent:-43.2pt;}
@list l0:level5
        {mso-level-text:"%1\.%2\.%3\.%4\.%5";
        mso-level-tab-stop:135.45pt;
        mso-level-number-position:left;
        margin-left:135.45pt;
        text-indent:-50.4pt;}
@list l0:level6
        {mso-level-text:"%1\.%2\.%3\.%4\.%5\.%6";
        mso-level-tab-stop:142.65pt;
        mso-level-number-position:left;
        margin-left:142.65pt;
        text-indent:-57.6pt;}
@list l0:level7
        {mso-level-text:"%1\.%2\.%3\.%4\.%5\.%6\.%7";
        mso-level-tab-stop:149.85pt;
        mso-level-number-position:left;
        margin-left:149.85pt;
        text-indent:-64.8pt;}
@list l0:level8
        {mso-level-text:"%1\.%2\.%3\.%4\.%5\.%6\.%7\.%8";
        mso-level-tab-stop:157.05pt;
        mso-level-number-position:left;
        margin-left:157.05pt;
        text-indent:-72.0pt;}
@list l0:level9
        {mso-level-text:"%1\.%2\.%3\.%4\.%5\.%6\.%7\.%8\.%9";
        mso-level-tab-stop:164.25pt;
        mso-level-number-position:left;
        margin-left:164.25pt;
        text-indent:-79.2pt;}
ol
        {margin-bottom:0cm;}
ul
        {margin-bottom:0cm;}
-->
</style>
<!--[if gte mso 9]><xml>
 <o:shapedefaults v:ext="edit" spidmax="1026" />
</xml><![endif]--><!--[if gte mso 9]><xml>
 <o:shapelayout v:ext="edit">
  <o:idmap v:ext="edit" data="1" />
 </o:shapelayout></xml><![endif]-->
</head>

<body lang=EN-GB link=blue vlink=blue>

<div class=Section1>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>Dear Mihai,<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>Both the JRC-Acquis parallel corpus and
the DGT-Translation Memory contain Romanian texts. However, they are not speech
transcriptions. <o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>You can find more information on our
website and also download them from there:<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>            <a
href="http://langtech.jrc.it/">http://langtech.jrc.it/</a><o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>The <b><span style='font-weight:bold'>JRC-Acquis</span></b>
has both full texts in 22 languages (including Romanian) and ~sentence
alignments for all 21 language pairs involving Romanian. The Romanian part of
the JRC-Acquis consists of about 20 Million words. <o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><b><font size=2 color=navy face=Arial><span
style='font-size:10.0pt;font-family:Arial;color:navy;font-weight:bold'>DGT-TM</span></font></b><font
color=navy face=Arial><span style='font-family:Arial;color:navy'> is a
Translation Memory involving the same 22 languages, i.e. it is a loose collection
of translation units (mostly sentences). From these, the full text cannot be
reconstructed, but the added value compared to JRC-Acquis is that the cross-lingual
sentence alignments have been verified manually. The size of the Romanian part is
650,000 translation units (~sentences).<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>I hope this helps.<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>All the best,<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'>Ralf<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal style='margin-bottom:12.0pt'><b><font size=1 color=gray
face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray;font-weight:bold'>Ralf Steinberger</span></font></b><font size=1
color=gray face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray'> (</span></font><font size=1 color=gray face="Comic Sans MS"><span
lang=DE style='font-size:8.0pt;font-family:"Comic Sans MS";color:gray'><a
href="mailto:Ralf.Steinberger@jrc.it" title="mailto:Ralf.Steinberger@jrc.it"><font
color=gray><span lang=EN-GB style='color:gray'><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it"><span
title="mailto:Ralf.Steinberger@jrc.it">Ralf.Steinberger@jrc.it</span></span></span></span></span></font></a></span></font><font
size=1 color=gray face="Comic Sans MS"><span style='font-size:7.5pt;font-family:
"Comic Sans MS";color:gray'>) <br>
European Commission - Joint Research Centre (JRC)<br>
IPSC - SeS - Language Technology (</span></font><font size=1
color=gray face="Comic Sans MS"><span style='font-size:8.0pt;font-family:"Comic Sans MS";
color:gray'><a href="http://langtech.jrc.it/"
title="http://langtech.jrc.it/ http://www.jrc.it/langtech"><font size=1
color=gray><span style='font-size:7.5pt;color:gray'><span
title="http://langtech.jrc.it/ http://www.jrc.it/langtech"><span
title="http://langtech.jrc.it/"><span title="http://langtech.jrc.it/"><span
title="http://langtech.jrc.it/ http://www.jrc.it/langtech">http://langtech.jrc.it</span></span></span></span></span></font></a></span></font><font
size=1 color=gray face="Comic Sans MS"><span style='font-size:7.5pt;font-family:
"Comic Sans MS";color:gray'>) </span></font><font color=maroon face=Arial><span
style='font-family:Arial;color:maroon'><o:p></o:p></span></font></p>

<p class=MsoNormal><b><u><font size=1 color=maroon face=Arial><span
style='font-size:9.0pt;font-family:Arial;color:maroon;font-weight:bold'>JRC-Acquis
Multilingual Parallel Corpus</span></font></u></b><font size=1 color=maroon
face=Arial><span style='font-size:9.0pt;font-family:Arial;color:maroon'>
(Version 3)<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><b><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon;font-weight:bold'>Freely available</span></font></b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'> for research purposes.<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><b><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon;font-weight:bold'>22 languages</span></font></b><font size=1
color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>: Bulgarian, Czech, Danish, German, Greek, English, Spanish,
Estonian, Finnish, French, Hungarian, Italian, Lithuanian, Latvian, Maltese,
Dutch, Polish, Portuguese, Romanian, Slovak, Slovene and Swedish.<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>Altogether<b><span style='font-weight:bold'> over 1 Billion words</span></b>.<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>Sentence <b><span style='font-weight:bold'>alignment for 231
language pairs</span></b>.<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:31.35pt;text-indent:-14.15pt'><font
size=2 face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'>For more information and <b><span style='font-weight:bold'>download</span></b>,
see <a href="http://langtech.jrc.it/JRC-Acquis.html"
title="http://langtech.jrc.it/JRC-Acquis.html"><font color=purple><span
style='color:purple'>http://langtech.jrc.it/JRC-Acquis.html</span></font></a>.<o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color="#993366" face=Arial><span
style='font-size:10.0pt;font-family:Arial;color:#993366'>                                                                                        </span></font><font
face=Arial><span style='font-family:Arial'><o:p></o:p></span></font></p>

<p class=MsoNormal><font size=1 color=maroon face=Arial><span style='font-size:
9.0pt;font-family:Arial;color:maroon'>The <b><u><span style='font-weight:bold'>JRC’s
Language Technology group</span></u></b> specialises in the development of
highly multilingual text analysis tools and in cross-lingual applications. Many
applications are accessible online, e.g.:<o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 face=Arial><span style='font-size:8.0pt;font-family:Arial'><a
href="http://press.jrc.it/NewsExplorer/"
title="http://press.jrc.it/NewsExplorer/"><font color=purple><span
style='color:purple'>NewsExplorer</span></font></a><font color=maroon><span
style='color:maroon'>: multilingual news aggregation and analysis (19
languages); allows users to navigate the news over time and across languages; trend
analysis; collects information about people from the news; social network
detection.</span></font><o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 face=Arial><span style='font-size:8.0pt;font-family:Arial'><a
href="http://press.jrc.it/" title="http://press.jrc.it/"><font color=purple><span
style='color:purple'>NewsBrief</span></font></a><font color=maroon><span
style='color:maroon'>: breaking news detection and display of the very latest
thematic news from around the world; email alerting (22+ languages).</span></font><o:p></o:p></span></font></p>

<p class=MsoNormal style='margin-left:1.0cm;text-indent:-14.15pt'><font size=2
face=Symbol><span style='font-size:10.0pt;font-family:Symbol'>·</span></font><font
size=1><span style='font-size:7.0pt'>       </span></font><font
size=1 color=maroon face=Arial><span style='font-size:8.0pt;font-family:Arial;
color:maroon'><a href="http://medusa.jrc.it/" title="http://medusa.jrc.it/"><font
color=purple><span style='color:purple'>MedISys</span></font></a> Medical
Information System: latest health-related news from around the world according
to themes and diseases (22+ languages).</span></font><font size=1 face=Arial><span
style='font-size:8.0pt;font-family:Arial'><o:p></o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<p class=MsoNormal><font size=2 color=navy face=Arial><span style='font-size:
10.0pt;font-family:Arial;color:navy'><o:p> </o:p></span></font></p>

<div>

<div class=MsoNormal align=center style='text-align:center'><font size=2
face="Times New Roman"><span lang=EN-US style='font-size:10.0pt'>

<hr size=2 width="100%" align=center tabindex=-1>

</span></font></div>

<p class=MsoNormal><b><font size=2 face=Tahoma><span lang=EN-US
style='font-size:10.0pt;font-family:Tahoma;font-weight:bold'>From:</span></font></b><font
face=Tahoma><span lang=EN-US style='font-family:Tahoma'> corpora-bounces@uib.no
[mailto:corpora-bounces@uib.no] <b><span style='font-weight:bold'>On Behalf Of </span></b>Mihai
Daniel Frumuselu<br>
<b><span style='font-weight:bold'>Sent:</span></b> 03 December 2007 18:31<br>
<b><span style='font-weight:bold'>To:</span></b> Corpora@uib.no<br>
<b><span style='font-weight:bold'>Subject:</span></b> [Corpora-List] Romanian
language corpora</span></font><span lang=EN-US><o:p></o:p></span></p>

</div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'><o:p> </o:p></span></font></p>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'>Dear Madam/Sir,<o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'> <o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'>I am currently looking for Romanian language corpora in electronic
format, particularly conversation transcriptions. A colleague from Linguist
List advised me to contact you. Do you happen to know whether there are corpora of
Romanian, either online or on a disk? <o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'> <o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'>Thank you and best regards,<o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'> <o:p></o:p></span></font></p>

</div>

<div>

<p class=MsoNormal><font size=2 face="Times New Roman"><span style='font-size:
10.0pt'>Mihai Frumuselu<br clear=all>
<br>
<br>
</span></font><font size=1><span style='font-size:7.5pt'>Mihai Daniel Frumuselu<br>
doktorand i lingvistik<br>
<br>
Björnkullaringen 28D<br>
141 51 Huddinge<br>
<br>
Tlf.:  (08) 42 86 52 31 (hemma)<br>
        0704 - 29 85 51 (mobil) <br>
<br>
<a href="http://www.mihai.se">www.mihai.se</a>, <a
href="http://www.oru.se/hum/mihai_frumuselu">www.oru.se/hum/mihai_frumuselu</a><br>
<a href="http://www.mihaidaniel.myphotoalbum.com">www.mihaidaniel.myphotoalbum.com
</a><br>
e-post: <a href="mailto:mihai.frumuselu@gmail.com">mihai.frumuselu@gmail.com</a>
</span></font><o:p></o:p></p>

</div>

</div>

</body>

</html>