LabEx EFL


[Retour à la fiche]

Métadonnées au format OLAC

 
  <?xml version="1.0" encoding="UTF-8"?>
  <!--
    OLAC 1.1 metadata record for the Europarl3 parallel corpus (OPUS).
    Elements come from Dublin Core (dc:), DC Terms (dcterms:) and are wrapped
    in the olac:olac container; xsi:schemaLocation lists namespace / schema
    pairs as validation hints only.
  -->
  <olac:olac
   xmlns:olac="http://www.language-archives.org/OLAC/1.1/"
   xmlns:dc="http://purl.org/dc/elements/1.1/"
   xmlns:dcterms="http://purl.org/dc/terms/"
   xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
   xsi:schemaLocation="http://www.language-archives.org/OLAC/1.1/ http://www.language-archives.org/OLAC/1.1/olac.xsd
                       http://purl.org/dc/elements/1.1/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dc.xsd
                       http://purl.org/dc/terms/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dcterms.xsd">
  <dc:title>Europarl3</dc:title>
  <!-- No publisher value is recorded; kept as an explicit empty element (was an unclosed start tag). -->
  <dc:publisher/>
  <dc:creator>Jörg Tiedemann</dc:creator>
  <dcterms:accessRights>Téléchargement</dcterms:accessRights>
  <dcterms:license/>
  <dcterms:provenance>web (Parlement Européen)</dcterms:provenance>
  <!-- Language list aligned with the codes given in the abstract (da, de, el, en, es, fi, fr, it, nl, pt, sv). -->
  <dc:language>Danish, German, Greek, English, Spanish, Finnish, French, Italian, Dutch, Portuguese, Swedish</dc:language>
  <!-- "abstract" is a DC Terms refinement of description; it does not exist in the dc: elements namespace. -->
  <dcterms:abstract>Corpus parallèle issu du site du Parlement Européen. Environ 40 millions de mots par langue, 11 langues (da, de, el, en, es, fi, fr, it, nl, pt, sv).

11 languages, 55 bitexts (3.5 G)
total number of files: 7,034
total number of tokens: 404.01M
total number of sentence fragments: 15.81M</dcterms:abstract>
  <dc:description>annotations morpho-syntaxiques</dc:description>
  <dc:source>Jörg Tiedemann, 2009, News from OPUS - A Collection of Multilingual Parallel Corpora with Tools and Interfaces [pdf]     In N. Nicolov and K. Bontcheva and G. Angelova and R. Mitkov (eds.) Recent Advances in Natural Language Processing (vol V), pages 237-248, John Benjamins, Amsterdam/Philadelphia</dc:source>
  <dc:identifier xsi:type="dcterms:URI">http://opus.lingfil.uu.se/Europarl3.php</dc:identifier>
  <!-- W3CDTF requires YYYY-MM-DD; the original value had month 25. NOTE(review): assumed day and month were swapped; confirm the intended date. -->
  <dcterms:created xsi:type="dcterms:W3CDTF">2024-04-25</dcterms:created>
  <!-- Resource size belongs in dcterms:extent, not dc:type. -->
  <dcterms:extent>3,5 Go</dcterms:extent>
  <dc:format>text/XML, XCES</dc:format>
  <dc:type xsi:type="dcterms:DCMIType">Text</dc:type>
  </olac:olac>