LabEx EFL


[Retour à la fiche]

Métadonnées au format CLARIN

   <?xml version="1.0" encoding="UTF-8"?>
<!-- CMDI 1.1 metadata record for the Bijankhan Corpus, using the OLAC-DcmiTerms component
     of profile clarin.eu:cr1:p_1288172614026. MdCreator names olac2cmdi.xsl as the producer. -->
<CMD xmlns="http://www.clarin.eu/cmd/"
     xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
     xmlns:dc="http://purl.org/dc/elements/1.1/"
     xmlns:dcterms="http://purl.org/dc/terms/"
     xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/"
     xmlns:defns="http://www.openarchives.org/OAI/2.0/"
     xmlns:olac="http://www.language-archives.org/OLAC/1.0/"
     xmlns:olac11="http://www.language-archives.org/OLAC/1.1/"
     CMDVersion="1.1"
     xsi:schemaLocation="http://www.clarin.eu/cmd/ http://catalog.clarin.eu/ds/ComponentRegistry/rest/registry/profiles/clarin.eu:cr1:p_1288172614026/xsd">
   <!-- Record-level administrative metadata.
        NOTE(review): MdCreationDate, MdSelfLink and MdCollectionDisplayName are emitted empty;
        confirm whether downstream consumers need them populated. -->
   <Header>
      <MdCreator>olac2cmdi.xsl</MdCreator>
      <MdCreationDate/>
      <MdSelfLink/>
      <MdProfile>clarin.eu:cr1:p_1288172614026</MdProfile>
      <MdCollectionDisplayName/>
   </Header>
   <!-- A single resource proxy; its ResourceRef is the same URL as the identifier below. -->
   <Resources>
      <ResourceProxyList>
         <ResourceProxy id="d1e25">
            <ResourceType>Resource</ResourceType>
            <ResourceRef>http://ece.ut.ac.ir/dbrg/bijankhan/</ResourceRef>
         </ResourceProxy>
      </ResourceProxyList>
      <JournalFileProxyList/>
      <ResourceRelationList/>
   </Resources>
   <!-- Descriptive metadata. Several terms (creator, description, format, language, license,
        provenance, source and the last type) carry no value in this record. -->
   <Components>
      <OLAC-DcmiTerms>
         <abstract>Bijankhan corpus is a tagged corpus that is suitable for natural language processing research on the Persian (Farsi) language. This collection is gathered form daily news and common texts. In this collection all documents are categorized into different subjects such as political, cultural and so on. Totally, there are 4300 different subjects. The Bijankhan collection contains about 2.6 millions manually tagged words with a tag set that contains 40 Persian POS tags. This collection is prepared and distributed by database research group at University of Tehran.</abstract>
         <!-- Literal UTF-8 characters: XML predefines only lt, gt, amp, apos and quot, so HTML
              named entities such as eacute are undefined here. The value is French for "download". -->
         <accessRights>Téléchargement</accessRights>
         <!-- W3CDTF date in YYYY-MM-DD order. -->
         <created dcterms-type="W3CDTF">2024-03-29</created>
         <creator/>
         <description/>
         <format/>
         <identifier dcterms-type="URI">http://ece.ut.ac.ir/dbrg/bijankhan/</identifier>
         <language/>
         <license/>
         <provenance/>
         <source/>
         <title>Bijankhan Corpus</title>
         <type olac-linguistic-type="primary_text"/>
         <type olac-discourse-type="narrative"/>
         <!-- DCMI type follows the abstract, which describes a POS-tagged corpus of written text. -->
         <type dcterms-type="DCMIType">Text</type>
         <type/>
      </OLAC-DcmiTerms>
   </Components>
</CMD>