LabEx EFL


[Retour à la fiche]

Métadonnées au format OLAC

 
  <?xml version="1.0" encoding="UTF-8"?>
  <olac:olac
   xmlns:olac="http://www.language-archives.org/OLAC/1.1/" 
   xmlns:dc="http://purl.org/dc/elements/1.1/" 
   xmlns:dcterms="http://purl.org/dc/terms/" 
   xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
   xsi:schemaLocation="http://www.language-archives.org/OLAC/1.1/ http://www.language-archives.org/OLAC/1.1/olac.xsd http://purl.org/dc/elements/1.1/
   http://dublincore.org/schemas/xmls/qdc/2006/01/06/dc.xsd http://purl.org/dc/terms/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dcterms.xsd">
  <dc:title>Language detector</dc:title>
  <dc:publisher>LPP (P3) : Laboratoire de phonétique et de phonologie</dc:publisher>
  <dc:creator/>
  <dcterms:accessRights>Téléchargement</dcterms:accessRights>
  <dcterms:license>GPL</dcterms:license>
  <dcterms:provenance/>
  <dc:language/>
  <dcterms:abstract>Trouve la langue d'un texte grâce à l'algorithme suivant :
* Finds, among the 20 most common characters of the text, the most common Unicode category. If this category is a letter (category starting with “L”: Ll = lowercase letter, Lu = uppercase letter, Lo = other letter), continue; if not (i.e. mostly other characters such as punctuation), give up.
* Checks, among the 20 most common characters, whether the first word of the Unicode name gives a unique language name</dcterms:abstract>
  <dc:description/>
  <dc:source/>
  <dc:identifier xsi:type="dcterms:URI">http://elizia.net/languageDetector/languageDetector.html</dc:identifier>
  <dcterms:created xsi:type="dcterms:W3CDTF">2024-12-22</dcterms:created>
  <dc:type/>
  <dc:format>application/Python</dc:format>
  <dc:type xsi:type="dcterms:DCMIType">Software</dc:type>
  </olac:olac>