[Retour à la fiche]
Métadonnées au format OLAC
<?xml version="1.0" encoding="UTF-8"?>
<!-- OLAC 1.1 metadata record for the "Language detector" software resource.
     Elements are taken from Dublin Core (dc:) and DC Terms (dcterms:);
     an xsi:type attribute names the encoding scheme of the element value. -->
<olac:olac
    xmlns:olac="http://www.language-archives.org/OLAC/1.1/"
    xmlns:dc="http://purl.org/dc/elements/1.1/"
    xmlns:dcterms="http://purl.org/dc/terms/"
    xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
    xsi:schemaLocation="http://www.language-archives.org/OLAC/1.1/ http://www.language-archives.org/OLAC/1.1/olac.xsd
                        http://purl.org/dc/elements/1.1/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dc.xsd
                        http://purl.org/dc/terms/ http://dublincore.org/schemas/xmls/qdc/2006/01/06/dcterms.xsd">
  <dc:title>Language detector</dc:title>
  <!-- The start tag was previously written twice, which left one dc:publisher unclosed. -->
  <dc:publisher>LPP (P3) : Laboratoire de phonétique et de phonologie</dc:publisher>
  <dc:creator/>
  <dcterms:accessRights>Téléchargement</dcterms:accessRights>
  <dcterms:license>GPL</dcterms:license>
  <dcterms:provenance/>
  <dc:language/>
  <!-- "abstract" is a DC Terms refinement of dc:description, so it lives in the
       dcterms namespace. The text is left unindented on purpose: whitespace
       inside the element is part of the value. -->
  <dcterms:abstract>Trouve la langue d'un texte grâce à l'algorithme suivant :
* finds among the 20 most common characters of the text the most common unicode category. If this category is a letter (category starting with “L” : Ll=letter lower case, Lu=letter upper case, Lo=letter other) continue, if not (ie. Mostly other characters like ponctuation) give up.
* Check among the 20 most common characters if the first word of the unicode name gives a unique language name</dcterms:abstract>
  <dc:description/>
  <dc:source/>
  <dc:identifier xsi:type="dcterms:URI">http://elizia.net/languageDetector/languageDetector.html</dc:identifier>
  <!-- NOTE(review): the source value was 2024-22-12, which is not a valid W3CDTF
       date (month 22). Day and month are assumed to have been swapped; confirm
       the actual creation date. -->
  <dcterms:created xsi:type="dcterms:W3CDTF">2024-12-22</dcterms:created>
  <dc:type/>
  <dc:format>application/Python</dc:format>
  <dc:type xsi:type="dcterms:DCMIType">Software</dc:type>
</olac:olac>