<div class="row">
        <div class="col-12">
            <pre class="with-hljs"><code class="lang-php">&lt;?php

/***************************************************************************\
 *  SPIP, Systeme de publication pour l&#039;internet                           *
 *                                                                         *
 *  Copyright (c) 2001-2016                                                *
 *  Arnaud Martin, Antoine Pitrou, Philippe Riviere, Emmanuel Saint-James  *
 *                                                                         *
 *  Ce programme est un logiciel libre distribue sous licence GNU/GPL.     *
 *  Pour plus de details voir le fichier COPYING.txt ou l&#039;aide en ligne.   *
\***************************************************************************/


// Stop here unless the _ECRIRE_INC_VERSION constant is defined
// (presumably set by the SPIP bootstrap - TODO confirm).
if (!defined(&#039;_ECRIRE_INC_VERSION&#039;)) return;


/*
 * charsets supportes en natif : voir les tables dans ecrire/charsets/
 * les autres charsets sont supportes via mbstring()
 */

// http://doc.spip.org/@load_charset
/**
 * Normalise a charset name and make sure a conversion table is registered for it.
 *
 * Tables live in $GLOBALS[CHARSET], keyed by the normalised name. Once a name
 * is registered (even as an empty placeholder after a failed lookup), later
 * calls return that name straight away.
 *
 * @param string $charset
 *     Charset name; AUTO means the site charset read from $GLOBALS[meta][charset].
 * @param string $langue_site
 *     Unused. Kept so that callers passing two arguments keep working.
 * @return string|bool
 *     The normalised charset name, or false when no charsets/NAME.php file
 *     was found during this call.
 */
function load_charset ($charset = &#039;AUTO&#039;, $langue_site = &#039;AUTO&#039;) {
	if ($charset == &#039;AUTO&#039;)
		$charset = $GLOBALS[&#039;meta&#039;][&#039;charset&#039;];
	$charset = trim(strtolower($charset));

	// Already registered: nothing to load
	if (isset($GLOBALS[&#039;CHARSET&#039;][$charset]))
		return $charset;

	// utf-8 needs no conversion table, register an empty one
	if ($charset == &#039;utf-8&#039;) {
		$GLOBALS[&#039;CHARSET&#039;][$charset] = array();
		return $charset;
	}

	// A few synonyms
	if ($charset == &#039;&#039;) $charset = &#039;iso-8859-1&#039;;
	elseif ($charset == &#039;windows-1250&#039;) $charset = &#039;cp1250&#039;;
	elseif ($charset == &#039;windows-1251&#039;) $charset = &#039;cp1251&#039;;
	elseif ($charset == &#039;windows-1256&#039;) $charset = &#039;cp1256&#039;;

	// NOTE(review): the third argument of find_in_path() presumably makes it
	// include the file, which is expected to fill $GLOBALS[CHARSET][NAME] - confirm.
	if (find_in_path($charset . &#039;.php&#039;, &#039;charsets/&#039;, true)) {
		return $charset;
	}

	// Unknown charset: log once and register an empty placeholder so that
	// the lookup is not attempted again
	spip_log(&quot;Erreur: pas de fichier de conversion &#039;charsets/$charset&#039;&quot;);
	$GLOBALS[&#039;CHARSET&#039;][$charset] = array();
	return false;
}

//
// Verifier qu&#039;on peut utiliser mb_string
//
// http://doc.spip.org/@init_mb_string
/**
 * Tell whether the mbstring extension can be used.
 *
 * The check runs once per request. When every required function exists and
 * mb_detect_order() accepts the site charset, the mbstring internal encoding
 * is switched to utf-8.
 *
 * @return bool true when mbstring is usable
 */
function init_mb_string() {
	// 0: not tested yet, 1: usable, -1: unusable
	static $etat = 0;

	if ($etat == 0) {
		$requises = array(
			&#039;mb_internal_encoding&#039;,
			&#039;mb_detect_order&#039;,
			&#039;mb_substr&#039;,
			&#039;mb_strlen&#039;,
			&#039;mb_encode_mimeheader&#039;,
			&#039;mb_encode_numericentity&#039;,
			&#039;mb_decode_numericentity&#039;,
		);
		$disponible = true;
		foreach ($requises as $fonction) {
			if (!function_exists($fonction)) {
				$disponible = false;
				break;
			}
		}

		// mb_detect_order() is only called once all functions are known to exist
		if ($disponible AND mb_detect_order($GLOBALS[&#039;meta&#039;][&#039;charset&#039;])) {
			mb_internal_encoding(&#039;utf-8&#039;);
			$etat = 1;
		} else {
			$etat = -1;
		}
	}

	return ($etat == 1);
}

// Detecter les versions buggees d&#039;iconv
// http://doc.spip.org/@test_iconv
/**
 * Detect a missing or broken iconv.
 *
 * A sample string is converted from utf-8 to utf-32 and decoded again with
 * utf_32_to_unicode(); iconv is trusted only when the round trip gives the
 * sample back. The verdict is memorised for the rest of the request.
 *
 * @return bool true when iconv can be used
 */
function test_iconv() {
	// 0: not tested yet, 1: usable, -1: unusable
	static $etat = 0;

	if ($etat == 0) {
		$etat = -1;
		if (function_exists(&#039;iconv&#039;)) {
			$echantillon = &#039;chaine de test&#039;;
			$retour = utf_32_to_unicode(@iconv(&#039;utf-8&#039;, &#039;utf-32&#039;, $echantillon));
			if ($retour == $echantillon)
				$etat = 1;
		}
	}

	return ($etat == 1);
}

// Test de fonctionnement du support UTF-8 dans PCRE
// (contournement bug Debian Woody)
// http://doc.spip.org/@test_pcre_unicode
/**
 * Check that PCRE handles the /u (UTF-8) modifier correctly.
 *
 * The sample is: space, e-acute, t, e-acute, space (in UTF-8). With working
 * UTF-8 support the three dots of the pattern match exactly the three
 * characters between the two spaces.
 *
 * @return bool true when the /u modifier works
 */
function test_pcre_unicode() {
	// 0: not tested yet, 1: works, -1: broken
	static $etat = 0;

	if ($etat == 0) {
		$echantillon = &quot; \xC3\xA9t\xC3\xA9 &quot;;
		$etat = preg_match(&#039;,\W...\W,u&#039;, $echantillon) ? 1 : -1;
	}

	return ($etat == 1);
}

// Plages alphanumeriques (incomplet...)
// http://doc.spip.org/@pcre_lettres_unicode
/**
 * Return the content of a PCRE character class matching letters (incomplete).
 *
 * When PCRE supports UTF-8 the class is widened with two Unicode ranges
 * (cf. http://www.unicode.org/charts/); otherwise it is a plain \w.
 *
 * @return string fragment to be placed between square brackets in a pattern
 */
function pcre_lettres_unicode() {
	static $plage;

	if ($plage)
		return $plage;

	// latin letters, always present
	$plage = &#039;\w&#039;;

	if (test_pcre_unicode()) {
		$plage .= &#039;\x{100}-\x{24f}&#039;;  // extended european
		$plage .= &#039;\x{300}-\x{1cff}&#039;; // lots of other scripts
	}

	return $plage;
}

// Punctuation range from U+2000 to U+206F
// (i.e. UTF-8 bytes 226-128-128 to 226-129-175)
// http://doc.spip.org/@plage_punct_unicode
/**
 * Return a byte-level PCRE fragment matching a three-byte UTF-8 sequence
 * whose first byte is E2, followed by either 80 and a byte in 80-BF,
 * or 81 and a byte in 80-AF.
 *
 * @return string pattern fragment (no delimiters)
 */
function plage_punct_unicode() {
	$premier_octet = &#039;\xE2&#039;;
	$octets_suivants = &#039;(\x80[\x80-\xBF]|\x81[\x80-\xAF])&#039;;

	return $premier_octet . $octets_suivants;
}

// corriger caracteres non-conformes : 128-159
// cf. charsets/iso-8859-1.php (qu&#039;on recopie ici pour aller plus vite)
// on peut passer un charset cible en parametre pour accelerer le passage iso-8859-1 -&gt; autre charset
// http://doc.spip.org/@corriger_caracteres_windows
/**
 * Replace the non-conforming characters 128-159 (Windows extensions).
 *
 * Only iso-8859-1 and utf-8 texts are handled; any other charset is returned
 * untouched. In utf-8 each of these characters is looked up as the two bytes
 * chr(194) + chr(128..159).
 *
 * @param string|array $texte
 *     Text to fix. Arrays are processed element by element, keys preserved.
 * @param string $charset
 *     Charset of $texte; AUTO means $GLOBALS[meta][charset].
 * @param string $charset_cible
 *     unicode (default) replaces with numeric entities; any other value has
 *     each entity passed through unicode2charset() for that charset.
 * @return string|array the corrected text
 */
function corriger_caracteres_windows($texte, $charset=&#039;AUTO&#039;, $charset_cible=&#039;unicode&#039;) {
	static $trans;

	// Recurse with the same charsets: the caller options must apply to
	// every element and not only to a top-level string
	if (is_array($texte)) {
		foreach ($texte as $cle =&gt; $valeur)
			$texte[$cle] = corriger_caracteres_windows($valeur, $charset, $charset_cible);
		return $texte;
	}

	if ($charset==&#039;AUTO&#039;) $charset = $GLOBALS[&#039;meta&#039;][&#039;charset&#039;];
	if ($charset == &#039;utf-8&#039;) {
		$p = chr(194);
		// fast path: without this lead byte there is nothing to fix
		if (strpos($texte,$p)===false) return $texte;
	} else if ($charset == &#039;iso-8859-1&#039;) {
		$p = &#039;&#039;;
	} else
		return $texte;

	// Build the table once per (source charset, target charset) pair
	if (!isset($trans[$charset][$charset_cible])) {
		$trans[$charset][$charset_cible] = array(
			$p.chr(128) =&gt; &quot;&amp;#8364;&quot;,
			$p.chr(129) =&gt; &#039; &#039;, # unassigned
			$p.chr(130) =&gt; &quot;&amp;#8218;&quot;,
			$p.chr(131) =&gt; &quot;&amp;#402;&quot;,
			$p.chr(132) =&gt; &quot;&amp;#8222;&quot;,
			$p.chr(133) =&gt; &quot;&amp;#8230;&quot;,
			$p.chr(134) =&gt; &quot;&amp;#8224;&quot;,
			$p.chr(135) =&gt; &quot;&amp;#8225;&quot;,
			$p.chr(136) =&gt; &quot;&amp;#710;&quot;,
			$p.chr(137) =&gt; &quot;&amp;#8240;&quot;,
			$p.chr(138) =&gt; &quot;&amp;#352;&quot;,
			$p.chr(139) =&gt; &quot;&amp;#8249;&quot;,
			$p.chr(140) =&gt; &quot;&amp;#338;&quot;,
			$p.chr(141) =&gt; &#039; &#039;, # unassigned
			$p.chr(142) =&gt; &quot;&amp;#381;&quot;,
			$p.chr(143) =&gt; &#039; &#039;, # unassigned
			$p.chr(144) =&gt; &#039; &#039;, # unassigned
			$p.chr(145) =&gt; &quot;&amp;#8216;&quot;,
			$p.chr(146) =&gt; &quot;&amp;#8217;&quot;,
			$p.chr(147) =&gt; &quot;&amp;#8220;&quot;,
			$p.chr(148) =&gt; &quot;&amp;#8221;&quot;,
			$p.chr(149) =&gt; &quot;&amp;#8226;&quot;,
			$p.chr(150) =&gt; &quot;&amp;#8211;&quot;,
			$p.chr(151) =&gt; &quot;&amp;#8212;&quot;,
			$p.chr(152) =&gt; &quot;&amp;#732;&quot;,
			$p.chr(153) =&gt; &quot;&amp;#8482;&quot;,
			$p.chr(154) =&gt; &quot;&amp;#353;&quot;,
			$p.chr(155) =&gt; &quot;&amp;#8250;&quot;,
			$p.chr(156) =&gt; &quot;&amp;#339;&quot;,
			$p.chr(157) =&gt; &#039; &#039;, # unassigned
			$p.chr(158) =&gt; &quot;&amp;#382;&quot;,
			$p.chr(159) =&gt; &quot;&amp;#376;&quot;,
		);
		if ($charset_cible!=&#039;unicode&#039;){
			foreach($trans[$charset][$charset_cible] as $k=&gt;$c)
				$trans[$charset][$charset_cible][$k] = unicode2charset($c, $charset_cible);
		}
	}

	return @str_replace(array_keys($trans[$charset][$charset_cible]),
			   array_values($trans[$charset][$charset_cible]),$texte);
}


//
// Transformer les &amp;eacute; en &amp;#123;
// $secure = true pour *ne pas convertir* les caracteres malins &amp;lt; &amp;amp; etc.
//
// http://doc.spip.org/@html2unicode
/**
 * Replace named HTML entities using the html charset table.
 *
 * @param string $texte
 * @param bool $secure
 *     true to leave &amp;amp; &amp;quot; &amp;lt; &amp;gt; untouched; false (default)
 *     to turn them into the raw characters as well.
 * @return string
 */
function html2unicode($texte, $secure=false) {
	static $table = array();

	// no ampersand, hence no entity
	if (strpos($texte,&#039;&amp;&#039;) === false)
		return $texte;

	// the table is built on first use from $GLOBALS[CHARSET][html]
	if (!$table) {
		load_charset(&#039;html&#039;);
		foreach ($GLOBALS[&#039;CHARSET&#039;][&#039;html&#039;] as $nom =&gt; $valeur)
			$table[&#039;&amp;&#039;.$nom.&#039;;&#039;] = $valeur;
	}

	$texte = str_replace(array_keys($table), array_values($table), $texte);
	if ($secure)
		return $texte;

	// non-secure mode: also decode the four markup-significant entities
	$entites = array(&#039;&amp;amp;&#039;, &#039;&amp;quot;&#039;, &#039;&amp;lt;&#039;, &#039;&amp;gt;&#039;);
	$caracteres = array(&#039;&amp;&#039;, &#039;&quot;&#039;, &#039;&lt;&#039;, &#039;&gt;&#039;);
	return str_replace($entites, $caracteres, $texte);
}

//
// Transformer les &amp;eacute; en &amp;#123;
//
// http://doc.spip.org/@mathml2unicode
/**
 * Replace named MathML entities using the mathml charset table.
 *
 * @param string $texte
 * @return string
 */
function mathml2unicode($texte) {
	// Initialised to an array so that array_keys() below never receives null
	// when the mathml table is missing or empty
	static $trans = array();

	if (!$trans) {
		global $CHARSET;
		load_charset(&#039;mathml&#039;);

		if (isset($CHARSET[&#039;mathml&#039;]) AND is_array($CHARSET[&#039;mathml&#039;])) {
			foreach ($CHARSET[&#039;mathml&#039;] as $key =&gt; $val)
				$trans[&quot;&amp;$key;&quot;] = $val;
		}
	}

	return str_replace(array_keys($trans),array_values($trans),$texte);
}


//
// Transforme une chaine en entites unicode &amp;#129;
//
// Note: l&#039;argument $forcer est obsolete : il visait a ne pas
// convertir les accents iso-8859-1
// http://doc.spip.org/@charset2unicode
/**
 * Turn a text in a given charset into ASCII plus numeric entities (&amp;#NNN;).
 *
 * Strategies are tried in this order: utf-8 decoder, mbstring, the tables
 * loaded by load_charset(), then iconv. When none works the text is returned
 * unchanged and an error is logged.
 *
 * @param string $texte
 * @param string $charset
 *     Source charset; AUTO means $GLOBALS[meta][charset], empty means iso-8859-1.
 *     (A former third argument $forcer is obsolete and ignored.)
 * @return string
 */
function charset2unicode($texte, $charset=&#039;AUTO&#039; /* $forcer: obsolete*/) {
	static $trans;
	global $CHARSET;

	if ($charset == &#039;AUTO&#039;)
		$charset = $GLOBALS[&#039;meta&#039;][&#039;charset&#039;];

	if ($charset == &#039;&#039;) $charset = &#039;iso-8859-1&#039;;
	$charset = strtolower($charset);

	switch ($charset) {
	case &#039;utf-8&#039;:
	case &#039;utf8&#039;:
		return utf_8_to_unicode($texte);

	case &#039;iso-8859-1&#039;:
		$texte = corriger_caracteres_windows($texte, &#039;iso-8859-1&#039;);
		// no break here: carry on with the default case

	default:
		// mbstring available?
		if (init_mb_string()) {
			$order = mb_detect_order();
			$s = false;
			# mb_detect_order($charset) doubles as a test: does mbstring know $charset?
			if ($order AND mb_detect_order($charset))
				$s = mb_convert_encoding($texte, &#039;utf-8&#039;, $charset);
			// Put the detection order back in every case, including when we
			// return just below (it used to leak on that path)
			if ($order)
				mb_detect_order($order);
			if ($s &amp;&amp; $s != $texte) return utf_8_to_unicode($s);
		}

		// Otherwise, maybe we have a table for this charset
		if (!isset($trans[$charset])) {
			// always an array afterwards, so the test below is safe
			$trans[$charset] = array();
			if ($cset = load_charset($charset)
			AND isset($CHARSET[$cset])
			AND is_array($CHARSET[$cset])) {
				foreach ($CHARSET[$cset] as $key =&gt; $val)
					$trans[$charset][chr($key)] = &#039;&amp;#&#039;.$val.&#039;;&#039;;
			}
		}
		if ($trans[$charset])
			return str_replace(array_keys($trans[$charset]),array_values($trans[$charset]),$texte);

		// Otherwise ask iconv (even though it truncates at the first character
		// outside the charset; that is mostly a utf-8 problem, handled above)
		if (test_iconv()) {
			$s = iconv($charset, &#039;utf-32le&#039;, $texte);
			if ($s) return utf_32_to_unicode($s);
		}

		// Last resort: do nothing
		spip_log(&quot;erreur charset &#039;$charset&#039; non supporte&quot;);
		return $texte;
	}
}

//
// Transforme les entites unicode &amp;#129; dans le charset specifie
// Attention on ne transforme pas les entites &lt; &amp;#128; car si elles
// ont ete encodees ainsi c&#039;est a dessein
// http://doc.spip.org/@unicode2charset
/**
 * Turn numeric entities back into characters of the given charset.
 *
 * For utf-8 the work is delegated to unicode_to_utf_8(). For any other
 * charset only the entities for code points 128 to 255 are handled, in
 * decimal (&amp;#NNN; with up to two leading zeros) and lowercase hexadecimal
 * (&amp;#xHH; with up to two leading zeros). A code point found in the reversed
 * charset table becomes the matching byte; the others become chr(code point).
 * Entities below 128 are never touched.
 *
 * @param string $texte
 * @param string $charset  target charset; AUTO means $GLOBALS[meta][charset]
 * @return string
 */
function unicode2charset($texte, $charset=&#039;AUTO&#039;) {
	static $CHARSET_REVERSE = array();
	static $trans = array();

	if ($charset == &#039;AUTO&#039;)
		$charset = $GLOBALS[&#039;meta&#039;][&#039;charset&#039;];

	switch($charset) {
	case &#039;utf-8&#039;:
		return unicode_to_utf_8($texte);

	default:
		$charset = load_charset($charset);

		// load_charset() returns false for an unsupported charset: cache that
		// case under the empty key with an empty table, instead of using
		// false as an array index and handing null to array_flip()
		$cle = ($charset === false) ? &#039;&#039; : $charset;

		if (!isset($CHARSET_REVERSE[$cle])) {
			$table = array();
			if ($charset !== false
			AND isset($GLOBALS[&#039;CHARSET&#039;][$charset])
			AND is_array($GLOBALS[&#039;CHARSET&#039;][$charset]))
				$table = $GLOBALS[&#039;CHARSET&#039;][$charset];
			// unicode code point =&gt; byte value
			$CHARSET_REVERSE[$cle] = array_flip($table);
		}

		if (!isset($trans[$cle])){
			$t = array();
			// 255 included: the former bound ($e &lt; 255) left &amp;#255; unconverted
			for ($e = 128; $e &lt;= 255; $e++) {
				$h = dechex($e);
				if (isset($CHARSET_REVERSE[$cle][$e]))
					$car = chr($CHARSET_REVERSE[$cle][$e]);
				else
					$car = chr($e);
				$t[&#039;&amp;#&#039;.$e.&#039;;&#039;] = $t[&#039;&amp;#0&#039;.$e.&#039;;&#039;] = $t[&#039;&amp;#00&#039;.$e.&#039;;&#039;] = $car;
				$t[&#039;&amp;#x&#039;.$h.&#039;;&#039;] = $t[&#039;&amp;#x0&#039;.$h.&#039;;&#039;] = $t[&#039;&amp;#x00&#039;.$h.&#039;;&#039;] = $car;
			}
			$trans[$cle] = $t;
		}

		return str_replace(array_keys($trans[$cle]),array_values($trans[$cle]),$texte);
	}
}


// Importer un texte depuis un charset externe vers le charset du site
// (les caracteres non resolus sont transformes en &amp;#123;)
// http://doc.spip.org/@importer_charset
/**
 * Import a text from an external charset into the site charset.
 *
 * The general route goes through numeric entities (charset2unicode() then
 * unicode2charset()). The iso-8859-1 to utf-8 case takes a direct route
 * through utf8_encode() when that function exists.
 *
 * @param string $texte
 * @param string $charset  charset of $texte
 * @return string
 */
function importer_charset($texte, $charset = &#039;AUTO&#039;) {
	// most frequent case, handled directly for speed
	$raccourci = ($charset == &#039;iso-8859-1&#039;)
		&amp;&amp; ($GLOBALS[&#039;meta&#039;][&#039;charset&#039;]==&#039;utf-8&#039;)
		&amp;&amp; function_exists(&#039;utf8_encode&#039;);

	if (!$raccourci)
		return unicode2charset(charset2unicode($texte, $charset));

	$corrige = corriger_caracteres_windows($texte, &#039;iso-8859-1&#039;,&#039;unicode&#039;);
	return utf8_encode($corrige);
}

// UTF-8
// http://doc.spip.org/@utf_8_to_unicode
/**
 * Convert a UTF-8 string to ASCII plus decimal numeric entities (&amp;#NNN;).
 *
 * With mbstring available the conversion is delegated to
 * mb_encode_numericentity(). Otherwise the string is walked byte by byte:
 * the value of the lead byte decides how many bytes form one character.
 *
 * @param string $source  UTF-8 text
 * @return string
 */
function utf_8_to_unicode($source) {

	// mbstring: fast path
	if (init_mb_string()) {
		$convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
		return mb_encode_numericentity($source, $convmap, &#039;UTF-8&#039;);
	}

	// Otherwise, step-by-step method
	static $decrement;
	static $shift;

	// Cf. php.net, by Ronen. Adapted for compatibility &lt; php4
	if (!is_array($decrement)) {
		// array used to figure what number to decrement from character order value
		// according to number of characters used to map unicode to ascii by utf-8
		$decrement[4] = 240;
		$decrement[3] = 224;
		$decrement[2] = 192;
		$decrement[1] = 0;
		// the number of bits to shift each charNum by
		$shift[1][0] = 0;
		$shift[2][0] = 6;
		$shift[2][1] = 0;
		$shift[3][0] = 12;
		$shift[3][1] = 6;
		$shift[3][2] = 0;
		$shift[4][0] = 18;
		$shift[4][1] = 12;
		$shift[4][2] = 6;
		$shift[4][3] = 0;
	}

	$pos = 0;
	$len = strlen ($source);
	$encodedString = &#039;&#039;;
	while ($pos &lt; $len) {
		$char = &#039;&#039;;
		$ischar = false;
		// value of the current byte; it selects the sequence length below
		$asciiPos = ord (substr ($source, $pos, 1));
		if (($asciiPos &gt;= 240) &amp;&amp; ($asciiPos &lt;= 255)) {
			// 4 chars representing one unicode character
			$thisLetter = substr ($source, $pos, 4);
			$pos += 4;
		}
		else if (($asciiPos &gt;= 224) &amp;&amp; ($asciiPos &lt;= 239)) {
			// 3 chars representing one unicode character
			$thisLetter = substr ($source, $pos, 3);
			$pos += 3;
		}
		else if (($asciiPos &gt;= 192) &amp;&amp; ($asciiPos &lt;= 223)) {
			// 2 chars representing one unicode character
			$thisLetter = substr ($source, $pos, 2);
			$pos += 2;
		}
		else {
			// 1 char (lower ascii)
			// note: any byte below 192 lands here, so a stray byte in
			// 128-191 is copied to the output unchanged
			$thisLetter = substr ($source, $pos, 1);
			$pos += 1;
			$char = $thisLetter;
			$ischar = true;
		}

		if ($ischar)
			$encodedString .= $char;
		else {	// process the string representing the letter to a unicode entity
			// $thisLen is the number of bytes actually read; it can be less
			// than expected when the input ends in the middle of a sequence
			$thisLen = strlen ($thisLetter);
			$thisPos = 0;
			$decimalCode = 0;
			while ($thisPos &lt; $thisLen) {
				$thisCharOrd = ord (substr ($thisLetter, $thisPos, 1));
				if ($thisPos == 0) {
					// lead byte: strip the length marker bits
					$charNum = intval ($thisCharOrd - $decrement[$thisLen]);
					$decimalCode += ($charNum &lt;&lt; $shift[$thisLen][$thisPos]);
				} else {
					// following byte: subtract 128, i.e. drop the top bit
					$charNum = intval ($thisCharOrd - 128);
					$decimalCode += ($charNum &lt;&lt; $shift[$thisLen][$thisPos]);
				}
				$thisPos++;
			}
			// strip leading zeros from the decimal code, then wrap it as an entity
			$encodedLetter = &quot;&amp;#&quot;. preg_replace(&#039;/^0+/&#039;, &#039;&#039;, $decimalCode) . &#039;;&#039;;
			$encodedString .= $encodedLetter;
		}
	}
	return $encodedString;
}

// UTF-32 ne sert plus que si on passe par iconv, c&#039;est-a-dire quand
// mb_string est absente ou ne connait pas notre charset
// mais on l&#039;optimise quand meme par mb_string
// =&gt; tout ca sera osolete quand on sera surs d&#039;avoir mb_string
// http://doc.spip.org/@utf_32_to_unicode
/**
 * Convert a little-endian UTF-32 string to ASCII plus decimal numeric entities.
 *
 * With mbstring the conversion is delegated to mb_encode_numericentity() and
 * the remaining NUL bytes are removed. Otherwise the input is unpacked by
 * chunks of 1024 bytes into 32-bit little-endian words; words below 128 are
 * emitted as characters, the BOM (65279) is dropped, the rest become entities.
 *
 * @param string $source  UTF-32LE bytes
 * @return string
 */
function utf_32_to_unicode($source) {

	// mbstring: fast path
	if (init_mb_string()) {
		$convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
		$encode = mb_encode_numericentity($source, $convmap, &#039;UTF-32LE&#039;);
		return str_replace(chr(0), &#039;&#039;, $encode);
	}

	// slow path
	$sortie = &#039;&#039;;
	while ($source) {
		$bloc = substr($source, 0, 1024);
		$source = substr($source, 1024);
		foreach (unpack(&quot;V*&quot;, $bloc) as $code) {
			// skip the BOM - http://www.unicode.org/faq/utf_bom.html
			if ($code == 65279)
				continue;
			$sortie .= ($code &lt; 128) ? chr($code) : &#039;&amp;#&#039;.$code.&#039;;&#039;;
		}
	}
	return $sortie;

}

// Ce bloc provient de php.net, auteur Ronen
// http://doc.spip.org/@caractere_utf_8
/**
 * Encode one Unicode code point as a UTF-8 byte sequence.
 *
 * @param int|string $num  code point (passed through intval())
 * @return string  1 to 4 bytes, or an empty string for values of 1114112 and above
 */
function caractere_utf_8($num) {
	$code = intval($num);

	// one byte
	if ($code &lt; 128)
		return chr($code);

	// the last byte has the same form for every multi-byte length
	$dernier = chr(($code &amp; 63) + 128);

	// two bytes
	if ($code &lt; 2048)
		return chr(($code &gt;&gt; 6) + 192) . $dernier;

	$avant_dernier = chr((($code &gt;&gt; 6) &amp; 63) + 128);

	// three bytes
	if ($code &lt; 65536)
		return chr(($code &gt;&gt; 12) + 224) . $avant_dernier . $dernier;

	// four bytes
	if ($code &lt; 1114112)
		return chr(($code &gt;&gt; 18) + 240) . chr((($code &gt;&gt; 12) &amp; 63) + 128) . $avant_dernier . $dernier;

	return &#039;&#039;;
}

// http://doc.spip.org/@unicode_to_utf_8
/**
 * Replace numeric entities by the matching UTF-8 characters.
 *
 * Decimal entities need at least three significant digits and a value above
 * 127; hexadecimal entities need at least three significant hex digits.
 * Entities that do not satisfy these patterns are left as they are.
 *
 * @param string $texte
 * @return string
 */
function unicode_to_utf_8($texte) {
	// entity as written in the text =&gt; UTF-8 character
	$remplacements = array();

	// 1. Decimal entities, &amp;#128; and above
	$motif_decimal = &#039;,&amp;#0*([1-9][0-9][0-9]+);,S&#039;;
	if (preg_match_all($motif_decimal, $texte, $trouves, PREG_SET_ORDER)) {
		foreach ($trouves as $trouve) {
			$entite = $trouve[0];
			$code = $trouve[1];
			if ($code&gt;127 AND !isset($remplacements[$entite]))
				$remplacements[$entite] = caractere_utf_8($code);
		}
	}

	// 2. Hexadecimal entities above &amp;#xFF;
	$motif_hexa = &#039;,&amp;#x0*([1-9a-f][0-9a-f][0-9a-f]+);,iS&#039;;
	if (preg_match_all($motif_hexa, $texte, $trouves, PREG_SET_ORDER)) {
		foreach ($trouves as $trouve) {
			$entite = $trouve[0];
			if (!isset($remplacements[$entite]))
				$remplacements[$entite] = caractere_utf_8(hexdec($trouve[1]));
		}
	}

	return str_replace(array_keys($remplacements), array_values($remplacements), $texte);

}

// convertit les &amp;#264; en \u0108
// http://doc.spip.org/@unicode_to_javascript
/**
 * Convert decimal numeric entities to JavaScript escapes (&amp;#264; gives \u0108).
 *
 * Every entity of the text is converted, whatever its number of leading
 * zeros. Code points above 0xFFFF (up to 0x10FFFF) are written as a surrogate
 * pair, since a \u escape only carries four hexadecimal digits.
 *
 * @param string $texte
 * @return string
 */
function unicode_to_javascript($texte) {
	if (!preg_match_all(&#039;,&amp;#0*([0-9]+);,S&#039;, $texte, $regs, PREG_SET_ORDER))
		return $texte;

	// Keyed by the entity as written, so that two spellings of the same code
	// point (&amp;#264; and &amp;#0264;) are both replaced. The former loop stopped
	// at the first code point seen twice and left the rest unconverted.
	$vu = array();
	foreach ($regs as $reg) {
		if (isset($vu[$reg[0]]))
			continue;
		$num = intval($reg[1]);
		if ($num &gt; 0xFFFF AND $num &lt;= 0x10FFFF) {
			$num -= 0x10000;
			$vu[$reg[0]] = &#039;\u&#039;.sprintf(&quot;%04x&quot;, 0xD800 + ($num &gt;&gt; 10))
				. &#039;\u&#039;.sprintf(&quot;%04x&quot;, 0xDC00 + ($num &amp; 0x3FF));
		} else {
			$vu[$reg[0]] = &#039;\u&#039;.sprintf(&quot;%04x&quot;, $num);
		}
	}

	return str_replace(array_keys($vu), array_values($vu), $texte);
}

// convertit les %uxxxx (envoyes par javascript)
// http://doc.spip.org/@javascript_to_unicode
/**
 * Convert %uXXXX sequences (four uppercase hex digits, as sent by javascript)
 * into decimal numeric entities.
 *
 * @param string $texte
 * @return string
 */
function javascript_to_unicode ($texte) {
	$motif = &quot;,%u([0-9A-F][0-9A-F][0-9A-F][0-9A-F]),&quot;;

	// each turn replaces every occurrence of the first sequence still present
	for (;;) {
		if (!preg_match($motif, $texte, $trouve))
			break;
		$sequence = $trouve[0];
		$hexa = $trouve[1];
		$texte = str_replace($sequence,&quot;&amp;#&quot;.hexdec($hexa).&quot;;&quot;, $texte);
	}

	return $texte;
}
// convertit les %E9 (envoyes par le browser) en chaine du charset du site (binaire)
// http://doc.spip.org/@javascript_to_binary
/**
 * Convert %XX sequences (two uppercase hex digits, as sent by the browser)
 * into the corresponding raw bytes.
 *
 * The text is decoded in a single pass: a byte produced by the decoding is
 * never read again as the start of a new sequence, so %2541 gives %41 and
 * not A.
 *
 * @param string $texte
 * @return string
 */
function javascript_to_binary ($texte) {
	if (!preg_match_all(&quot;,%([0-9A-F][0-9A-F]),&quot;, $texte, $regs, PREG_SET_ORDER))
		return $texte;

	$trans = array();
	foreach ($regs as $reg)
		$trans[$reg[0]] = chr(hexdec($reg[1]));

	// strtr() with an array does not rescan what it has just substituted
	return strtr($texte, $trans);
}


// http://doc.spip.org/@translitteration_rapide
/**
 * Transliterate a UTF-8 text with the predefined translit table.
 *
 * The table is read from $GLOBALS[CHARSET][translit . $complexe], whose keys
 * are code points; it is turned once into a map from UTF-8 character to
 * replacement.
 *
 * @param string $texte     text, already in UTF-8
 * @param string $charset   unused by this function; kept for the signature
 * @param string $complexe  suffix of the table name (empty by default)
 * @return string
 */
function translitteration_rapide($texte, $charset=&#039;AUTO&#039;, $complexe=&#039;&#039;) {
	static $trans = array();

	if (!strlen($texte))
		return $texte;

	$table_translit =&#039;translit&#039;.$complexe;

	// Build the map on first use (empty() also avoids an undefined index notice)
	if (empty($trans[$complexe])) {
		global $CHARSET;
		$trans[$complexe] = array();
		load_charset($table_translit);
		if (isset($CHARSET[$table_translit]) AND is_array($CHARSET[$table_translit])) {
			foreach ($CHARSET[$table_translit] as $key =&gt; $val)
				$trans[$complexe][caractere_utf_8($key)] = $val;
		}
	}

	// No table available: nothing to transliterate
	if (!$trans[$complexe])
		return $texte;

	return str_replace(array_keys($trans[$complexe]),array_values($trans[$complexe]),$texte);
}

//
// Translitteration charset =&gt; ascii (pour l&#039;indexation)
// Attention les caracteres non reconnus sont renvoyes en utf-8
//
// http://doc.spip.org/@translitteration
/**
 * Transliterate a text from a charset to ascii (used for indexing).
 * Characters that are not recognised come back in utf-8.
 *
 * @param string $texte
 * @param string $charset   charset of $texte
 * @param string $complexe  suffix of the translit table to use
 * @return string
 */
function translitteration($texte, $charset=&#039;AUTO&#039;, $complexe=&#039;&#039;) {
	// 0. Remove illegal characters
	include_spip(&#039;inc/filtres&#039;);
	$nettoye = corriger_caracteres($texte);

	// 1. Bring the charset and the named entities to utf-8
	$entites = charset2unicode($nettoye, $charset, true);
	$entites = html2unicode($entites);
	$utf8 = unicode_to_utf_8($entites);

	// 2. Apply the table
	return translitteration_rapide($utf8,$charset,$complexe);
}

// &amp;agrave; est retourne sous la forme &quot;a`&quot; et pas &quot;a&quot;
// mais si $chiffre=true, on retourne &quot;a8&quot; (vietnamien)
// http://doc.spip.org/@translitteration_complexe
/**
 * Transliterate with the complexe table, which keeps a mark after the letter.
 *
 * @param string $texte
 * @param bool $chiffres
 *     When true, each letter among aeiuoyd followed by one or two marks has
 *     its marks turned into digits by translitteration_chiffree().
 * @return string
 */
function translitteration_complexe($texte, $chiffres=false) {
	$texte = translitteration($texte,&#039;AUTO&#039;,&#039;complexe&#039;);

	if ($chiffres) {
		// The /e modifier formerly used here no longer exists in PHP 7.
		// Collect the sequences, then substitute them in one pass: strtr()
		// takes the longest key at each position, like the greedy {1,2}.
		if (preg_match_all(&quot;/[aeiuoyd][&#039;`?~.^+(-]{1,2}/S&quot;, $texte, $regs)) {
			$trans = array();
			foreach ($regs[0] as $sequence)
				$trans[$sequence] = translitteration_chiffree($sequence);
			$texte = strtr($texte, $trans);
		}
	}

	return $texte;
}
// http://doc.spip.org/@translitteration_chiffree
/**
 * Replace each of the nine marks by a digit from 1 to 9, in the order of
 * the two lists below.
 *
 * @param string $car
 * @return string
 */
function translitteration_chiffree($car) {
	$signes = &quot;&#039;`?~.^+(-&quot;;
	$chiffres = &quot;123456789&quot;;

	return strtr($car, $signes, $chiffres);
}


// Reconnaitre le BOM utf-8 (0xEFBBBF)
// http://doc.spip.org/@bom_utf8
/**
 * Tell whether a text starts with the utf-8 BOM (bytes EF BB BF).
 *
 * @param string $texte
 * @return bool
 */
function bom_utf8($texte) {
	$debut = substr($texte, 0, 3);

	return ($debut == &quot;\xEF\xBB\xBF&quot;);
}
// Verifie qu&#039;un document est en utf-8 valide
// http://us2.php.net/manual/fr/function.mb-detect-encoding.php#50087
// http://w3.org/International/questions/qa-forms-utf-8.html
// note: preg_replace permet de contourner un &quot;stack overflow&quot; sur PCRE
// http://doc.spip.org/@is_utf8
/**
 * Check that a string is valid utf-8.
 *
 * Every well-formed sequence is removed from the string; the string is valid
 * when nothing is left.
 *
 * @param string $string
 * @return bool
 */
function is_utf8($string) {
	$sequences = array(
		&#039;[\x09\x0A\x0D\x20-\x7E]&#039;,            // ASCII
		&#039;[\xC2-\xDF][\x80-\xBF]&#039;,             // non-overlong 2-byte
		&#039;\xE0[\xA0-\xBF][\x80-\xBF]&#039;,         // excluding overlongs
		&#039;[\xE1-\xEC\xEE\xEF][\x80-\xBF]{2}&#039;,  // straight 3-byte
		&#039;\xED[\x80-\x9F][\x80-\xBF]&#039;,         // excluding surrogates
		&#039;\xF0[\x90-\xBF][\x80-\xBF]{2}&#039;,      // planes 1-3
		&#039;[\xF1-\xF3][\x80-\xBF]{3}&#039;,          // planes 4-15
		&#039;\xF4[\x80-\x8F][\x80-\xBF]{2}&#039;,      // plane 16
	);
	$motif = &#039;,&#039; . implode(&#039;|&#039;, $sequences) . &#039;,sS&#039;;

	$reste = preg_replace($motif, &#039;&#039;, $string);

	return !strlen($reste);
}
// http://doc.spip.org/@is_ascii
/**
 * Check that a string only holds tab, line feed, carriage return and the
 * printable ASCII characters (0x20 to 0x7E).
 *
 * @param string $string
 * @return bool
 */
function is_ascii($string) {
	// remove everything that is allowed, then look at what remains
	$reste = preg_replace(&#039;,[\x09\x0A\x0D\x20-\x7E],sS&#039;, &#039;&#039;, $string);

	return !strlen($reste);
}

// Transcode une page (attrapee sur le web, ou un squelette) en essayant
// par tous les moyens de deviner son charset (y compris headers HTTP)
// http://doc.spip.org/@transcoder_page
/**
 * Transcode a page (fetched from the web, or a template) to the site charset,
 * guessing its charset from several clues.
 *
 * Clues are examined in this order, the first hit wins: utf-8 BOM, xml
 * encoding declaration, charset found in a meta/html/body tag, charset of the
 * HTTP headers. Without any clue the charset is utf-8 when the text is valid
 * utf-8, iso-8859-1 otherwise. The text is then handed to importer_charset().
 *
 * @param string $texte    content of the page
 * @param string $headers  HTTP response headers, if any
 * @return string
 */
function transcoder_page($texte, $headers=&#039;&#039;) {

	// If everything is &lt; 128 there is no need to go any further
	if (is_ascii($texte)) {
		#spip_log(&#039;charset: ascii&#039;);
		return $texte;
	}

	// Recognise the utf-8 BOM (0xEFBBBF) and strip it
	if (bom_utf8($texte)) {
		$charset = &#039;utf-8&#039;;
		$texte = substr($texte,3);
	}

	// charset given by the content (xml)
	else if (preg_match(
	&#039;,&lt;[?]xml[^&gt;]*encoding[^&gt;]*=[^&gt;]*([-_a-z0-9]+?),UimsS&#039;, $texte, $regs))
		$charset = trim(strtolower($regs[1]));
	// charset given by the content (html)
	else if (preg_match(
	&#039;,&lt;(meta|html|body)[^&gt;]*charset[^&gt;]*=[^&gt;]*([-_a-z0-9]+?),UimsS&#039;,
	$texte, $regs)
	# avoid the #CHARSET tag found in templates
	AND (($tmp = trim(strtolower($regs[2]))) != &#039;charset&#039;))
		$charset = $tmp;
	// charset of the http response
	else if (preg_match(&#039;,charset=([-_a-z0-9]+),i&#039;, $headers, $regs))
		$charset = trim(strtolower($regs[1]));
	else $charset = &#039;&#039;;
	// normalise the names of the japanese shift-jis
	if (preg_match(&#039;,^(x|shift)[_-]s?jis$,i&#039;, $charset))
		$charset = &#039;shift-jis&#039;;

	if ($charset) {
		spip_log(&quot;charset: $charset&quot;);
	} else {
		// default value: utf-8 if the bytes are valid utf-8, iso-8859-1 otherwise
		if (is_utf8($texte))
			$charset = &#039;utf-8&#039;;
		else
			$charset = &#039;iso-8859-1&#039;;
		spip_log(&quot;charset probable: $charset&quot;);
	}

	return importer_charset($texte, $charset);
}


//
// Gerer les outils mb_string
//
// http://doc.spip.org/@spip_substr
/**
 * substr() working on characters when the site charset is utf-8.
 *
 * For any other site charset this is plain substr(). In utf-8, mb_substr()
 * is used when mbstring is available, spip_substr_manuelle() otherwise.
 *
 * @param string $c
 * @param int $start
 * @param int|null $length  a value evaluating to false means up to the end
 * @return string
 */
function spip_substr($c, $start=0, $length = NULL) {
	// Not utf-8: use substr
	if ($GLOBALS[&#039;meta&#039;][&#039;charset&#039;] != &#039;utf-8&#039;) {
		if ($length)
			return substr($c, $start, $length);
		// this result used to be computed and then dropped (missing return),
		// so execution fell through to the utf-8 code below
		return substr($c, $start);
	}

	// utf-8: see whether mbstring is available
	if (init_mb_string()) {
		if ($length)
			return mb_substr($c, $start, $length);
		return mb_substr($c, $start);
	}

	// Manual version
	return spip_substr_manuelle($c, $start, $length);
}

// version manuelle de substr utf8, pour php vieux et/ou mal installe
// http://doc.spip.org/@spip_substr_manuelle
/**
 * Manual utf-8 substr, for old or badly installed php (no mbstring).
 *
 * Works recursively: a positive $start is resolved by measuring the byte
 * length of the first $start characters; negative $start and negative
 * $length are turned into positive values with spip_strlen().
 *
 * @param string $c
 * @param int $start
 * @param int|null $length
 * @return string
 */
function spip_substr_manuelle($c, $start, $length = NULL) {

	// Pathological case
	if ($length === 0)
		return &#039;&#039;;

	// If there is a start offset, move to it: drop as many bytes as the
	// first $start characters occupy
	if ($start &gt; 0)
		$c = substr($c, strlen(spip_substr_manuelle($c, 0, $start)));
	elseif ($start &lt; 0)
		return spip_substr_manuelle($c, spip_strlen($c)+$start, $length);

	// no length (NULL or any value evaluating to false): everything that is left
	if (!$length)
		return $c;

	if ($length &gt; 0) {
		// take n times the wanted length, to be sure to have everything
		// (a utf-8 character taking at most n bytes)
		// the loop stops at the first n for which $c holds no run of n bytes in 0x80-0xBF
		$n = 0; while (preg_match(&#039;,[\x80-\xBF]{&#039;.(++$n).&#039;},&#039;, $c));
		$c = substr($c, 0, $n*$length);
		// then, as long as it is too long, cut...
		// ($length - $l is negative: that many bytes are removed from the end)
		while (($l = spip_strlen($c)) &gt; $length)
			$c = substr($c, 0, $length - $l);
		return $c;
	}

	// $length &lt; 0
	return spip_substr_manuelle($c, 0, spip_strlen($c)+$length);
}

// http://doc.spip.org/@spip_strlen
/**
 * strlen() counting characters when the site charset is utf-8.
 *
 * @param string $c
 * @return int
 */
function spip_strlen($c) {
	if ($GLOBALS[&#039;meta&#039;][&#039;charset&#039;] == &#039;utf-8&#039;) {
		// mbstring does the job when it is available
		if (init_mb_string())
			return mb_strlen($c);

		// Manual method: remove the bytes of the form 10......, which leaves
		// the ascii bytes (0.......) and the utf-8 lead bytes (11......)
		$sans_suite = preg_replace(&#039;,[\x80-\xBF],S&#039;, &#039;&#039;, $c);
		return strlen($sans_suite);
	}

	// any other charset: plain strlen
	return strlen($c);
}

// Initialisation: start with an empty registry of charset tables
$GLOBALS[&#039;CHARSET&#039;] = Array();

// Record in the pcre_u meta whether the /u flag can be used in preg_replace,
// so as not to break some accented letters:
// in utf-8 chr(195).chr(160) is a-grave whereas in iso-latin chr(160) is nbsp.
// The value is computed when the meta is missing, or when var_mode is present
// in the query string without var_profile. It is the letter u when the site
// charset is utf-8 and test_pcre_unicode() succeeds, an empty string otherwise.
if (!isset($GLOBALS[&#039;meta&#039;][&#039;pcre_u&#039;])
  OR (isset($_GET[&#039;var_mode&#039;]) AND !isset($_GET[&#039;var_profile&#039;]))) {
	include_spip(&#039;inc/meta&#039;);
	ecrire_meta(&#039;pcre_u&#039;,
		$u = ($GLOBALS[&#039;meta&#039;][&#039;charset&#039;] == &#039;utf-8&#039;
		AND test_pcre_unicode())
			? &#039;u&#039; :&#039;&#039;
	);
}


/**
 * Transforme une chaîne utf-8 en utf-8 sans &quot;planes&quot;
 * ce qui permet de la donner à MySQL &quot;utf8&quot;, qui n&#039;est pas un utf-8 complet
 * L&#039;alternative serait d&#039;utiliser utf8mb4
 * 
 * @param string $x
 *     La chaîne à transformer
 * @return string
 *     La chaîne avec les caractères utf8 des hauts &quot;planes&quot; échappée
 *     en unicode : &amp;#128169;
 */
function utf8_noplanes($x) {
	// every 4-byte utf-8 sequence
	$motif = &#039;/(
      \xF0[\x90-\xBF][\x80-\xBF]{2}     # planes 1-3
   | [\xF1-\xF3][\x80-\xBF]{3}          # planes 4-15
   |  \xF4[\x80-\x8F][\x80-\xBF]{2}     # plane 16
)/xS&#039;;

	// nothing to escape
	if (!preg_match_all($motif, $x, $trouves, PREG_PATTERN_ORDER))
		return $x;

	// replace each sequence found by what utf_8_to_unicode() returns for it
	foreach ($trouves[0] as $sequence)
		$x = str_replace($sequence, utf_8_to_unicode($sequence), $x);

	return $x;
}


?&gt;
</code></pre>        </div>
    </div>