Inspection of "Ticket #4348 : Compat PHP 7.4, Trying to access ar..." - spip/SPIP - Measure and Improve Code Quality continuously with Scrutinizer

Completed

Push — master ( 8414fb...da8260 )

by cam

created 2019-08-26 07:40 UTC

Status

Indentation patch: +703 added lines, -703 removed lines

@@ -22,7 +22,7 @@
 
 // securité
 if (!defined('_ECRIRE_INC_VERSION')) {
-	return;
+    return;
 }
 
 // se faciliter la lecture du charset
@@ -42,45 +42,45 @@
  *     - false si le charset n'est pas décrit dans le répertoire charsets/
  **/
 function load_charset($charset = 'AUTO') {
-	if ($charset == 'AUTO') {
-		$charset = $GLOBALS['meta']['charset'];
-	}
-	$charset = trim(strtolower($charset));
-	if (isset($GLOBALS['CHARSET'][$charset])) {
-		return $charset;
-	}
-
-	if ($charset == 'utf-8') {
-		$GLOBALS['CHARSET'][$charset] = array();
-
-		return $charset;
-	}
-
-	// Quelques synonymes
-	if ($charset == '') {
-		$charset = 'iso-8859-1';
-	} else {
-		if ($charset == 'windows-1250') {
-			$charset = 'cp1250';
-		} else {
-			if ($charset == 'windows-1251') {
-				$charset = 'cp1251';
-			} else {
-				if ($charset == 'windows-1256') {
-					$charset = 'cp1256';
-				}
-			}
-		}
-	}
-
-	if (find_in_path($charset . '.php', 'charsets/', true)) {
-		return $charset;
-	} else {
-		spip_log("Erreur: pas de fichier de conversion 'charsets/$charset'");
-		$GLOBALS['CHARSET'][$charset] = array();
-
-		return false;
-	}
+    if ($charset == 'AUTO') {
+        $charset = $GLOBALS['meta']['charset'];
+    }
+    $charset = trim(strtolower($charset));
+    if (isset($GLOBALS['CHARSET'][$charset])) {
+        return $charset;
+    }
+
+    if ($charset == 'utf-8') {
+        $GLOBALS['CHARSET'][$charset] = array();
+
+        return $charset;
+    }
+
+    // Quelques synonymes
+    if ($charset == '') {
+        $charset = 'iso-8859-1';
+    } else {
+        if ($charset == 'windows-1250') {
+            $charset = 'cp1250';
+        } else {
+            if ($charset == 'windows-1251') {
+                $charset = 'cp1251';
+            } else {
+                if ($charset == 'windows-1256') {
+                    $charset = 'cp1256';
+                }
+            }
+        }
+    }
+
+    if (find_in_path($charset . '.php', 'charsets/', true)) {
+        return $charset;
+    } else {
+        spip_log("Erreur: pas de fichier de conversion 'charsets/$charset'");
+        $GLOBALS['CHARSET'][$charset] = array();
+
+        return false;
+    }
 }
 
 
@@ -91,30 +91,30 @@
  *     true si toutes les fonctions mb nécessaires sont présentes
  **/
 function init_mb_string() {
-	static $mb;
-
-	// verifier que tout est present (fonctions mb_string pour php >= 4.0.6)
-	// et que le charset interne est connu de mb_string
-	if (!$mb) {
-		if (function_exists('mb_internal_encoding')
-			and function_exists('mb_detect_order')
-			and function_exists('mb_substr')
-			and function_exists('mb_strlen')
-			and function_exists('mb_strtolower')
-			and function_exists('mb_strtoupper')
-			and function_exists('mb_encode_mimeheader')
-			and function_exists('mb_encode_numericentity')
-			and function_exists('mb_decode_numericentity')
-			and mb_detect_order(lire_config('charset', _DEFAULT_CHARSET))
-		) {
-			mb_internal_encoding('utf-8');
-			$mb = 1;
-		} else {
-			$mb = -1;
-		}
-	}
-
-	return ($mb == 1);
+    static $mb;
+
+    // verifier que tout est present (fonctions mb_string pour php >= 4.0.6)
+    // et que le charset interne est connu de mb_string
+    if (!$mb) {
+        if (function_exists('mb_internal_encoding')
+            and function_exists('mb_detect_order')
+            and function_exists('mb_substr')
+            and function_exists('mb_strlen')
+            and function_exists('mb_strtolower')
+            and function_exists('mb_strtoupper')
+            and function_exists('mb_encode_mimeheader')
+            and function_exists('mb_encode_numericentity')
+            and function_exists('mb_decode_numericentity')
+            and mb_detect_order(lire_config('charset', _DEFAULT_CHARSET))
+        ) {
+            mb_internal_encoding('utf-8');
+            $mb = 1;
+        } else {
+            $mb = -1;
+        }
+    }
+
+    return ($mb == 1);
 }
 
 /**
@@ -129,21 +129,21 @@
  *     true si iconv fonctionne correctement
  **/
 function test_iconv() {
-	static $iconv_ok;
-
-	if (!$iconv_ok) {
-		if (!function_exists('iconv')) {
-			$iconv_ok = -1;
-		} else {
-			if (utf_32_to_unicode(@iconv('utf-8', 'utf-32', 'chaine de test')) == 'chaine de test') {
-				$iconv_ok = 1;
-			} else {
-				$iconv_ok = -1;
-			}
-		}
-	}
-
-	return ($iconv_ok == 1);
+    static $iconv_ok;
+
+    if (!$iconv_ok) {
+        if (!function_exists('iconv')) {
+            $iconv_ok = -1;
+        } else {
+            if (utf_32_to_unicode(@iconv('utf-8', 'utf-32', 'chaine de test')) == 'chaine de test') {
+                $iconv_ok = 1;
+            } else {
+                $iconv_ok = -1;
+            }
+        }
+    }
+
+    return ($iconv_ok == 1);
 }
 
 
@@ -156,18 +156,18 @@
  *     true si PCRE supporte l'UTF-8 correctement
  **/
 function test_pcre_unicode() {
-	static $pcre_ok = 0;
-
-	if (!$pcre_ok) {
-		$s = " " . chr(195) . chr(169) . "t" . chr(195) . chr(169) . " ";
-		if (preg_match(',\W...\W,u', $s)) {
-			$pcre_ok = 1;
-		} else {
-			$pcre_ok = -1;
-		}
-	}
-
-	return $pcre_ok == 1;
+    static $pcre_ok = 0;
+
+    if (!$pcre_ok) {
+        $s = " " . chr(195) . chr(169) . "t" . chr(195) . chr(169) . " ";
+        if (preg_match(',\W...\W,u', $s)) {
+            $pcre_ok = 1;
+        } else {
+            $pcre_ok = -1;
+        }
+    }
+
+    return $pcre_ok == 1;
 }
 
 /**
@@ -183,22 +183,22 @@
  *    Plage de caractères
  **/
 function pcre_lettres_unicode() {
-	static $plage_unicode;
-
-	if (!$plage_unicode) {
-		if (test_pcre_unicode()) {
-			// cf. http://www.unicode.org/charts/
-			$plage_unicode = '\w' // iso-latin
-				. '\x{100}-\x{24f}' // europeen etendu
-				. '\x{300}-\x{1cff}' // des tas de trucs
-			;
-		} else {
-			// fallback a trois sous
-			$plage_unicode = '\w';
-		}
-	}
-
-	return $plage_unicode;
+    static $plage_unicode;
+
+    if (!$plage_unicode) {
+        if (test_pcre_unicode()) {
+            // cf. http://www.unicode.org/charts/
+            $plage_unicode = '\w' // iso-latin
+                . '\x{100}-\x{24f}' // europeen etendu
+                . '\x{300}-\x{1cff}' // des tas de trucs
+            ;
+        } else {
+            // fallback a trois sous
+            $plage_unicode = '\w';
+        }
+    }
+
+    return $plage_unicode;
 }
 
 
@@ -216,7 +216,7 @@
  *    Plage de caractères
  **/
 function plage_punct_unicode() {
-	return '\xE2(\x80[\x80-\xBF]|\x81[\x80-\xAF])';
+    return '\xE2(\x80[\x80-\xBF]|\x81[\x80-\xAF])';
 }
 
 /**
@@ -236,72 +236,72 @@
  *     Texte corrigé
  **/
 function corriger_caracteres_windows($texte, $charset = 'AUTO', $charset_cible = 'unicode') {
-	static $trans;
-
-	if (is_array($texte)) {
-		return array_map('corriger_caracteres_windows', $texte);
-	}
-
-	if ($charset == 'AUTO') {
-		$charset = lire_config('charset', _DEFAULT_CHARSET);
-	}
-	if ($charset == 'utf-8') {
-		$p = chr(194);
-		if (strpos($texte, $p) == false) {
-			return $texte;
-		}
-	} else {
-		if ($charset == 'iso-8859-1') {
-			$p = '';
-		} else {
-			return $texte;
-		}
-	}
-
-	if (!isset($trans[$charset][$charset_cible])) {
-		$trans[$charset][$charset_cible] = array(
-			$p . chr(128) => "&#8364;",
-			$p . chr(129) => ' ', # pas affecte
-			$p . chr(130) => "&#8218;",
-			$p . chr(131) => "&#402;",
-			$p . chr(132) => "&#8222;",
-			$p . chr(133) => "&#8230;",
-			$p . chr(134) => "&#8224;",
-			$p . chr(135) => "&#8225;",
-			$p . chr(136) => "&#710;",
-			$p . chr(137) => "&#8240;",
-			$p . chr(138) => "&#352;",
-			$p . chr(139) => "&#8249;",
-			$p . chr(140) => "&#338;",
-			$p . chr(141) => ' ', # pas affecte
-			$p . chr(142) => "&#381;",
-			$p . chr(143) => ' ', # pas affecte
-			$p . chr(144) => ' ', # pas affecte
-			$p . chr(145) => "&#8216;",
-			$p . chr(146) => "&#8217;",
-			$p . chr(147) => "&#8220;",
-			$p . chr(148) => "&#8221;",
-			$p . chr(149) => "&#8226;",
-			$p . chr(150) => "&#8211;",
-			$p . chr(151) => "&#8212;",
-			$p . chr(152) => "&#732;",
-			$p . chr(153) => "&#8482;",
-			$p . chr(154) => "&#353;",
-			$p . chr(155) => "&#8250;",
-			$p . chr(156) => "&#339;",
-			$p . chr(157) => ' ', # pas affecte
-			$p . chr(158) => "&#382;",
-			$p . chr(159) => "&#376;",
-		);
-		if ($charset_cible != 'unicode') {
-			foreach ($trans[$charset][$charset_cible] as $k => $c) {
-				$trans[$charset][$charset_cible][$k] = unicode2charset($c, $charset_cible);
-			}
-		}
-	}
-
-	return @str_replace(array_keys($trans[$charset][$charset_cible]),
-		array_values($trans[$charset][$charset_cible]), $texte);
+    static $trans;
+
+    if (is_array($texte)) {
+        return array_map('corriger_caracteres_windows', $texte);
+    }
+
+    if ($charset == 'AUTO') {
+        $charset = lire_config('charset', _DEFAULT_CHARSET);
+    }
+    if ($charset == 'utf-8') {
+        $p = chr(194);
+        if (strpos($texte, $p) == false) {
+            return $texte;
+        }
+    } else {
+        if ($charset == 'iso-8859-1') {
+            $p = '';
+        } else {
+            return $texte;
+        }
+    }
+
+    if (!isset($trans[$charset][$charset_cible])) {
+        $trans[$charset][$charset_cible] = array(
+            $p . chr(128) => "&#8364;",
+            $p . chr(129) => ' ', # pas affecte
+            $p . chr(130) => "&#8218;",
+            $p . chr(131) => "&#402;",
+            $p . chr(132) => "&#8222;",
+            $p . chr(133) => "&#8230;",
+            $p . chr(134) => "&#8224;",
+            $p . chr(135) => "&#8225;",
+            $p . chr(136) => "&#710;",
+            $p . chr(137) => "&#8240;",
+            $p . chr(138) => "&#352;",
+            $p . chr(139) => "&#8249;",
+            $p . chr(140) => "&#338;",
+            $p . chr(141) => ' ', # pas affecte
+            $p . chr(142) => "&#381;",
+            $p . chr(143) => ' ', # pas affecte
+            $p . chr(144) => ' ', # pas affecte
+            $p . chr(145) => "&#8216;",
+            $p . chr(146) => "&#8217;",
+            $p . chr(147) => "&#8220;",
+            $p . chr(148) => "&#8221;",
+            $p . chr(149) => "&#8226;",
+            $p . chr(150) => "&#8211;",
+            $p . chr(151) => "&#8212;",
+            $p . chr(152) => "&#732;",
+            $p . chr(153) => "&#8482;",
+            $p . chr(154) => "&#353;",
+            $p . chr(155) => "&#8250;",
+            $p . chr(156) => "&#339;",
+            $p . chr(157) => ' ', # pas affecte
+            $p . chr(158) => "&#382;",
+            $p . chr(159) => "&#376;",
+        );
+        if ($charset_cible != 'unicode') {
+            foreach ($trans[$charset][$charset_cible] as $k => $c) {
+                $trans[$charset][$charset_cible][$k] = unicode2charset($c, $charset_cible);
+            }
+        }
+    }
+
+    return @str_replace(array_keys($trans[$charset][$charset_cible]),
+        array_values($trans[$charset][$charset_cible]), $texte);
 }
 
 
@@ -318,24 +318,24 @@
  *     Texte converti
  **/
 function html2unicode($texte, $secure = false) {
-	if (strpos($texte, '&') === false) {
-		return $texte;
-	}
-	static $trans = array();
-	if (!$trans) {
-		load_charset('html');
-		foreach ($GLOBALS['CHARSET']['html'] as $key => $val) {
-			$trans["&$key;"] = $val;
-		}
-	}
-
-	if ($secure) {
-		return str_replace(array_keys($trans), array_values($trans), $texte);
-	} else {
-		return str_replace(array('&amp;', '&quot;', '&lt;', '&gt;'), array('&', '"', '<', '>'),
-			str_replace(array_keys($trans), array_values($trans), $texte)
-		);
-	}
+    if (strpos($texte, '&') === false) {
+        return $texte;
+    }
+    static $trans = array();
+    if (!$trans) {
+        load_charset('html');
+        foreach ($GLOBALS['CHARSET']['html'] as $key => $val) {
+            $trans["&$key;"] = $val;
+        }
+    }
+
+    if ($secure) {
+        return str_replace(array_keys($trans), array_values($trans), $texte);
+    } else {
+        return str_replace(array('&amp;', '&quot;', '&lt;', '&gt;'), array('&', '"', '<', '>'),
+            str_replace(array_keys($trans), array_values($trans), $texte)
+        );
+    }
 }
 
 
@@ -350,16 +350,16 @@
  *     Texte converti
  **/
 function mathml2unicode($texte) {
-	static $trans;
-	if (!$trans) {
-		load_charset('mathml');
+    static $trans;
+    if (!$trans) {
+        load_charset('mathml');
 
-		foreach ($GLOBALS['CHARSET']['mathml'] as $key => $val) {
-			$trans["&$key;"] = $val;
-		}
-	}
+        foreach ($GLOBALS['CHARSET']['mathml'] as $key => $val) {
+            $trans["&$key;"] = $val;
+        }
+    }
 
-	return str_replace(array_keys($trans), array_values($trans), $texte);
+    return str_replace(array_keys($trans), array_values($trans), $texte);
 }
 
 
@@ -381,69 +381,69 @@
  *     Texte converti en unicode
  **/
 function charset2unicode($texte, $charset = 'AUTO' /* $forcer: obsolete*/) {
-	static $trans;
-
-	if ($charset == 'AUTO') {
-		$charset = lire_config('charset', _DEFAULT_CHARSET);
-	}
-
-	if ($charset == '') {
-		$charset = 'iso-8859-1';
-	}
-	$charset = strtolower($charset);
-
-	switch ($charset) {
-		case 'utf-8':
-		case 'utf8':
-			return utf_8_to_unicode($texte);
-
-		case 'iso-8859-1':
-			$texte = corriger_caracteres_windows($texte, 'iso-8859-1');
-		// pas de break; ici, on suit sur default:
-
-		default:
-			// mbstring presente ?
-			if (init_mb_string()) {
-				if ($order = mb_detect_order() # mb_string connait-il $charset?
-					and mb_detect_order($charset)
-				) {
-					$s = mb_convert_encoding($texte, 'utf-8', $charset);
-					if ($s && $s != $texte) {
-						return utf_8_to_unicode($s);
-					}
-				}
-				mb_detect_order($order); # remettre comme precedemment
-			}
-
-			// Sinon, peut-etre connaissons-nous ce charset ?
-			if (!isset($trans[$charset])) {
-				if ($cset = load_charset($charset)
-					and is_array($GLOBALS['CHARSET'][$cset])
-				) {
-					foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
-						$trans[$charset][chr($key)] = '&#' . $val . ';';
-					}
-				}
-			}
-			if (count($trans[$charset])) {
-				return str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
-			}
-
-			// Sinon demander a iconv (malgre le fait qu'il coupe quand un
-			// caractere n'appartient pas au charset, mais c'est un probleme
-			// surtout en utf-8, gere ci-dessus)
-			if (test_iconv()) {
-				$s = iconv($charset, 'utf-32le', $texte);
-				if ($s) {
-					return utf_32_to_unicode($s);
-				}
-			}
-
-			// Au pire ne rien faire
-			spip_log("erreur charset '$charset' non supporte");
-
-			return $texte;
-	}
+    static $trans;
+
+    if ($charset == 'AUTO') {
+        $charset = lire_config('charset', _DEFAULT_CHARSET);
+    }
+
+    if ($charset == '') {
+        $charset = 'iso-8859-1';
+    }
+    $charset = strtolower($charset);
+
+    switch ($charset) {
+        case 'utf-8':
+        case 'utf8':
+            return utf_8_to_unicode($texte);
+
+        case 'iso-8859-1':
+            $texte = corriger_caracteres_windows($texte, 'iso-8859-1');
+        // pas de break; ici, on suit sur default:
+
+        default:
+            // mbstring presente ?
+            if (init_mb_string()) {
+                if ($order = mb_detect_order() # mb_string connait-il $charset?
+                    and mb_detect_order($charset)
+                ) {
+                    $s = mb_convert_encoding($texte, 'utf-8', $charset);
+                    if ($s && $s != $texte) {
+                        return utf_8_to_unicode($s);
+                    }
+                }
+                mb_detect_order($order); # remettre comme precedemment
+            }
+
+            // Sinon, peut-etre connaissons-nous ce charset ?
+            if (!isset($trans[$charset])) {
+                if ($cset = load_charset($charset)
+                    and is_array($GLOBALS['CHARSET'][$cset])
+                ) {
+                    foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
+                        $trans[$charset][chr($key)] = '&#' . $val . ';';
+                    }
+                }
+            }
+            if (count($trans[$charset])) {
+                return str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
+            }
+
+            // Sinon demander a iconv (malgre le fait qu'il coupe quand un
+            // caractere n'appartient pas au charset, mais c'est un probleme
+            // surtout en utf-8, gere ci-dessus)
+            if (test_iconv()) {
+                $s = iconv($charset, 'utf-32le', $texte);
+                if ($s) {
+                    return utf_32_to_unicode($s);
+                }
+            }
+
+            // Au pire ne rien faire
+            spip_log("erreur charset '$charset' non supporte");
+
+            return $texte;
+    }
 }
 
 
@@ -462,44 +462,44 @@
  *     Texte transformé dans le charset souhaité
  **/
 function unicode2charset($texte, $charset = 'AUTO') {
-	static $CHARSET_REVERSE;
-	static $trans = array();
-
-	if ($charset == 'AUTO') {
-		$charset = lire_config('charset', _DEFAULT_CHARSET);
-	}
-
-	switch ($charset) {
-		case 'utf-8':
-			return unicode_to_utf_8($texte);
-			break;
-
-		default:
-			$charset = load_charset($charset);
-
-			if (!is_array($CHARSET_REVERSE[$charset])) {
-				$CHARSET_REVERSE[$charset] = array_flip($GLOBALS['CHARSET'][$charset]);
-			}
-
-			if (!isset($trans[$charset])) {
-				$trans[$charset] = array();
-				$t = &$trans[$charset];
-				for ($e = 128; $e < 255; $e++) {
-					$h = dechex($e);
-					if ($s = isset($CHARSET_REVERSE[$charset][$e])) {
-						$s = $CHARSET_REVERSE[$charset][$e];
-						$t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($s);
-						$t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($s);
-					} else {
-						$t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($e);
-						$t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($e);
-					}
-				}
-			}
-			$texte = str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
-
-			return $texte;
-	}
+    static $CHARSET_REVERSE;
+    static $trans = array();
+
+    if ($charset == 'AUTO') {
+        $charset = lire_config('charset', _DEFAULT_CHARSET);
+    }
+
+    switch ($charset) {
+        case 'utf-8':
+            return unicode_to_utf_8($texte);
+            break;
+
+        default:
+            $charset = load_charset($charset);
+
+            if (!is_array($CHARSET_REVERSE[$charset])) {
+                $CHARSET_REVERSE[$charset] = array_flip($GLOBALS['CHARSET'][$charset]);
+            }
+
+            if (!isset($trans[$charset])) {
+                $trans[$charset] = array();
+                $t = &$trans[$charset];
+                for ($e = 128; $e < 255; $e++) {
+                    $h = dechex($e);
+                    if ($s = isset($CHARSET_REVERSE[$charset][$e])) {
+                        $s = $CHARSET_REVERSE[$charset][$e];
+                        $t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($s);
+                        $t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($s);
+                    } else {
+                        $t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($e);
+                        $t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($e);
+                    }
+                }
+            }
+            $texte = str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
+
+            return $texte;
+    }
 }
 
 
@@ -517,37 +517,37 @@
  *     Texte transformé dans le charset site
  **/
 function importer_charset($texte, $charset = 'AUTO') {
-	static $trans = array();
-	// on traite le cas le plus frequent iso-8859-1 vers utf directement pour aller plus vite !
-	if (($charset == 'iso-8859-1') && ($GLOBALS['meta']['charset'] == 'utf-8')) {
-		$texte = corriger_caracteres_windows($texte, 'iso-8859-1', $GLOBALS['meta']['charset']);
-		if (init_mb_string()) {
-			if ($order = mb_detect_order() # mb_string connait-il $charset?
-				and mb_detect_order($charset)
-			) {
-				$s = mb_convert_encoding($texte, 'utf-8', $charset);
-			}
-			mb_detect_order($order); # remettre comme precedemment
-			return $s;
-		}
-		// Sinon, peut-etre connaissons-nous ce charset ?
-		if (!isset($trans[$charset])) {
-			if ($cset = load_charset($charset)
-				and is_array($GLOBALS['CHARSET'][$cset])
-			) {
-				foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
-					$trans[$charset][chr($key)] = unicode2charset('&#' . $val . ';');
-				}
-			}
-		}
-		if (count($trans[$charset])) {
-			return str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
-		}
-
-		return $texte;
-	}
-
-	return unicode2charset(charset2unicode($texte, $charset));
+    static $trans = array();
+    // on traite le cas le plus frequent iso-8859-1 vers utf directement pour aller plus vite !
+    if (($charset == 'iso-8859-1') && ($GLOBALS['meta']['charset'] == 'utf-8')) {
+        $texte = corriger_caracteres_windows($texte, 'iso-8859-1', $GLOBALS['meta']['charset']);
+        if (init_mb_string()) {
+            if ($order = mb_detect_order() # mb_string connait-il $charset?
+                and mb_detect_order($charset)
+            ) {
+                $s = mb_convert_encoding($texte, 'utf-8', $charset);
+            }
+            mb_detect_order($order); # remettre comme precedemment
+            return $s;
+        }
+        // Sinon, peut-etre connaissons-nous ce charset ?
+        if (!isset($trans[$charset])) {
+            if ($cset = load_charset($charset)
+                and is_array($GLOBALS['CHARSET'][$cset])
+            ) {
+                foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
+                    $trans[$charset][chr($key)] = unicode2charset('&#' . $val . ';');
+                }
+            }
+        }
+        if (count($trans[$charset])) {
+            return str_replace(array_keys($trans[$charset]), array_values($trans[$charset]), $texte);
+        }
+
+        return $texte;
+    }
+
+    return unicode2charset(charset2unicode($texte, $charset));
 }
 
 
@@ -563,92 +563,92 @@
  **/
 function utf_8_to_unicode($source) {
 
-	// mb_string : methode rapide
-	if (init_mb_string()) {
-		$convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
-
-		return mb_encode_numericentity($source, $convmap, 'UTF-8');
-	}
-
-	// Sinon methode pas a pas
-	static $decrement;
-	static $shift;
-
-	// Cf. php.net, par Ronen. Adapte pour compatibilite < php4
-	if (!is_array($decrement)) {
-		// array used to figure what number to decrement from character order value
-		// according to number of characters used to map unicode to ascii by utf-8
-		$decrement[4] = 240;
-		$decrement[3] = 224;
-		$decrement[2] = 192;
-		$decrement[1] = 0;
-		// the number of bits to shift each charNum by
-		$shift[1][0] = 0;
-		$shift[2][0] = 6;
-		$shift[2][1] = 0;
-		$shift[3][0] = 12;
-		$shift[3][1] = 6;
-		$shift[3][2] = 0;
-		$shift[4][0] = 18;
-		$shift[4][1] = 12;
-		$shift[4][2] = 6;
-		$shift[4][3] = 0;
-	}
-
-	$pos = 0;
-	$len = strlen($source);
-	$encodedString = '';
-	while ($pos < $len) {
-		$char = '';
-		$ischar = false;
-		$asciiPos = ord(substr($source, $pos, 1));
-		if (($asciiPos >= 240) && ($asciiPos <= 255)) {
-			// 4 chars representing one unicode character
-			$thisLetter = substr($source, $pos, 4);
-			$pos += 4;
-		} else {
-			if (($asciiPos >= 224) && ($asciiPos <= 239)) {
-				// 3 chars representing one unicode character
-				$thisLetter = substr($source, $pos, 3);
-				$pos += 3;
-			} else {
-				if (($asciiPos >= 192) && ($asciiPos <= 223)) {
-					// 2 chars representing one unicode character
-					$thisLetter = substr($source, $pos, 2);
-					$pos += 2;
-				} else {
-					// 1 char (lower ascii)
-					$thisLetter = substr($source, $pos, 1);
-					$pos += 1;
-					$char = $thisLetter;
-					$ischar = true;
-				}
-			}
-		}
-
-		if ($ischar) {
-			$encodedString .= $char;
-		} else {  // process the string representing the letter to a unicode entity
-			$thisLen = strlen($thisLetter);
-			$thisPos = 0;
-			$decimalCode = 0;
-			while ($thisPos < $thisLen) {
-				$thisCharOrd = ord(substr($thisLetter, $thisPos, 1));
-				if ($thisPos == 0) {
-					$charNum = intval($thisCharOrd - $decrement[$thisLen]);
-					$decimalCode += ($charNum << $shift[$thisLen][$thisPos]);
-				} else {
-					$charNum = intval($thisCharOrd - 128);
-					$decimalCode += ($charNum << $shift[$thisLen][$thisPos]);
-				}
-				$thisPos++;
-			}
-			$encodedLetter = "&#" . preg_replace('/^0+/', '', $decimalCode) . ';';
-			$encodedString .= $encodedLetter;
-		}
-	}
-
-	return $encodedString;
+    // mb_string : methode rapide
+    if (init_mb_string()) {
+        $convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
+
+        return mb_encode_numericentity($source, $convmap, 'UTF-8');
+    }
+
+    // Sinon methode pas a pas
+    static $decrement;
+    static $shift;
+
+    // Cf. php.net, par Ronen. Adapte pour compatibilite < php4
+    if (!is_array($decrement)) {
+        // array used to figure what number to decrement from character order value
+        // according to number of characters used to map unicode to ascii by utf-8
+        $decrement[4] = 240;
+        $decrement[3] = 224;
+        $decrement[2] = 192;
+        $decrement[1] = 0;
+        // the number of bits to shift each charNum by
+        $shift[1][0] = 0;
+        $shift[2][0] = 6;
+        $shift[2][1] = 0;
+        $shift[3][0] = 12;
+        $shift[3][1] = 6;
+        $shift[3][2] = 0;
+        $shift[4][0] = 18;
+        $shift[4][1] = 12;
+        $shift[4][2] = 6;
+        $shift[4][3] = 0;
+    }
+
+    $pos = 0;
+    $len = strlen($source);
+    $encodedString = '';
+    while ($pos < $len) {
+        $char = '';
+        $ischar = false;
+        $asciiPos = ord(substr($source, $pos, 1));
+        if (($asciiPos >= 240) && ($asciiPos <= 255)) {
+            // 4 chars representing one unicode character
+            $thisLetter = substr($source, $pos, 4);
+            $pos += 4;
+        } else {
+            if (($asciiPos >= 224) && ($asciiPos <= 239)) {
+                // 3 chars representing one unicode character
+                $thisLetter = substr($source, $pos, 3);
+                $pos += 3;
+            } else {
+                if (($asciiPos >= 192) && ($asciiPos <= 223)) {
+                    // 2 chars representing one unicode character
+                    $thisLetter = substr($source, $pos, 2);
+                    $pos += 2;
+                } else {
+                    // 1 char (lower ascii)
+                    $thisLetter = substr($source, $pos, 1);
+                    $pos += 1;
+                    $char = $thisLetter;
+                    $ischar = true;
+                }
+            }
+        }
+
+        if ($ischar) {
+            $encodedString .= $char;
+        } else {  // process the string representing the letter to a unicode entity
+            $thisLen = strlen($thisLetter);
+            $thisPos = 0;
+            $decimalCode = 0;
+            while ($thisPos < $thisLen) {
+                $thisCharOrd = ord(substr($thisLetter, $thisPos, 1));
+                if ($thisPos == 0) {
+                    $charNum = intval($thisCharOrd - $decrement[$thisLen]);
+                    $decimalCode += ($charNum << $shift[$thisLen][$thisPos]);
+                } else {
+                    $charNum = intval($thisCharOrd - 128);
+                    $decimalCode += ($charNum << $shift[$thisLen][$thisPos]);
+                }
+                $thisPos++;
+            }
+            $encodedLetter = "&#" . preg_replace('/^0+/', '', $decimalCode) . ';';
+            $encodedString .= $encodedLetter;
+        }
+    }
+
+    return $encodedString;
 }
 
 /**
@@ -667,32 +667,32 @@
  **/
 function utf_32_to_unicode($source) {
 
-	// mb_string : methode rapide
-	if (init_mb_string()) {
-		$convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
-		$source = mb_encode_numericentity($source, $convmap, 'UTF-32LE');
-
-		return str_replace(chr(0), '', $source);
-	}
-
-	// Sinon methode lente
-	$texte = '';
-	while ($source) {
-		$words = unpack("V*", substr($source, 0, 1024));
-		$source = substr($source, 1024);
-		foreach ($words as $word) {
-			if ($word < 128) {
-				$texte .= chr($word);
-			} // ignorer le BOM - http://www.unicode.org/faq/utf_bom.html
-			else {
-				if ($word != 65279) {
-					$texte .= '&#' . $word . ';';
-				}
-			}
-		}
-	}
-
-	return $texte;
+    // mb_string : methode rapide
+    if (init_mb_string()) {
+        $convmap = array(0x7F, 0xFFFFFF, 0x0, 0xFFFFFF);
+        $source = mb_encode_numericentity($source, $convmap, 'UTF-32LE');
+
+        return str_replace(chr(0), '', $source);
+    }
+
+    // Sinon methode lente
+    $texte = '';
+    while ($source) {
+        $words = unpack("V*", substr($source, 0, 1024));
+        $source = substr($source, 1024);
+        foreach ($words as $word) {
+            if ($word < 128) {
+                $texte .= chr($word);
+            } // ignorer le BOM - http://www.unicode.org/faq/utf_bom.html
+            else {
+                if ($word != 65279) {
+                    $texte .= '&#' . $word . ';';
+                }
+            }
+        }
+    }
+
+    return $texte;
 
 }
 
@@ -710,21 +710,21 @@
  *    Caractère utf8 si trouvé, '' sinon
  **/
 function caractere_utf_8($num) {
-	$num = intval($num);
-	if ($num < 128) {
-		return chr($num);
-	}
-	if ($num < 2048) {
-		return chr(($num >> 6) + 192) . chr(($num & 63) + 128);
-	}
-	if ($num < 65536) {
-		return chr(($num >> 12) + 224) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
-	}
-	if ($num < 1114112) {
-		return chr(($num >> 18) + 240) . chr((($num >> 12) & 63) + 128) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
-	}
-
-	return '';
+    $num = intval($num);
+    if ($num < 128) {
+        return chr($num);
+    }
+    if ($num < 2048) {
+        return chr(($num >> 6) + 192) . chr(($num & 63) + 128);
+    }
+    if ($num < 65536) {
+        return chr(($num >> 12) + 224) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
+    }
+    if ($num < 1114112) {
+        return chr(($num >> 18) + 240) . chr((($num >> 12) & 63) + 128) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
+    }
+
+    return '';
 }
 
 /**
@@ -737,30 +737,30 @@  discard block
 block discarded – undo
  **/
 function unicode_to_utf_8($texte) {
 
-	// 1. Entites &#128; et suivantes
-	$vu = array();
-	if (preg_match_all(',&#0*([1-9][0-9][0-9]+);,S',
-		$texte, $regs, PREG_SET_ORDER)) {
-		foreach ($regs as $reg) {
-			if ($reg[1] > 127 and !isset($vu[$reg[0]])) {
-				$vu[$reg[0]] = caractere_utf_8($reg[1]);
-			}
-		}
-	}
-	//$texte = str_replace(array_keys($vu), array_values($vu), $texte);
-
-	// 2. Entites > &#xFF;
-	//$vu = array();
-	if (preg_match_all(',&#x0*([1-9a-f][0-9a-f][0-9a-f]+);,iS',
-		$texte, $regs, PREG_SET_ORDER)) {
-		foreach ($regs as $reg) {
-			if (!isset($vu[$reg[0]])) {
-				$vu[$reg[0]] = caractere_utf_8(hexdec($reg[1]));
-			}
-		}
-	}
-
-	return str_replace(array_keys($vu), array_values($vu), $texte);
+    // 1. Entites &#128; et suivantes
+    $vu = array();
+    if (preg_match_all(',&#0*([1-9][0-9][0-9]+);,S',
+        $texte, $regs, PREG_SET_ORDER)) {
+        foreach ($regs as $reg) {
+            if ($reg[1] > 127 and !isset($vu[$reg[0]])) {
+                $vu[$reg[0]] = caractere_utf_8($reg[1]);
+            }
+        }
+    }
+    //$texte = str_replace(array_keys($vu), array_values($vu), $texte);
+
+    // 2. Entites > &#xFF;
+    //$vu = array();
+    if (preg_match_all(',&#x0*([1-9a-f][0-9a-f][0-9a-f]+);,iS',
+        $texte, $regs, PREG_SET_ORDER)) {
+        foreach ($regs as $reg) {
+            if (!isset($vu[$reg[0]])) {
+                $vu[$reg[0]] = caractere_utf_8(hexdec($reg[1]));
+            }
+        }
+    }
+
+    return str_replace(array_keys($vu), array_values($vu), $texte);
 
 }
 
@@ -773,15 +773,15 @@  discard block
 block discarded – undo
  *     Texte converti
  **/
 function unicode_to_javascript($texte) {
-	$vu = array();
-	while (preg_match(',&#0*([0-9]+);,S', $texte, $regs) and !isset($vu[$regs[1]])) {
-		$num = $regs[1];
-		$vu[$num] = true;
-		$s = '\u' . sprintf("%04x", $num);
-		$texte = str_replace($regs[0], $s, $texte);
-	}
-
-	return $texte;
+    $vu = array();
+    while (preg_match(',&#0*([0-9]+);,S', $texte, $regs) and !isset($vu[$regs[1]])) {
+        $num = $regs[1];
+        $vu[$num] = true;
+        $s = '\u' . sprintf("%04x", $num);
+        $texte = str_replace($regs[0], $s, $texte);
+    }
+
+    return $texte;
 }
 
 /**
@@ -793,11 +793,11 @@  discard block
 block discarded – undo
  *     Texte converti
  **/
 function javascript_to_unicode($texte) {
-	while (preg_match(",%u([0-9A-F][0-9A-F][0-9A-F][0-9A-F]),", $texte, $regs)) {
-		$texte = str_replace($regs[0], "&#" . hexdec($regs[1]) . ";", $texte);
-	}
+    while (preg_match(",%u([0-9A-F][0-9A-F][0-9A-F][0-9A-F]),", $texte, $regs)) {
+        $texte = str_replace($regs[0], "&#" . hexdec($regs[1]) . ";", $texte);
+    }
 
-	return $texte;
+    return $texte;
 }
 
 /**
@@ -809,11 +809,11 @@  discard block
 block discarded – undo
  *     Texte converti
  **/
 function javascript_to_binary($texte) {
-	while (preg_match(",%([0-9A-F][0-9A-F]),", $texte, $regs)) {
-		$texte = str_replace($regs[0], chr(hexdec($regs[1])), $texte);
-	}
+    while (preg_match(",%([0-9A-F][0-9A-F]),", $texte, $regs)) {
+        $texte = str_replace($regs[0], chr(hexdec($regs[1])), $texte);
+    }
 
-	return $texte;
+    return $texte;
 }
 
 
@@ -831,26 +831,26 @@  discard block
 block discarded – undo
  * @return string
  */
 function translitteration_rapide($texte, $charset = 'AUTO', $complexe = '') {
-	static $trans = [];
-	if ($charset == 'AUTO') {
-		$charset = $GLOBALS['meta']['charset'];
-	}
-	if (!strlen($texte)) {
-		return $texte;
-	}
-
-	$table_translit = 'translit' . $complexe;
-
-	// 2. Translitterer grace a la table predefinie
-	if (!isset($trans[$complexe])) {
-		$trans[$complexe] = [];
-		load_charset($table_translit);
-		foreach ($GLOBALS['CHARSET'][$table_translit] as $key => $val) {
-			$trans[$complexe][caractere_utf_8($key)] = $val;
-		}
-	}
-
-	return str_replace(array_keys($trans[$complexe]), array_values($trans[$complexe]), $texte);
+    static $trans = [];
+    if ($charset == 'AUTO') {
+        $charset = $GLOBALS['meta']['charset'];
+    }
+    if (!strlen($texte)) {
+        return $texte;
+    }
+
+    $table_translit = 'translit' . $complexe;
+
+    // 2. Translitterer grace a la table predefinie
+    if (!isset($trans[$complexe])) {
+        $trans[$complexe] = [];
+        load_charset($table_translit);
+        foreach ($GLOBALS['CHARSET'][$table_translit] as $key => $val) {
+            $trans[$complexe][caractere_utf_8($key)] = $val;
+        }
+    }
+
+    return str_replace(array_keys($trans[$complexe]), array_values($trans[$complexe]), $texte);
 }
 
 /**
@@ -873,14 +873,14 @@  discard block
 block discarded – undo
  * @return string
  */
 function translitteration($texte, $charset = 'AUTO', $complexe = '') {
-	// 0. Supprimer les caracteres illegaux
-	include_spip('inc/filtres');
-	$texte = corriger_caracteres($texte);
+    // 0. Supprimer les caracteres illegaux
+    include_spip('inc/filtres');
+    $texte = corriger_caracteres($texte);
 
-	// 1. Passer le charset et les &eacute en utf-8
-	$texte = unicode_to_utf_8(html2unicode(charset2unicode($texte, $charset, true)));
+    // 1. Passer le charset et les &eacute en utf-8
+    $texte = unicode_to_utf_8(html2unicode(charset2unicode($texte, $charset, true)));
 
-	return translitteration_rapide($texte, $charset, $complexe);
+    return translitteration_rapide($texte, $charset, $complexe);
 }
 
 /**
@@ -895,17 +895,17 @@  discard block
 block discarded – undo
  * @return string
  */
 function translitteration_complexe($texte, $chiffres = false) {
-	$texte = translitteration($texte, 'AUTO', 'complexe');
+    $texte = translitteration($texte, 'AUTO', 'complexe');
 
-	if ($chiffres) {
-		$texte = preg_replace_callback(
-			"/[aeiuoyd]['`?~.^+(-]{1,2}/S",
-			function($m) { return translitteration_chiffree($m[0]); },
-			$texte
-		);
-	}
+    if ($chiffres) {
+        $texte = preg_replace_callback(
+            "/[aeiuoyd]['`?~.^+(-]{1,2}/S",
+            function($m) { return translitteration_chiffree($m[0]); },
+            $texte
+        );
+    }
 
-	return $texte;
+    return $texte;
 }
 
 /**
@@ -917,7 +917,7 @@  discard block
 block discarded – undo
  * @return string
  */
 function translitteration_chiffree($car) {
-	return strtr($car, "'`?~.^+(-", "123456789");
+    return strtr($car, "'`?~.^+(-", "123456789");
 }
 
 
@@ -930,7 +930,7 @@  discard block
 block discarded – undo
  *    true s'il a un BOM
  **/
 function bom_utf8($texte) {
-	return (substr($texte, 0, 3) == chr(0xEF) . chr(0xBB) . chr(0xBF));
+    return (substr($texte, 0, 3) == chr(0xEF) . chr(0xBB) . chr(0xBF));
 }
 
 /**
@@ -947,18 +947,18 @@  discard block
 block discarded – undo
  *     true si c'est le cas
  **/
 function is_utf8($string) {
-	return !strlen(
-		preg_replace(
-			',[\x09\x0A\x0D\x20-\x7E]'            # ASCII
-			. '|[\xC2-\xDF][\x80-\xBF]'             # non-overlong 2-byte
-			. '|\xE0[\xA0-\xBF][\x80-\xBF]'         # excluding overlongs
-			. '|[\xE1-\xEC\xEE\xEF][\x80-\xBF]{2}'  # straight 3-byte
-			. '|\xED[\x80-\x9F][\x80-\xBF]'         # excluding surrogates
-			. '|\xF0[\x90-\xBF][\x80-\xBF]{2}'      # planes 1-3
-			. '|[\xF1-\xF3][\x80-\xBF]{3}'          # planes 4-15
-			. '|\xF4[\x80-\x8F][\x80-\xBF]{2}'      # plane 16
-			. ',sS',
-			'', $string));
+    return !strlen(
+        preg_replace(
+            ',[\x09\x0A\x0D\x20-\x7E]'            # ASCII
+            . '|[\xC2-\xDF][\x80-\xBF]'             # non-overlong 2-byte
+            . '|\xE0[\xA0-\xBF][\x80-\xBF]'         # excluding overlongs
+            . '|[\xE1-\xEC\xEE\xEF][\x80-\xBF]{2}'  # straight 3-byte
+            . '|\xED[\x80-\x9F][\x80-\xBF]'         # excluding surrogates
+            . '|\xF0[\x90-\xBF][\x80-\xBF]{2}'      # planes 1-3
+            . '|[\xF1-\xF3][\x80-\xBF]{3}'          # planes 4-15
+            . '|\xF4[\x80-\x8F][\x80-\xBF]{2}'      # plane 16
+            . ',sS',
+            '', $string));
 }
 
 /**
@@ -970,10 +970,10 @@  discard block
 block discarded – undo
  *     true si c'est le cas
  **/
 function is_ascii($string) {
-	return !strlen(
-		preg_replace(
-			',[\x09\x0A\x0D\x20-\x7E],sS',
-			'', $string));
+    return !strlen(
+        preg_replace(
+            ',[\x09\x0A\x0D\x20-\x7E],sS',
+            '', $string));
 }
 
 /**
@@ -992,58 +992,58 @@  discard block
 block discarded – undo
  **/
 function transcoder_page($texte, $headers = '') {
 
-	// Si tout est < 128 pas la peine d'aller plus loin
-	if (is_ascii($texte)) {
-		#spip_log('charset: ascii');
-		return $texte;
-	}
-
-	// Reconnaitre le BOM utf-8 (0xEFBBBF)
-	if (bom_utf8($texte)) {
-		$charset = 'utf-8';
-		$texte = substr($texte, 3);
-	} // charset precise par le contenu (xml)
-	else {
-		if (preg_match(
-			',<[?]xml[^>]*encoding[^>]*=[^>]*([-_a-z0-9]+?),UimsS', $texte, $regs)) {
-			$charset = trim(strtolower($regs[1]));
-		} // charset precise par le contenu (html)
-		else {
-			if (preg_match(
-					',<(meta|html|body)[^>]*charset[^>]*=[^>]*([-_a-z0-9]+?),UimsS',
-					$texte, $regs)
-				# eviter #CHARSET des squelettes
-				and (($tmp = trim(strtolower($regs[2]))) != 'charset')
-			) {
-				$charset = $tmp;
-			} // charset de la reponse http
-			else {
-				if (preg_match(',charset=([-_a-z0-9]+),i', $headers, $regs)) {
-					$charset = trim(strtolower($regs[1]));
-				} else {
-					$charset = '';
-				}
-			}
-		}
-	}
-	// normaliser les noms du shif-jis japonais
-	if (preg_match(',^(x|shift)[_-]s?jis$,i', $charset)) {
-		$charset = 'shift-jis';
-	}
-
-	if ($charset) {
-		spip_log("charset: $charset");
-	} else {
-		// valeur par defaut
-		if (is_utf8($texte)) {
-			$charset = 'utf-8';
-		} else {
-			$charset = 'iso-8859-1';
-		}
-		spip_log("charset probable: $charset");
-	}
-
-	return importer_charset($texte, $charset);
+    // Si tout est < 128 pas la peine d'aller plus loin
+    if (is_ascii($texte)) {
+        #spip_log('charset: ascii');
+        return $texte;
+    }
+
+    // Reconnaitre le BOM utf-8 (0xEFBBBF)
+    if (bom_utf8($texte)) {
+        $charset = 'utf-8';
+        $texte = substr($texte, 3);
+    } // charset precise par le contenu (xml)
+    else {
+        if (preg_match(
+            ',<[?]xml[^>]*encoding[^>]*=[^>]*([-_a-z0-9]+?),UimsS', $texte, $regs)) {
+            $charset = trim(strtolower($regs[1]));
+        } // charset precise par le contenu (html)
+        else {
+            if (preg_match(
+                    ',<(meta|html|body)[^>]*charset[^>]*=[^>]*([-_a-z0-9]+?),UimsS',
+                    $texte, $regs)
+                # eviter #CHARSET des squelettes
+                and (($tmp = trim(strtolower($regs[2]))) != 'charset')
+            ) {
+                $charset = $tmp;
+            } // charset de la reponse http
+            else {
+                if (preg_match(',charset=([-_a-z0-9]+),i', $headers, $regs)) {
+                    $charset = trim(strtolower($regs[1]));
+                } else {
+                    $charset = '';
+                }
+            }
+        }
+    }
+    // normaliser les noms du shif-jis japonais
+    if (preg_match(',^(x|shift)[_-]s?jis$,i', $charset)) {
+        $charset = 'shift-jis';
+    }
+
+    if ($charset) {
+        spip_log("charset: $charset");
+    } else {
+        // valeur par defaut
+        if (is_utf8($texte)) {
+            $charset = 'utf-8';
+        } else {
+            $charset = 'iso-8859-1';
+        }
+        spip_log("charset probable: $charset");
+    }
+
+    return importer_charset($texte, $charset);
 }
 
 
@@ -1067,26 +1067,26 @@  discard block
 block discarded – undo
  *     Le texte coupé
  **/
 function spip_substr($c, $start = 0, $length = null) {
-	// Si ce n'est pas utf-8, utiliser substr
-	if ($GLOBALS['meta']['charset'] != 'utf-8') {
-		if ($length) {
-			return substr($c, $start, $length);
-		} else {
-			substr($c, $start);
-		}
-	}
-
-	// Si utf-8, voir si on dispose de mb_string
-	if (init_mb_string()) {
-		if ($length) {
-			return mb_substr($c, $start, $length);
-		} else {
-			return mb_substr($c, $start);
-		}
-	}
-
-	// Version manuelle (cf. ci-dessous)
-	return spip_substr_manuelle($c, $start, $length);
+    // Si ce n'est pas utf-8, utiliser substr
+    if ($GLOBALS['meta']['charset'] != 'utf-8') {
+        if ($length) {
+            return substr($c, $start, $length);
+        } else {
+            substr($c, $start);
+        }
+    }
+
+    // Si utf-8, voir si on dispose de mb_string
+    if (init_mb_string()) {
+        if ($length) {
+            return mb_substr($c, $start, $length);
+        } else {
+            return mb_substr($c, $start);
+        }
+    }
+
+    // Version manuelle (cf. ci-dessous)
+    return spip_substr_manuelle($c, $start, $length);
 }
 
 
@@ -1105,40 +1105,40 @@  discard block
 block discarded – undo
  **/
 function spip_substr_manuelle($c, $start, $length = null) {
 
-	// Cas pathologique
-	if ($length === 0) {
-		return '';
-	}
-
-	// S'il y a un demarrage, on se positionne
-	if ($start > 0) {
-		$c = substr($c, strlen(spip_substr_manuelle($c, 0, $start)));
-	} elseif ($start < 0) {
-		return spip_substr_manuelle($c, spip_strlen($c) + $start, $length);
-	}
-
-	if (!$length) {
-		return $c;
-	}
-
-	if ($length > 0) {
-		// on prend n fois la longueur desiree, pour etre surs d'avoir tout
-		// (un caractere utf-8 prenant au maximum n bytes)
-		$n = 0;
-		while (preg_match(',[\x80-\xBF]{' . (++$n) . '},', $c)) {
-			;
-		}
-		$c = substr($c, 0, $n * $length);
-		// puis, tant qu'on est trop long, on coupe...
-		while (($l = spip_strlen($c)) > $length) {
-			$c = substr($c, 0, $length - $l);
-		}
-
-		return $c;
-	}
-
-	// $length < 0
-	return spip_substr_manuelle($c, 0, spip_strlen($c) + $length);
+    // Cas pathologique
+    if ($length === 0) {
+        return '';
+    }
+
+    // S'il y a un demarrage, on se positionne
+    if ($start > 0) {
+        $c = substr($c, strlen(spip_substr_manuelle($c, 0, $start)));
+    } elseif ($start < 0) {
+        return spip_substr_manuelle($c, spip_strlen($c) + $start, $length);
+    }
+
+    if (!$length) {
+        return $c;
+    }
+
+    if ($length > 0) {
+        // on prend n fois la longueur desiree, pour etre surs d'avoir tout
+        // (un caractere utf-8 prenant au maximum n bytes)
+        $n = 0;
+        while (preg_match(',[\x80-\xBF]{' . (++$n) . '},', $c)) {
+            ;
+        }
+        $c = substr($c, 0, $n * $length);
+        // puis, tant qu'on est trop long, on coupe...
+        while (($l = spip_strlen($c)) > $length) {
+            $c = substr($c, 0, $length - $l);
+        }
+
+        return $c;
+    }
+
+    // $length < 0
+    return spip_substr_manuelle($c, 0, spip_strlen($c) + $length);
 }
 
 /**
@@ -1152,14 +1152,14 @@  discard block
 block discarded – undo
  *     La chaîne avec une majuscule sur le premier mot
  */
 function spip_ucfirst($c) {
-	// Si on n'a pas mb_* ou si ce n'est pas utf-8, utiliser ucfirst
-	if (!init_mb_string() or $GLOBALS['meta']['charset'] != 'utf-8') {
-		return ucfirst($c);
-	}
+    // Si on n'a pas mb_* ou si ce n'est pas utf-8, utiliser ucfirst
+    if (!init_mb_string() or $GLOBALS['meta']['charset'] != 'utf-8') {
+        return ucfirst($c);
+    }
 
-	$lettre1 = mb_strtoupper(spip_substr($c, 0, 1));
+    $lettre1 = mb_strtoupper(spip_substr($c, 0, 1));
 
-	return $lettre1 . spip_substr($c, 1);
+    return $lettre1 . spip_substr($c, 1);
 }
 
 /**
@@ -1173,12 +1173,12 @@  discard block
 block discarded – undo
  *     La chaîne en minuscules
  */
 function spip_strtolower($c) {
-	// Si on n'a pas mb_* ou si ce n'est pas utf-8, utiliser strtolower 
-	if (!init_mb_string() or $GLOBALS['meta']['charset'] != 'utf-8') {
-		return strtolower($c);
-	}
+    // Si on n'a pas mb_* ou si ce n'est pas utf-8, utiliser strtolower 
+    if (!init_mb_string() or $GLOBALS['meta']['charset'] != 'utf-8') {
+        return strtolower($c);
+    }
 
-	return mb_strtolower($c);
+    return mb_strtolower($c);
 }
 
 /**
@@ -1192,23 +1192,23 @@  discard block
 block discarded – undo
  *     Longueur de la chaîne
  */
 function spip_strlen($c) {
-	// On transforme les sauts de ligne pour ne pas compter deux caractères
-	$c = str_replace("\r\n", "\n", $c);
-
-	// Si ce n'est pas utf-8, utiliser strlen
-	if ($GLOBALS['meta']['charset'] != 'utf-8') {
-		return strlen($c);
-	}
-
-	// Sinon, utiliser mb_strlen() si disponible
-	if (init_mb_string()) {
-		return mb_strlen($c);
-	}
-
-	// Methode manuelle : on supprime les bytes 10......,
-	// on compte donc les ascii (0.......) et les demarrages
-	// de caracteres utf-8 (11......)
-	return strlen(preg_replace(',[\x80-\xBF],S', '', $c));
+    // On transforme les sauts de ligne pour ne pas compter deux caractères
+    $c = str_replace("\r\n", "\n", $c);
+
+    // Si ce n'est pas utf-8, utiliser strlen
+    if ($GLOBALS['meta']['charset'] != 'utf-8') {
+        return strlen($c);
+    }
+
+    // Sinon, utiliser mb_strlen() si disponible
+    if (init_mb_string()) {
+        return mb_strlen($c);
+    }
+
+    // Methode manuelle : on supprime les bytes 10......,
+    // on compte donc les ascii (0.......) et les demarrages
+    // de caracteres utf-8 (11......)
+    return strlen(preg_replace(',[\x80-\xBF],S', '', $c));
 }
 
 // Initialisation
@@ -1218,14 +1218,14 @@  discard block
 block discarded – undo
 // dans les preg_replace pour ne pas casser certaines lettres accentuees :
 // en utf-8 chr(195).chr(160) = a` alors qu'en iso-latin chr(160) = nbsp
 if (!isset($GLOBALS['meta']['pcre_u'])
-	or (isset($_GET['var_mode']) and !isset($_GET['var_profile']))
+    or (isset($_GET['var_mode']) and !isset($_GET['var_profile']))
 ) {
-	include_spip('inc/meta');
-	ecrire_meta('pcre_u',
-		$u = (lire_config('charset', _DEFAULT_CHARSET) == 'utf-8'
-			and test_pcre_unicode())
-			? 'u' : ''
-	);
+    include_spip('inc/meta');
+    ecrire_meta('pcre_u',
+        $u = (lire_config('charset', _DEFAULT_CHARSET) == 'utf-8'
+            and test_pcre_unicode())
+            ? 'u' : ''
+    );
 }
 
 
@@ -1241,17 +1241,17 @@  discard block
 block discarded – undo
  *     en unicode : &#128169;
  */
 function utf8_noplanes($x) {
-	$regexp_utf8_4bytes = '/(
+    $regexp_utf8_4bytes = '/(
       \xF0[\x90-\xBF][\x80-\xBF]{2}     # planes 1-3
    | [\xF1-\xF3][\x80-\xBF]{3}          # planes 4-15
    |  \xF4[\x80-\x8F][\x80-\xBF]{2}     # plane 16
 )/xS';
-	if (preg_match_all($regexp_utf8_4bytes, $x, $z, PREG_PATTERN_ORDER)) {
-		foreach ($z[0] as $k) {
-			$ku = utf_8_to_unicode($k);
-			$x = str_replace($k, $ku, $x);
-		}
-	}
-
-	return $x;
+    if (preg_match_all($regexp_utf8_4bytes, $x, $z, PREG_PATTERN_ORDER)) {
+        foreach ($z[0] as $k) {
+            $ku = utf_8_to_unicode($k);
+            $x = str_replace($k, $ku, $x);
+        }
+    }
+
+    return $x;
 }

Please login to merge, or discard this patch.

Spacing +51 added lines, -51 removed lines patch added patch discarded remove patch

		@@ -73,7 +73,7 @@ discard block
		block discarded – undo
73	73	}
74	74	}
75	75
76		- if (find_in_path($charset . '.php', 'charsets/', true)) {
	76	+ if (find_in_path($charset.'.php', 'charsets/', true)) {
77	77	return $charset;
78	78	} else {
79	79	spip_log("Erreur: pas de fichier de conversion 'charsets/$charset'");
		@@ -159,7 +159,7 @@ discard block
		block discarded – undo
159	159	static $pcre_ok = 0;
160	160
161	161	if (!$pcre_ok) {
162		- $s = " " . chr(195) . chr(169) . "t" . chr(195) . chr(169) . " ";
	162	+ $s = " ".chr(195).chr(169)."t".chr(195).chr(169)." ";
163	163	if (preg_match(',\W...\W,u', $s)) {
164	164	$pcre_ok = 1;
165	165	} else {
		@@ -260,38 +260,38 @@ discard block
		block discarded – undo
260	260
261	261	if (!isset($trans[$charset][$charset_cible])) {
262	262	$trans[$charset][$charset_cible] = array(
263		- $p . chr(128) => "€",
264		- $p . chr(129) => ' ', # pas affecte
265		- $p . chr(130) => "‚",
266		- $p . chr(131) => "ƒ",
267		- $p . chr(132) => "„",
268		- $p . chr(133) => "…",
269		- $p . chr(134) => "†",
270		- $p . chr(135) => "‡",
271		- $p . chr(136) => "ˆ",
272		- $p . chr(137) => "‰",
273		- $p . chr(138) => "Š",
274		- $p . chr(139) => "‹",
275		- $p . chr(140) => "Œ",
276		- $p . chr(141) => ' ', # pas affecte
277		- $p . chr(142) => "Ž",
278		- $p . chr(143) => ' ', # pas affecte
279		- $p . chr(144) => ' ', # pas affecte
280		- $p . chr(145) => "‘",
281		- $p . chr(146) => "’",
282		- $p . chr(147) => "“",
283		- $p . chr(148) => "”",
284		- $p . chr(149) => "•",
285		- $p . chr(150) => "–",
286		- $p . chr(151) => "—",
287		- $p . chr(152) => "˜",
288		- $p . chr(153) => "™",
289		- $p . chr(154) => "š",
290		- $p . chr(155) => "›",
291		- $p . chr(156) => "œ",
292		- $p . chr(157) => ' ', # pas affecte
293		- $p . chr(158) => "ž",
294		- $p . chr(159) => "Ÿ",
	263	+ $p.chr(128) => "€",
	264	+ $p.chr(129) => ' ', # pas affecte
	265	+ $p.chr(130) => "‚",
	266	+ $p.chr(131) => "ƒ",
	267	+ $p.chr(132) => "„",
	268	+ $p.chr(133) => "…",
	269	+ $p.chr(134) => "†",
	270	+ $p.chr(135) => "‡",
	271	+ $p.chr(136) => "ˆ",
	272	+ $p.chr(137) => "‰",
	273	+ $p.chr(138) => "Š",
	274	+ $p.chr(139) => "‹",
	275	+ $p.chr(140) => "Œ",
	276	+ $p.chr(141) => ' ', # pas affecte
	277	+ $p.chr(142) => "Ž",
	278	+ $p.chr(143) => ' ', # pas affecte
	279	+ $p.chr(144) => ' ', # pas affecte
	280	+ $p.chr(145) => "‘",
	281	+ $p.chr(146) => "’",
	282	+ $p.chr(147) => "“",
	283	+ $p.chr(148) => "”",
	284	+ $p.chr(149) => "•",
	285	+ $p.chr(150) => "–",
	286	+ $p.chr(151) => "—",
	287	+ $p.chr(152) => "˜",
	288	+ $p.chr(153) => "™",
	289	+ $p.chr(154) => "š",
	290	+ $p.chr(155) => "›",
	291	+ $p.chr(156) => "œ",
	292	+ $p.chr(157) => ' ', # pas affecte
	293	+ $p.chr(158) => "ž",
	294	+ $p.chr(159) => "Ÿ",
295	295	);
296	296	if ($charset_cible != 'unicode') {
297	297	foreach ($trans[$charset][$charset_cible] as $k => $c) {
		@@ -421,7 +421,7 @@ discard block
		block discarded – undo
421	421	and is_array($GLOBALS['CHARSET'][$cset])
422	422	) {
423	423	foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
424		- $trans[$charset][chr($key)] = '&#' . $val . ';';
	424	+ $trans[$charset][chr($key)] = '&#'.$val.';';
425	425	}
426	426	}
427	427	}
		@@ -488,11 +488,11 @@ discard block
		block discarded – undo
488	488	$h = dechex($e);
489	489	if ($s = isset($CHARSET_REVERSE[$charset][$e])) {
490	490	$s = $CHARSET_REVERSE[$charset][$e];
491		- $t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($s);
492		- $t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($s);
	491	+ $t['&#'.$e.';'] = $t['&#0'.$e.';'] = $t['&#00'.$e.';'] = chr($s);
	492	+ $t['&#x'.$h.';'] = $t['&#x0'.$h.';'] = $t['&#x00'.$h.';'] = chr($s);
493	493	} else {
494		- $t['&#' . $e . ';'] = $t['&#0' . $e . ';'] = $t['&#00' . $e . ';'] = chr($e);
495		- $t['&#x' . $h . ';'] = $t['&#x0' . $h . ';'] = $t['&#x00' . $h . ';'] = chr($e);
	494	+ $t['&#'.$e.';'] = $t['&#0'.$e.';'] = $t['&#00'.$e.';'] = chr($e);
	495	+ $t['&#x'.$h.';'] = $t['&#x0'.$h.';'] = $t['&#x00'.$h.';'] = chr($e);
496	496	}
497	497	}
498	498	}
		@@ -536,7 +536,7 @@ discard block
		block discarded – undo
536	536	and is_array($GLOBALS['CHARSET'][$cset])
537	537	) {
538	538	foreach ($GLOBALS['CHARSET'][$cset] as $key => $val) {
539		- $trans[$charset][chr($key)] = unicode2charset('&#' . $val . ';');
	539	+ $trans[$charset][chr($key)] = unicode2charset('&#'.$val.';');
540	540	}
541	541	}
542	542	}
		@@ -643,7 +643,7 @@ discard block
		block discarded – undo
643	643	}
644	644	$thisPos++;
645	645	}
646		- $encodedLetter = "&#" . preg_replace('/^0+/', '', $decimalCode) . ';';
	646	+ $encodedLetter = "&#".preg_replace('/^0+/', '', $decimalCode).';';
647	647	$encodedString .= $encodedLetter;
648	648	}
649	649	}
		@@ -686,7 +686,7 @@ discard block
		block discarded – undo
686	686	} // ignorer le BOM - http://www.unicode.org/faq/utf_bom.html
687	687	else {
688	688	if ($word != 65279) {
689		- $texte .= '&#' . $word . ';';
	689	+ $texte .= '&#'.$word.';';
690	690	}
691	691	}
692	692	}
		@@ -715,13 +715,13 @@ discard block
		block discarded – undo
715	715	return chr($num);
716	716	}
717	717	if ($num < 2048) {
718		- return chr(($num >> 6) + 192) . chr(($num & 63) + 128);
	718	+ return chr(($num >> 6) + 192).chr(($num & 63) + 128);
719	719	}
720	720	if ($num < 65536) {
721		- return chr(($num >> 12) + 224) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
	721	+ return chr(($num >> 12) + 224).chr((($num >> 6) & 63) + 128).chr(($num & 63) + 128);
722	722	}
723	723	if ($num < 1114112) {
724		- return chr(($num >> 18) + 240) . chr((($num >> 12) & 63) + 128) . chr((($num >> 6) & 63) + 128) . chr(($num & 63) + 128);
	724	+ return chr(($num >> 18) + 240).chr((($num >> 12) & 63) + 128).chr((($num >> 6) & 63) + 128).chr(($num & 63) + 128);
725	725	}
726	726
727	727	return '';
		@@ -777,7 +777,7 @@ discard block
		block discarded – undo
777	777	while (preg_match(',&#0*([0-9]+);,S', $texte, $regs) and !isset($vu[$regs[1]])) {
778	778	$num = $regs[1];
779	779	$vu[$num] = true;
780		- $s = '\u' . sprintf("%04x", $num);
	780	+ $s = '\u'.sprintf("%04x", $num);
781	781	$texte = str_replace($regs[0], $s, $texte);
782	782	}
783	783
		@@ -794,7 +794,7 @@ discard block
		block discarded – undo
794	794	**/
795	795	function javascript_to_unicode($texte) {
796	796	while (preg_match(",%u([0-9A-F][0-9A-F][0-9A-F][0-9A-F]),", $texte, $regs)) {
797		- $texte = str_replace($regs[0], "&#" . hexdec($regs[1]) . ";", $texte);
	797	+ $texte = str_replace($regs[0], "&#".hexdec($regs[1]).";", $texte);
798	798	}
799	799
800	800	return $texte;
		@@ -839,7 +839,7 @@ discard block
		block discarded – undo
839	839	return $texte;
840	840	}
841	841
842		- $table_translit = 'translit' . $complexe;
	842	+ $table_translit = 'translit'.$complexe;
843	843
844	844	// 2. Translitterer grace a la table predefinie
845	845	if (!isset($trans[$complexe])) {
		@@ -930,7 +930,7 @@ discard block
		block discarded – undo
930	930	* true s'il a un BOM
931	931	**/
932	932	function bom_utf8($texte) {
933		- return (substr($texte, 0, 3) == chr(0xEF) . chr(0xBB) . chr(0xBF));
	933	+ return (substr($texte, 0, 3) == chr(0xEF).chr(0xBB).chr(0xBF));
934	934	}
935	935
936	936	/**
		@@ -1125,7 +1125,7 @@ discard block
		block discarded – undo
1125	1125	// on prend n fois la longueur desiree, pour etre surs d'avoir tout
1126	1126	// (un caractere utf-8 prenant au maximum n bytes)
1127	1127	$n = 0;
1128		- while (preg_match(',[\x80-\xBF]{' . (++$n) . '},', $c)) {
	1128	+ while (preg_match(',[\x80-\xBF]{'.(++$n).'},', $c)) {
1129	1129	;
1130	1130	}
1131	1131	$c = substr($c, 0, $n * $length);
		@@ -1159,7 +1159,7 @@ discard block
		block discarded – undo
1159	1159
1160	1160	$lettre1 = mb_strtoupper(spip_substr($c, 0, 1));
1161	1161
1162		- return $lettre1 . spip_substr($c, 1);
	1162	+ return $lettre1.spip_substr($c, 1);
1163	1163	}
1164	1164
1165	1165	/**

Please login to merge, or discard this patch.

spip / SPIP

Push — master ( 8414fb...da8260 )

Status

Category

Indentation +703 added lines, -703 removed lines patch added patch discarded remove patch

Spacing +51 added lines, -51 removed lines patch added patch discarded remove patch