328 lines
8.5 KiB
PHP

<?php
/* vim: set expandtab sw=4 ts=4 sts=4: */
/**
* Hold the PMA\libraries\Encoding class
*
* @package PhpMyAdmin
*/
namespace PMA\libraries;
use PMA\libraries\config\ConfigFile;
/**
* Encoding conversion helper class
*
* @package PhpMyAdmin
*/
class Encoding
{
/**
* None encoding conversion engine
*
* @var int
*/
const ENGINE_NONE = 0;
/**
* iconv encoding conversion engine
*
* @var int
*/
const ENGINE_ICONV = 1;
/**
* recode encoding conversion engine
*
* @var int
*/
const ENGINE_RECODE = 2;
/**
* mbstring encoding conversion engine
*
* @var int
*/
const ENGINE_MB = 3;
/**
* Chosen encoding engine
*
* @var int
*/
private static $_engine = null;
/**
* Map of conversion engine configurations
*
* Each entry contains:
*
* - function to detect
* - engine contant
* - extension name to warn when missing
*
* @var array
*/
private static $_enginemap = array(
'iconv' => array('iconv', self::ENGINE_ICONV, 'iconv'),
'recode' => array('recode_string', self::ENGINE_RECODE, 'recode'),
'mb' => array('mb_convert_encoding', self::ENGINE_MB, 'mbstring'),
'none' => array('isset', self::ENGINE_NONE, ''),
);
/**
* Order of automatic detection of engines
*
* @var array
*/
private static $_engineorder = array(
'mb', 'iconv', 'recode',
);
/**
* Kanji encodings list
*
* @var string
*/
private static $_kanji_encodings = 'ASCII,SJIS,EUC-JP,JIS';
/**
* Initializes encoding engine detecting available backends.
*
* @return void
*/
public static function initEngine()
{
$engine = 'auto';
if (isset($GLOBALS['cfg']['RecodingEngine'])) {
$engine = $GLOBALS['cfg']['RecodingEngine'];
}
/* Use user configuration */
if (isset(self::$_enginemap[$engine])) {
if (@function_exists(self::$_enginemap[$engine][0])) {
self::$_engine = self::$_enginemap[$engine][1];
return;
} else {
PMA_warnMissingExtension(self::$_enginemap[$engine][2]);
}
}
/* Autodetection */
foreach (self::$_engineorder as $engine) {
if (@function_exists(self::$_enginemap[$engine][0])) {
self::$_engine = self::$_enginemap[$engine][1];
return;
}
}
/* Fallback to none conversion */
self::$_engine = self::ENGINE_NONE;
}
/**
* Setter for engine. Use with caution, mostly useful for testing.
*
* @return void
*/
public static function setEngine($engine)
{
self::$_engine = $engine;
}
/**
* Checks whether there is any charset conversion supported
*
* @return bool
*/
public static function isSupported()
{
if (is_null(self::$_engine)) {
self::initEngine();
}
return self::$_engine != self::ENGINE_NONE;
}
/**
* Converts encoding of text according to parameters with detected
* conversion function.
*
* @param string $src_charset source charset
* @param string $dest_charset target charset
* @param string $what what to convert
*
* @return string converted text
*
* @access public
*/
public static function convertString($src_charset, $dest_charset, $what)
{
if ($src_charset == $dest_charset) {
return $what;
}
if (is_null(self::$_engine)) {
self::initEngine();
}
switch (self::$_engine) {
case self::ENGINE_RECODE:
return recode_string(
$src_charset . '..' . $dest_charset,
$what
);
case self::ENGINE_ICONV:
return iconv(
$src_charset,
$dest_charset .
(isset($GLOBALS['cfg']['IconvExtraParams']) ? $GLOBALS['cfg']['IconvExtraParams'] : ''),
$what
);
case self::ENGINE_MB:
return mb_convert_encoding(
$what,
$dest_charset,
$src_charset
);
default:
return $what;
}
}
/**
* Detects whether Kanji encoding is available
*
* @return bool
*/
public static function canConvertKanji()
{
return (
$GLOBALS['lang'] == 'ja' &&
function_exists('mb_convert_encoding')
);
}
/**
* Setter for Kanji encodings. Use with caution, mostly useful for testing.
*
* @return string
*/
public static function getKanjiEncodings()
{
return self::$_kanji_encodings;
}
/**
* Setter for Kanji encodings. Use with caution, mostly useful for testing.
*
* @return void
*/
public static function setKanjiEncodings($value)
{
self::$_kanji_encodings = $value;
}
/**
* Reverses SJIS & EUC-JP position in the encoding codes list
*
* @return void
*/
public static function kanjiChangeOrder()
{
$parts = explode(',', self::$_kanji_encodings);
if ($parts[1] == 'EUC-JP') {
self::$_kanji_encodings = 'ASCII,SJIS,EUC-JP,JIS';
} else {
self::$_kanji_encodings = 'ASCII,EUC-JP,SJIS,JIS';
}
}
/**
* Kanji string encoding convert
*
* @param string $str the string to convert
* @param string $enc the destination encoding code
* @param string $kana set 'kana' convert to JIS-X208-kana
*
* @return string the converted string
*/
public static function kanjiStrConv($str, $enc, $kana)
{
if ($enc == '' && $kana == '') {
return $str;
}
$string_encoding = mb_detect_encoding($str, self::$_kanji_encodings);
if ($string_encoding === false) {
$string_encoding = 'utf-8';
}
if ($kana == 'kana') {
$dist = mb_convert_kana($str, 'KV', $string_encoding);
$str = $dist;
}
if ($string_encoding != $enc && $enc != '') {
$dist = mb_convert_encoding($str, $enc, $string_encoding);
} else {
$dist = $str;
}
return $dist;
}
/**
* Kanji file encoding convert
*
* @param string $file the name of the file to convert
* @param string $enc the destination encoding code
* @param string $kana set 'kana' convert to JIS-X208-kana
*
* @return string the name of the converted file
*/
public static function kanjiFileConv($file, $enc, $kana)
{
if ($enc == '' && $kana == '') {
return $file;
}
$tmpfname = tempnam(ConfigFile::getDefaultTempDirectory(), $enc);
$fpd = fopen($tmpfname, 'wb');
$fps = fopen($file, 'r');
self::kanjiChangeOrder();
while (!feof($fps)) {
$line = fgets($fps, 4096);
$dist = self::kanjiStrConv($line, $enc, $kana);
fputs($fpd, $dist);
} // end while
self::kanjiChangeOrder();
fclose($fps);
fclose($fpd);
unlink($file);
return $tmpfname;
}
/**
* Defines radio form fields to switch between encoding modes
*
* @return string xhtml code for the radio controls
*/
public static function kanjiEncodingForm()
{
return '<ul><li>'
. '<input type="radio" name="knjenc" value="" checked="checked" '
. 'id="kj-none" />'
. '<label for="kj-none">'
/* l10n: This is currently used only in Japanese locales */
. _pgettext('None encoding conversion', 'None')
. '</label>'
. '<input type="radio" name="knjenc" value="EUC-JP" id="kj-euc" />'
. '<label for="kj-euc">EUC</label>'
. '<input type="radio" name="knjenc" value="SJIS" id="kj-sjis" />'
. '<label for="kj-sjis">SJIS</label>'
. '</li>'
. '<li>'
. '<input type="checkbox" name="xkana" value="kana" id="kj-kana" />'
. '<label for="kj-kana">'
/* l10n: This is currently used only in Japanese locales */
. __('Convert to Kana')
. '</label><br />'
. '</li></ul>';
}
}