关于这个翻译小工具的算法,很多人问我,因为有段时间了,最近一直没更新
下面就几个函数做些说明,以方便大家转换成其他语言。
整个算法不是我的,我只是把google的js翻译成php,就是需要总要研究google的js,
最开始使用在github上面,参考网址https://github.com/Stichoza/google-translate-php/issues/32
后来因为总要研究测试google的算法,就自己弄了这个小工具,
工具地址:http://www.tastemylife.com/
define('GOOGLE_URL', 'https://translate.google.cn/translate_a/');//这里定义google的网址
define('UA', isset($_SERVER['HTTP_USER_AGENT']) && !empty($_SERVER['HTTP_USER_AGENT']) ? $_SERVER['HTTP_USER_AGENT'] : 'Mozilla/5.0 (Android; Mobile; rv:22.0) Gecko/22.0 Firefox/22.0');
session_start();
//这个函数是无符号右移
//参考http://www.shangxueba.com/jingyan/1911053.html
function shr32($x, $bits)
{
if($bits <= 0){
return $x;
}
if($bits >= 32){
return 0;
}
$bin = decbin($x);
$l = strlen($bin);
if($l > 32){
$bin = substr($bin, $l - 32, 32);
}elseif($l < 32){
$bin = str_pad($bin, 32, '0', STR_PAD_LEFT);
}
return bindec(str_pad(substr($bin, 0, 32 - $bits), 32, '0', STR_PAD_LEFT));
}
//这个就是javascript的charCodeAt
//PHP版本的在这里http://www.phpjiayuan.com/90/225.html
function charCodeAt($str, $index)
{
$char = mb_substr($str, $index, 1, 'UTF-8');
if (mb_check_encoding($char, 'UTF-8'))
{
$ret = mb_convert_encoding($char, 'UTF-32BE', 'UTF-8');
return hexdec(bin2hex($ret));
}
else
{
return null;
}
}
//直接复制google
function RL($a, $b)
{
for($c = 0; $c < strlen($b) - 2; $c +=3) {
$d = $b{$c+2};
$d = $d >= 'a' ? charCodeAt($d,0) - 87 : intval($d);
$d = $b{$c+1} == '+' ? shr32($a, $d) : $a << $d;
$a = $b{$c} == '+' ? ($a + $d & 4294967295) : $a ^ $d;
}
return $a;
}
//静态TKK,动态获取请使用另外一个方法
function TKK()
{
$a = 561666268;
$b = 1526272306;
return 406398 . '.' . ($a + $b);
}
//直接复制google
function TL($a)
{
$tkk = explode('.', TKK());
$b = $tkk[0];
for($d = array(), $e = 0, $f = 0; $f < mb_strlen ( $a, 'UTF-8' ); $f ++) {
$g = charCodeAt ( $a, $f );
if (128 > $g) {
$d [$e ++] = $g;
} else {
if (2048 > $g) {
$d [$e ++] = $g >> 6 | 192;
} else {
if (55296 == ($g & 64512) && $f + 1 < mb_strlen ( $a, 'UTF-8' ) && 56320 == (charCodeAt ( $a, $f + 1 ) & 64512)) {
$g = 65536 + (($g & 1023) << 10) + (charCodeAt ( $a, ++ $f ) & 1023);
$d [$e ++] = $g >> 18 | 240;
$d [$e ++] = $g >> 12 & 63 | 128;
} else {
$d [$e ++] = $g >> 12 | 224;
$d [$e ++] = $g >> 6 & 63 | 128;
}
}
$d [$e ++] = $g & 63 | 128;
}
}
$a = $b;
for($e = 0; $e < count ( $d ); $e ++) {
$a += $d [$e];
$a = RL ( $a, '+-a^+6' );
}
$a = RL ( $a, "+-3^+b+-f" );
$a ^= $tkk[1];
if (0 > $a) {
$a = ($a & 2147483647) + 2147483648;
}
$a = fmod ( $a, pow ( 10, 6 ) );
return $a . "." . ($a ^ $b);
}
function translate($sl, $tl, $q, $param = 't?client=webapp', $method = 'get')
{
$tk = TL($q);
$q = urlencode(stripslashes($q));
$resultRegexes = array(
'/,+/' => ',',
'/\[,/' => '[',
);
$url = GOOGLE_URL . $param . "&sl=".$sl."&tl=".$tl."&hl=".$tl."&dt=bd&dt=ex&dt=ld&dt=md&dt=qca&dt=rw&dt=rm&dt=ss&dt=t&dt=at&ie=UTF-8&oe=UTF-8&otf=2&ssel=0&tsel=0&kc=1&tk=". $tk ;
if ( $method == 'get' ) $url .= "&q=" . $q;
$output = sendHttpRequest($url, $method == 'get' ? 0 : 1, $method == 'get' ? '' : "&q=" . $q, array('User-Agent' => UA));
return $output;
}