be9704a768
TODO: add files to database TODO: hash folder to stick files in
307 lines
No EOL
7.4 KiB
PHP
307 lines
No EOL
7.4 KiB
PHP
<?php
|
|
/*
|
|
Ryzom Core Web-Based Translation Tool
|
|
Copyright (C) 2011 Piotr Kaczmarek <p.kaczmarek@openlink.pl>
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
?>
|
|
<?php
|
|
class PhraseParser
|
|
{
|
|
var $debug = false;
|
|
|
|
function removeComments($str)
|
|
{
|
|
//As a pertinent note, there's an issue with this function where parsing any string longer than 94326 characters long will silently return null. So be careful where you use it at.
|
|
//http://pl.php.net/manual/en/function.preg-replace.php#98843
|
|
ini_set('pcre.backtrack_limit', 10000000);
|
|
//$returnString = preg_replace('!/\*.*?\*/!s', '', $str); // /* .*? */ s
|
|
// added [^/] because there was //******* in translation file
|
|
$returnString = preg_replace('![^/]/\*.*?\*/!s', '', $str); // /* .*? */ s
|
|
// PHP 5.2.0
|
|
// if (PREG_NO_ERROR !== preg_last_error())
|
|
if ($returnString === null)
|
|
{
|
|
$returnStr = $str;
|
|
var_dump("PREG ERROR");
|
|
// exception
|
|
}
|
|
return $returnString;
|
|
}
|
|
|
|
function removeBOM($str)
|
|
{
|
|
if(($bom = substr($str, 0,3)) == pack("CCC",0xef,0xbb,0xbf))
|
|
{
|
|
$bla = substr($str, 3);
|
|
return $bla;
|
|
}
|
|
else
|
|
{
|
|
return $str;
|
|
}
|
|
}
|
|
|
|
function addBOM($str)
|
|
{
|
|
if(($bom = substr($str, 0,3)) != pack("CCC",0xef,0xbb,0xbf))
|
|
return pack("CCC",0xef,0xbb,0xbf) . $str;
|
|
else
|
|
return $str;
|
|
}
|
|
|
|
function parseLine($str)
|
|
{
|
|
$arr = array();
|
|
if (mb_substr($str, 0, 2) == "//")
|
|
{
|
|
if (mb_substr($str, 0, 7) == "// DIFF")
|
|
{
|
|
$tmp = explode(" ", $str);
|
|
$type = 'diff';
|
|
$command = mb_strtolower($tmp[2]);
|
|
$args = isset($tmp[3]) ? $tmp[3] : null;
|
|
if ($command == "add" || $command == "changed")
|
|
{
|
|
if (isset($args))
|
|
$index = intval($args);
|
|
else
|
|
$index = null;
|
|
$command = mb_substr($str, 3);
|
|
}
|
|
else
|
|
unset($type);
|
|
}
|
|
else if (mb_substr($str, 0, 8) == "// INDEX")
|
|
{
|
|
list($j, $type, $index) = explode(" ", $str);
|
|
$type = "internal_index";
|
|
}
|
|
else if (mb_substr($str, 0, 13) == "// HASH_VALUE")
|
|
{
|
|
list($j, $type, $hash_value) = explode(" ", $str);
|
|
$type = "hash_value";
|
|
}
|
|
/* if (!isset($type))
|
|
{
|
|
var_dump(isset($type));
|
|
debug_print_backtrace();
|
|
}
|
|
var_dump($type);*/
|
|
if (isset($type))
|
|
{
|
|
$type = mb_strtolower($type);
|
|
$arr = compact("type","command","index","hash_value");
|
|
}
|
|
}
|
|
else if (!(mb_substr($str, 0, 2) == "//") && mb_strlen($str))
|
|
{
|
|
$type = "string";
|
|
$string = "";
|
|
$identifier = "";
|
|
$arguments = "";
|
|
$body = "";
|
|
if (preg_match('|^([0-9A-Za-z@_]*) \((.*?)\).*$|', $str, $matches))
|
|
{
|
|
$identifier = $matches[1];
|
|
$arguments = $matches[2];
|
|
}
|
|
else if ($str == "{")
|
|
$body = "begin";
|
|
else if ($str == "}")
|
|
$body = "end";
|
|
else
|
|
{
|
|
$string = $str;
|
|
}
|
|
$arr = compact("type", "identifier", "arguments", "string", "body");
|
|
}
|
|
/* echo "<pre>################################\n";
|
|
var_dump($str);
|
|
var_dump($arr);
|
|
echo "</pre>\n";*/
|
|
return $arr;
|
|
}
|
|
|
|
function addEnt(&$parsedEnt, &$entities, &$newEnt)
|
|
{
|
|
if ($this->debug)
|
|
{
|
|
echo "\t%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%\n";
|
|
echo "\t%%%% newEnt %%%%%%%%% newEnt %%%%%%%%% newEnt %%%%%%%%% newEnt %%%%%\n";
|
|
echo "\t%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%\n\n";
|
|
var_dump($parsedEnt);
|
|
}
|
|
if (!isset($parsedEnt["diff"]) && !isset($parsedEnt["index"]))
|
|
$parsedEnt["index"] = $parsedEnt["internal_index"];
|
|
|
|
$parsedEnt["type"] = "phrase";
|
|
$entities[] = $parsedEnt;
|
|
$parsedEnt =array();
|
|
$newEnt = false;
|
|
}
|
|
|
|
function parseFile($file)
|
|
{
|
|
$parsedEnt = array();
|
|
$newEnt = false;
|
|
$prevStringLine = false;
|
|
$entities = array();
|
|
|
|
$file = $this->removeBOM($file);
|
|
// var_dump($file);
|
|
$file = $this->removeComments($file);
|
|
// var_dump($file);
|
|
$lines = explode("\n", $file);
|
|
if ($this->debug)
|
|
{
|
|
echo "<pre>\n\n";
|
|
}
|
|
$line_no=1;
|
|
foreach ($lines as $line)
|
|
{
|
|
if ($this->debug)
|
|
{
|
|
echo "\n\t#################### LINE NUMBER " . $line_no++ . "\n\n";
|
|
var_dump($line);
|
|
}
|
|
|
|
$line = rtrim($line, "\r\n");
|
|
$parsedLine = $this->parseLine($line);
|
|
|
|
if ($this->debug)
|
|
{
|
|
echo "%%%% parsedLine\n";
|
|
var_dump($parsedLine);
|
|
echo "\n";
|
|
|
|
echo "%%%% prevStringLine\n";
|
|
var_dump($prevStringLine);
|
|
echo "\n";
|
|
}
|
|
|
|
if (!$parsedLine)
|
|
continue;
|
|
|
|
// if line start with diff (diff files) or hash_value (translated files) and before was line with translation, then we start new ent
|
|
|
|
if ($prevStringLine && (
|
|
($parsedLine["type"] == "diff" && $parsedEnt) || ($parsedLine["type"] == "hash_value" && $parsedEnt)
|
|
))
|
|
{
|
|
/* echo "%%%% prevStringLine %%%%%\n";
|
|
var_dump($parsedEnt);*/
|
|
$newEnt = true;
|
|
}
|
|
|
|
if ($newEnt)
|
|
{
|
|
$this->addEnt($parsedEnt, $entities, $newEnt);
|
|
}
|
|
|
|
if ($parsedLine["type"] == "internal_index")
|
|
$parsedEnt["internal_index"] = $parsedLine["index"];
|
|
|
|
if ($parsedLine["type"] == "string")
|
|
{
|
|
$prevStringLine = true;
|
|
|
|
if ($parsedLine["body"] == "begin" || $parsedLine["body"] == "end")
|
|
continue;
|
|
|
|
if ($this->debug)
|
|
{
|
|
echo "%%%% parsedEnt before %%%%%\n";
|
|
var_dump($parsedEnt);
|
|
|
|
// echo "%%%% parsedLine %%%%%\n";
|
|
// var_dump($parsedLine);
|
|
}
|
|
|
|
if (!$parsedLine['identifier'])
|
|
{
|
|
if ($this->debug) echo "%%%% parsedEnt ZLACZENIE \n";
|
|
if ($this->debug && !isset($parsedEnt['string']))
|
|
{
|
|
echo "!isset parsedEnt['string']\n";
|
|
var_dump($line);
|
|
var_dump($parsedEnt);
|
|
var_dump($parsedLine);
|
|
}
|
|
$parsedEnt['string'] .= $parsedLine['string'] . "\n";
|
|
}
|
|
else
|
|
{
|
|
if ($this->debug) echo "DODANIE \n";
|
|
$parsedEnt += $parsedLine;
|
|
// $parsedEnt['string'] .= "\n";
|
|
}
|
|
|
|
if ($this->debug)
|
|
{
|
|
echo "%%%% parsedEnt after %%%%%\n";
|
|
var_dump($parsedEnt);
|
|
}
|
|
}
|
|
else
|
|
$prevStringLine = false;
|
|
|
|
if ($parsedLine["type"] == "diff")
|
|
{
|
|
$parsedEnt["diff"] = $parsedEnt["command"] = $parsedLine["command"];
|
|
$parsedEnt["index"] = $parsedLine["index"];
|
|
}
|
|
}
|
|
if ($parsedEnt)
|
|
{
|
|
$this->addEnt($parsedEnt, $entities, $newEnt);
|
|
}
|
|
|
|
if ($this->debug)
|
|
{
|
|
echo "<pre>";
|
|
var_dump($entities);
|
|
echo "</pre>\n";
|
|
}
|
|
return $entities;
|
|
}
|
|
|
|
function CRLF($s)
|
|
{
|
|
$s = str_replace("\r\n", "\n", $s);
|
|
$s = str_replace("\n", "\r\n", $s);
|
|
return $s;
|
|
}
|
|
|
|
function buildFile($entities)
|
|
{
|
|
$content = '// DIFF_VERSION 2' . "\n";
|
|
foreach ($entities as $ent)
|
|
{
|
|
if (isset($ent['command']))
|
|
$content .= '// ' . $ent['command'] . "\n";
|
|
if (isset($ent['hash_value']))
|
|
$content .= '// HASH_VALUE ' . $ent['hash_value'];
|
|
/* if (isset($ent['command']))
|
|
$content .= '// INDEX ' . $ent['internal_index'] . "\n";
|
|
else
|
|
$content .= '// INDEX ' . $ent['index'] . "\n";*/
|
|
$content .= $ent['identifier'] . ' (' . $ent['arguments'] . ')' . "\n" . '{' . "\n" . $ent['string'] . "\n" . '}' . "\n";
|
|
$content .= "\n";
|
|
}
|
|
return $this->addBOM($this->CRLF($content));
|
|
}
|
|
}
|
|
?>
|