mirror of
https://github.com/alchemy-fr/Phraseanet.git
synced 2025-10-13 21:13:26 +00:00
Fix CS
This commit is contained in:
@@ -25,138 +25,126 @@ use Symfony\Component\Console\Command\Command;
|
||||
class module_console_sphinxGenerateSuggestion extends Command
|
||||
{
|
||||
|
||||
public function __construct($name = null)
|
||||
{
|
||||
parent::__construct($name);
|
||||
|
||||
$this->setDescription('Generate suggestions for Sphinx Search Engine');
|
||||
|
||||
|
||||
return $this;
|
||||
}
|
||||
|
||||
public function execute(InputInterface $input, OutputInterface $output)
|
||||
{
|
||||
define('FREQ_THRESHOLD', 10);
|
||||
define('SUGGEST_DEBUG', 0);
|
||||
|
||||
$appbox = \appbox::get_instance(\bootstrap::getCore());
|
||||
$registry = $appbox->get_registry();
|
||||
|
||||
$params = phrasea::sbas_params();
|
||||
|
||||
foreach ($params as $sbas_id => $p)
|
||||
public function __construct($name = null)
|
||||
{
|
||||
$index = crc32(
|
||||
str_replace(
|
||||
array('.', '%')
|
||||
, '_'
|
||||
, sprintf('%s_%s_%s_%s', $p['host'], $p['port'], $p['user'], $p['dbname'])
|
||||
)
|
||||
);
|
||||
parent::__construct($name);
|
||||
|
||||
$tmp_file = $registry->get('GV_RootPath') . 'tmp/dict' . $index . '.txt';
|
||||
$this->setDescription('Generate suggestions for Sphinx Search Engine');
|
||||
|
||||
$databox = databox::get_instance($sbas_id);
|
||||
|
||||
$output->writeln("process Databox " . $databox->get_viewname() . " / $index\n");
|
||||
|
||||
if(!is_executable("/usr/local/bin/indexer"))
|
||||
{
|
||||
$output->writeln("<error>'/usr/local/bin/indexer' is not executable</error>");
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
if(!file_exists($tmp_file))
|
||||
{
|
||||
$output->writeln("<error> file '".$tmp_file."' does not exist</error>");
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
$cmd = '/usr/local/bin/indexer metadatas' . $index . ' --buildstops ' . $tmp_file . ' 1000000 --buildfreqs';
|
||||
exec($cmd);
|
||||
|
||||
try
|
||||
{
|
||||
$connbas = connection::getPDOConnection($sbas_id);
|
||||
}
|
||||
catch (Exception $e)
|
||||
{
|
||||
continue;
|
||||
}
|
||||
|
||||
$sql = 'TRUNCATE suggest';
|
||||
$stmt = $connbas->prepare($sql);
|
||||
$stmt->execute();
|
||||
$stmt->closeCursor();
|
||||
|
||||
$sql = $this->BuildDictionarySQL($output, file_get_contents($tmp_file));
|
||||
|
||||
if (trim($sql) !== '')
|
||||
{
|
||||
$stmt = $connbas->prepare($sql);
|
||||
$stmt->execute();
|
||||
$stmt->closeCursor();
|
||||
}
|
||||
|
||||
unlink($tmp_file);
|
||||
return $this;
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
protected function BuildTrigrams($keyword)
|
||||
{
|
||||
$t = "__" . $keyword . "__";
|
||||
|
||||
$trigrams = "";
|
||||
for ($i = 0; $i < strlen($t) - 2; $i++)
|
||||
$trigrams .= substr($t, $i, 3) . " ";
|
||||
|
||||
return $trigrams;
|
||||
}
|
||||
|
||||
protected function BuildDictionarySQL(OutputInterface $output, $in)
|
||||
{
|
||||
$out = '';
|
||||
|
||||
$n = 0;
|
||||
$lines = explode("\n", $in);
|
||||
foreach ($lines as $line)
|
||||
public function execute(InputInterface $input, OutputInterface $output)
|
||||
{
|
||||
if (trim($line) === '')
|
||||
continue;
|
||||
list ( $keyword, $freq ) = explode(" ", trim($line));
|
||||
define('FREQ_THRESHOLD', 10);
|
||||
define('SUGGEST_DEBUG', 0);
|
||||
|
||||
if ($freq < FREQ_THRESHOLD || strstr($keyword, "_") !== false || strstr($keyword, "'") !== false)
|
||||
continue;
|
||||
$appbox = \appbox::get_instance(\bootstrap::getCore());
|
||||
$registry = $appbox->get_registry();
|
||||
|
||||
if (ctype_digit($keyword))
|
||||
{
|
||||
continue;
|
||||
}
|
||||
if (mb_strlen($keyword) < 3)
|
||||
{
|
||||
continue;
|
||||
}
|
||||
$params = phrasea::sbas_params();
|
||||
|
||||
$trigrams = $this->BuildTrigrams($keyword);
|
||||
foreach ($params as $sbas_id => $p) {
|
||||
$index = crc32(
|
||||
str_replace(
|
||||
array('.', '%')
|
||||
, '_'
|
||||
, sprintf('%s_%s_%s_%s', $p['host'], $p['port'], $p['user'], $p['dbname'])
|
||||
)
|
||||
);
|
||||
|
||||
if ($n++)
|
||||
$out .= ",\n";
|
||||
$out .= "( $n, '$keyword', '$trigrams', $freq )";
|
||||
$tmp_file = $registry->get('GV_RootPath') . 'tmp/dict' . $index . '.txt';
|
||||
|
||||
$databox = databox::get_instance($sbas_id);
|
||||
|
||||
$output->writeln("process Databox " . $databox->get_viewname() . " / $index\n");
|
||||
|
||||
if ( ! is_executable("/usr/local/bin/indexer")) {
|
||||
$output->writeln("<error>'/usr/local/bin/indexer' is not executable</error>");
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
if ( ! file_exists($tmp_file)) {
|
||||
$output->writeln("<error> file '" . $tmp_file . "' does not exist</error>");
|
||||
|
||||
return 1;
|
||||
}
|
||||
|
||||
$cmd = '/usr/local/bin/indexer metadatas' . $index . ' --buildstops ' . $tmp_file . ' 1000000 --buildfreqs';
|
||||
exec($cmd);
|
||||
|
||||
try {
|
||||
$connbas = connection::getPDOConnection($sbas_id);
|
||||
} catch (Exception $e) {
|
||||
continue;
|
||||
}
|
||||
|
||||
$sql = 'TRUNCATE suggest';
|
||||
$stmt = $connbas->prepare($sql);
|
||||
$stmt->execute();
|
||||
$stmt->closeCursor();
|
||||
|
||||
$sql = $this->BuildDictionarySQL($output, file_get_contents($tmp_file));
|
||||
|
||||
if (trim($sql) !== '') {
|
||||
$stmt = $connbas->prepare($sql);
|
||||
$stmt->execute();
|
||||
$stmt->closeCursor();
|
||||
}
|
||||
|
||||
unlink($tmp_file);
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
if (trim($out) !== '')
|
||||
protected function BuildTrigrams($keyword)
|
||||
{
|
||||
$out = "INSERT INTO suggest VALUES " . $out . ";";
|
||||
$t = "__" . $keyword . "__";
|
||||
|
||||
$trigrams = "";
|
||||
for ($i = 0; $i < strlen($t) - 2; $i ++ )
|
||||
$trigrams .= substr($t, $i, 3) . " ";
|
||||
|
||||
return $trigrams;
|
||||
}
|
||||
|
||||
$output->writeln(sprintf("Generated <info>%d</info> suggestions", $n));
|
||||
protected function BuildDictionarySQL(OutputInterface $output, $in)
|
||||
{
|
||||
$out = '';
|
||||
|
||||
return $out;
|
||||
}
|
||||
$n = 0;
|
||||
$lines = explode("\n", $in);
|
||||
foreach ($lines as $line) {
|
||||
if (trim($line) === '')
|
||||
continue;
|
||||
list ( $keyword, $freq ) = explode(" ", trim($line));
|
||||
|
||||
if ($freq < FREQ_THRESHOLD || strstr($keyword, "_") !== false || strstr($keyword, "'") !== false)
|
||||
continue;
|
||||
|
||||
if (ctype_digit($keyword)) {
|
||||
continue;
|
||||
}
|
||||
if (mb_strlen($keyword) < 3) {
|
||||
continue;
|
||||
}
|
||||
|
||||
$trigrams = $this->BuildTrigrams($keyword);
|
||||
|
||||
if ($n ++)
|
||||
$out .= ",\n";
|
||||
$out .= "( $n, '$keyword', '$trigrams', $freq )";
|
||||
}
|
||||
|
||||
if (trim($out) !== '') {
|
||||
$out = "INSERT INTO suggest VALUES " . $out . ";";
|
||||
}
|
||||
|
||||
$output->writeln(sprintf("Generated <info>%d</info> suggestions", $n));
|
||||
|
||||
return $out;
|
||||
}
|
||||
}
|
||||
|
Reference in New Issue
Block a user