mirror of
https://github.com/alchemy-fr/Phraseanet.git
synced 2025-10-24 10:23:17 +00:00

* portage commande searchengine:index vers 4.1 * FIX Indexer * Update DataboxFetcherFactory.php
301 lines
11 KiB
PHP
301 lines
11 KiB
PHP
<?php
|
|
|
|
/*
|
|
* This file is part of Phraseanet
|
|
*
|
|
* (c) 2005-2016 Alchemy
|
|
*
|
|
* For the full copyright and license information, please view the LICENSE
|
|
* file that was distributed with this source code.
|
|
*/
|
|
|
|
namespace Alchemy\Phrasea\Core\Provider;
|
|
|
|
use Alchemy\Phrasea\Core\LazyLocator;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\DataboxFetcherFactory;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\ElasticsearchOptions;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Index;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\IndexLocator;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Search\QueryVisitor;
|
|
use Alchemy\Phrasea\SearchEngine\SearchEngineLogger;
|
|
use Alchemy\Phrasea\Exception\InvalidArgumentException;
|
|
use Alchemy\Phrasea\SearchEngine\SearchEngineInterface;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\ElasticSearchEngine;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Indexer;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\IndexerSubscriber;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Indexer\RecordIndexer;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Indexer\TermIndexer;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\RecordHelper;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Search\Escaper;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Search\FacetsResponse;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Search\QueryContextFactory;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Search\QueryCompiler;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Structure\GlobalStructure;
|
|
use Alchemy\Phrasea\SearchEngine\Elastic\Thesaurus;
|
|
use Elasticsearch\ClientBuilder;
|
|
use Hoa\Compiler;
|
|
use Hoa\File;
|
|
use Monolog\Handler\ErrorLogHandler;
|
|
use Monolog\Handler\RotatingFileHandler;
|
|
use Monolog\Logger;
|
|
use Silex\Application;
|
|
use Silex\ServiceProviderInterface;
|
|
use Symfony\Component\EventDispatcher\EventDispatcherInterface;
|
|
use Symfony\Component\HttpKernel\KernelEvents;
|
|
|
|
class SearchEngineServiceProvider implements ServiceProviderInterface
|
|
{
|
|
public function register(Application $app)
|
|
{
|
|
$this->registerElasticSearchClient($app);
|
|
$this->registerQueryParser($app);
|
|
$this->registerIndexer($app);
|
|
$this->registerSearchEngine($app);
|
|
}
|
|
|
|
public function boot(Application $app)
|
|
{
|
|
}
|
|
|
|
/**
|
|
* @param Application $app
|
|
* @return Application
|
|
*/
|
|
private function registerSearchEngine(Application $app)
|
|
{
|
|
$app['phraseanet.SE'] = function ($app) {
|
|
return $app['search_engine'];
|
|
};
|
|
|
|
$app['phraseanet.SE.logger'] = $app->share(function (Application $app) {
|
|
return new SearchEngineLogger($app);
|
|
});
|
|
|
|
$app['search_engine'] = $app->share(function ($app) {
|
|
$type = $app['conf']->get(['main', 'search-engine', 'type']);
|
|
if ($type !== SearchEngineInterface::TYPE_ELASTICSEARCH) {
|
|
throw new InvalidArgumentException(sprintf('Invalid search engine type "%s".', $type));
|
|
}
|
|
|
|
/** @var ElasticsearchOptions $options */
|
|
$options = $app['elasticsearch.options'];
|
|
|
|
return new ElasticSearchEngine(
|
|
$app,
|
|
$app['search_engine.structure'],
|
|
$app['elasticsearch.client'],
|
|
$app['query_context.factory'],
|
|
$app['elasticsearch.facets_response.factory'],
|
|
$options
|
|
);
|
|
});
|
|
|
|
$app['search_engine.structure'] = $app->share(function (\Alchemy\Phrasea\Application $app) {
|
|
$databoxes = $app->getDataboxes();
|
|
|
|
return GlobalStructure::createFromDataboxes($databoxes);
|
|
});
|
|
|
|
$app['elasticsearch.facets_response.factory'] = $app->protect(function (array $response) use ($app) {
|
|
return new FacetsResponse(new Escaper(), $response, $app['search_engine.structure']);
|
|
});
|
|
|
|
return $app;
|
|
}
|
|
|
|
/**
|
|
* @param Application $app
|
|
* @return Application
|
|
*/
|
|
private function registerIndexer(Application $app)
|
|
{
|
|
/* Indexer related services */
|
|
$app['elasticsearch.index'] = $app->share(function ($app) {
|
|
return new Index($app['elasticsearch.options'], $app['elasticsearch.index.locator']);
|
|
});
|
|
|
|
$app['elasticsearch.index.record'] = $app->share(function ($app) {
|
|
return new Indexer\RecordIndex($app['search_engine.structure'], array_keys($app['locales.available']));
|
|
});
|
|
|
|
$app['elasticsearch.index.term'] = $app->share(function ($app) {
|
|
return new Indexer\TermIndex(array_keys($app['locales.available']));
|
|
});
|
|
|
|
$app['elasticsearch.index.locator'] = $app->share(function ($app) {
|
|
return new IndexLocator($app, 'elasticsearch.index.record', 'elasticsearch.index.term');
|
|
});
|
|
|
|
$app['elasticsearch.indexer'] = $app->share(function ($app) {
|
|
return new Indexer(
|
|
$app['elasticsearch.client'],
|
|
$app['elasticsearch.index'],
|
|
$app['elasticsearch.indexer.term_indexer'],
|
|
$app['elasticsearch.indexer.record_indexer'],
|
|
$app['monolog']
|
|
);
|
|
});
|
|
|
|
$app['elasticsearch.indexer.term_indexer'] = $app->share(function ($app) {
|
|
return new TermIndexer(
|
|
$app['phraseanet.appbox'],
|
|
$app['monolog']
|
|
);
|
|
});
|
|
|
|
$app['elasticsearch.indexer.databox_fetcher_factory'] = $app->share(function ($app) {
|
|
return new DataboxFetcherFactory(
|
|
$app['elasticsearch.record_helper'],
|
|
$app['elasticsearch.options'],
|
|
$app,
|
|
'search_engine.structure',
|
|
'thesaurus'
|
|
);
|
|
});
|
|
|
|
$app['elasticsearch.indexer.record_indexer'] = $app->share(function ($app) {
|
|
// TODO Use upcoming monolog factory
|
|
$logger = new Logger('indexer');
|
|
$logger->pushHandler(new ErrorLogHandler());
|
|
|
|
return new RecordIndexer(
|
|
$app['elasticsearch.indexer.databox_fetcher_factory'],
|
|
$app['elasticsearch.record_helper'],
|
|
$app['dispatcher'],
|
|
$app['monolog']
|
|
);
|
|
});
|
|
|
|
$app['elasticsearch.record_helper'] = $app->share(function ($app) {
|
|
return new RecordHelper($app['phraseanet.appbox']);
|
|
});
|
|
|
|
$app['dispatcher'] = $app
|
|
->share($app->extend('dispatcher', function (EventDispatcherInterface $dispatcher, $app) {
|
|
$subscriber = new IndexerSubscriber(new LazyLocator($app, 'elasticsearch.indexer'));
|
|
|
|
$dispatcher->addSubscriber($subscriber);
|
|
|
|
$listener = array($subscriber, 'flushQueue');
|
|
|
|
// Add synchronous flush when used in CLI.
|
|
if (isset($app['console'])) {
|
|
foreach (array_keys($subscriber->getSubscribedEvents()) as $eventName) {
|
|
$dispatcher->addListener($eventName, $listener, -10);
|
|
}
|
|
|
|
return $dispatcher;
|
|
}
|
|
|
|
$dispatcher->addListener(KernelEvents::TERMINATE, $listener);
|
|
|
|
return $dispatcher;
|
|
}));
|
|
|
|
return $app;
|
|
}
|
|
|
|
/**
|
|
* @param Application $app
|
|
* @return Application
|
|
*/
|
|
private function registerElasticSearchClient(Application $app)
|
|
{
|
|
/* Low-level elasticsearch services */
|
|
$app['elasticsearch.client'] = $app->share(function ($app) {
|
|
/** @var ElasticsearchOptions $options */
|
|
$options = $app['elasticsearch.options'];
|
|
$clientParams = ['hosts' => [sprintf('%s:%s', $options->getHost(), $options->getPort())]];
|
|
|
|
// Create file logger for debug
|
|
if ($app['debug']) {
|
|
/** @var Logger $logger */
|
|
$logger = new $app['monolog.logger.class']('search logger');
|
|
$logger->pushHandler(new RotatingFileHandler($app['log.path'] . DIRECTORY_SEPARATOR . 'elasticsearch.log',
|
|
2, Logger::INFO));
|
|
|
|
$clientParams['logObject'] = $logger;
|
|
$clientParams['logging'] = true;
|
|
}
|
|
|
|
$clientBuilder = ClientBuilder::create()
|
|
->setHosts($clientParams['hosts']);
|
|
if(array_key_exists('logObject', $clientParams)) {
|
|
$clientBuilder->setLogger($clientParams['logObject']);
|
|
}
|
|
|
|
return $clientBuilder->build();
|
|
});
|
|
|
|
$app['elasticsearch.options'] = $app->share(function ($app) {
|
|
$options = ElasticsearchOptions::fromArray($app['conf']->get(['main', 'search-engine', 'options'], []));
|
|
|
|
if (empty($options->getIndexName())) {
|
|
$options->setIndexName(strtolower(sprintf('phraseanet_%s', str_replace(
|
|
array('/', '.'), array('', ''),
|
|
$app['conf']->get(['main', 'key'])
|
|
))));
|
|
}
|
|
|
|
return $options;
|
|
});
|
|
|
|
return $app;
|
|
}
|
|
|
|
/**
|
|
* @param Application $app
|
|
*/
|
|
private function registerQueryParser(Application $app)
|
|
{
|
|
/* Querying helper services */
|
|
$app['thesaurus'] = $app->share(function ($app) {
|
|
$logger = new Logger('thesaurus');
|
|
$logger->pushHandler(new ErrorLogHandler(
|
|
ErrorLogHandler::OPERATING_SYSTEM,
|
|
$app['debug'] ? Logger::DEBUG : Logger::ERROR
|
|
));
|
|
|
|
return new Thesaurus(
|
|
$app['elasticsearch.client'],
|
|
$app['elasticsearch.options'],
|
|
$logger
|
|
);
|
|
});
|
|
|
|
$app['query_context.factory'] = $app->share(function ($app) {
|
|
return new QueryContextFactory(
|
|
$app['search_engine.structure'],
|
|
array_keys($app['locales.available']),
|
|
$app['locale']
|
|
);
|
|
});
|
|
|
|
$app['query_parser.grammar_path'] = function ($app) {
|
|
$configPath = ['registry', 'searchengine', 'query-grammar-path'];
|
|
$grammarPath = $app['conf']->get($configPath, 'grammar/query.pp');
|
|
$projectRoot = '../../../../..';
|
|
|
|
return realpath(implode('/', [__DIR__, $projectRoot, $grammarPath]));
|
|
};
|
|
|
|
$app['query_parser'] = $app->share(function ($app) {
|
|
$grammarPath = $app['query_parser.grammar_path'];
|
|
|
|
return Compiler\Llk\Llk::load(new File\Read($grammarPath));
|
|
});
|
|
|
|
$app['query_visitor.factory'] = $app->protect(function () use ($app) {
|
|
return new QueryVisitor($app['search_engine.structure']);
|
|
});
|
|
|
|
$app['query_compiler'] = $app->share(function ($app) {
|
|
return new QueryCompiler(
|
|
$app['query_parser'],
|
|
$app['query_visitor.factory'],
|
|
$app['thesaurus']
|
|
);
|
|
});
|
|
}
|
|
}
|