Files
Phraseanet/lib/Alchemy/Phrasea/SearchEngine/SearchEngineOptions.php
2016-06-28 13:12:58 +02:00

749 lines
20 KiB
PHP

<?php
/*
* This file is part of Phraseanet
*
* (c) 2005-2016 Alchemy
*
* For the full copyright and license information, please view the LICENSE
* file that was distributed with this source code.
*/
namespace Alchemy\Phrasea\SearchEngine;
use Alchemy\Phrasea\Application;
use Alchemy\Phrasea\Authentication\ACLProvider;
use Alchemy\Phrasea\Authentication\Authenticator;
use Alchemy\Phrasea\Collection\CollectionRepository;
use Alchemy\Phrasea\Collection\Reference\CollectionReferenceCollection;
use Assert\Assertion;
use Symfony\Component\HttpFoundation\Request;
use Symfony\Component\HttpKernel\Exception\BadRequestHttpException;
/**
 * Value object holding every option of a search query: targeted collections,
 * searched fields, record/search type filters, date range, locale, stemming,
 * sorting and pagination.
 *
 * Instances can be built from an HTTP request (fromRequest()), converted to a
 * JSON string (serialize()) and rebuilt from that string (hydrate()).
 */
class SearchEngineOptions
{
    // Search types. setSearchType() stores RECORD_STORY as RECORD_GROUPING.
    const RECORD_RECORD = 0;
    const RECORD_GROUPING = 1;
    const RECORD_STORY = 2;

    // Record types. TYPE_ALL is the default and the fallback used by
    // setRecordType() for any value it does not recognise.
    const TYPE_IMAGE = 'image';
    const TYPE_VIDEO = 'video';
    const TYPE_AUDIO = 'audio';
    const TYPE_DOCUMENT = 'document';
    const TYPE_FLASH = 'flash';
    const TYPE_UNKNOWN = 'unknown';
    const TYPE_ALL = '';

    // Sort criterion identifiers.
    const SORT_RELEVANCE = 'relevance';
    const SORT_CREATED_ON = 'created_on';
    const SORT_RANDOM = 'random';

    // Sort direction identifiers.
    const SORT_MODE_ASC = 'asc';
    const SORT_MODE_DESC = 'desc';

    /**
     * Names of the properties written by serialize(), in output order.
     * Every name must have a matching entry in the map used by hydrate().
     *
     * @var string[]
     */
    private static $serializable_properties = [
        'record_type',
        'search_type',
        'collections',
        'fields',
        'status',
        'date_min',
        'date_max',
        'date_fields',
        'i18n',
        'stemming',
        'sort_by',
        'sort_ord',
        'business_fields',
        'max_results',
        'first_result',
    ];

    /**
     * Builds the map "serialized key => callable" used by hydrate().
     *
     * Each callable receives the decoded value and the options instance being
     * rebuilt: function ($value, SearchEngineOptions $options).
     *
     * @param Application $app
     * @return callable[]
     */
    private static function getHydrateMethods(Application $app)
    {
        // Turns "<databoxId>_<fieldId>" strings (see serialize()) back into field objects.
        $fieldNormalizer = function ($value) use ($app) {
            return array_map(function ($serialized) use ($app) {
                $data = explode('_', $serialized, 2);

                return $app->findDataboxById($data[0])->get_meta_structure()->get_element($data[1]);
            }, $value);
        };

        // Turns a list of base ids back into collection objects indexed by base id.
        $collectionNormalizer = function ($value) use ($app) {
            $references = new CollectionReferenceCollection($app['repo.collection-references']->findMany($value));
            $collections = [];

            foreach ($references->groupByDataboxIdAndCollectionId() as $databoxId => $indexes) {
                /** @var CollectionRepository $repository */
                $repository = $app['repo.collections-registry']->getRepositoryByDatabox($databoxId);

                foreach ($indexes as $collectionId => $index) {
                    $coll = $repository->find($collectionId);

                    // Skip collections the repository could not resolve instead of
                    // calling a method on null; fromRequest() ignores unknown
                    // collections the same way.
                    if (null === $coll) {
                        continue;
                    }

                    $collections[$coll->get_base_id()] = $coll;
                }
            }

            return $collections;
        };

        // Parses a date written by serialize() (DATE_ATOM); empty values mean "no bound".
        $dateNormalizer = function ($value) {
            if (!$value) {
                return null;
            }

            $date = \DateTime::createFromFormat(DATE_ATOM, $value);

            // createFromFormat() returns false on failure, which the \DateTime
            // type hint of the date setters would reject.
            if (false === $date) {
                throw new \InvalidArgumentException('SearchEngineOptions data are corrupted');
            }

            return $date;
        };

        // Wraps a plain setter name into a hydrate callable.
        $optionSetter = function ($setter) {
            return function ($value, SearchEngineOptions $options) use ($setter) {
                $options->{$setter}($value);
            };
        };

        return [
            'record_type' => $optionSetter('setRecordType'),
            'search_type' => $optionSetter('setSearchType'),
            'status' => $optionSetter('setStatus'),
            'date_min' => function ($value, SearchEngineOptions $options) use ($dateNormalizer) {
                $options->setMinDate($dateNormalizer($value));
            },
            'date_max' => function ($value, SearchEngineOptions $options) use ($dateNormalizer) {
                $options->setMaxDate($dateNormalizer($value));
            },
            'i18n' => function ($value, SearchEngineOptions $options) {
                if ($value) {
                    $options->setLocale($value);
                }
            },
            'stemming' => $optionSetter('setStemming'),
            'date_fields' => function ($value, SearchEngineOptions $options) use ($fieldNormalizer) {
                $options->setDateFields($fieldNormalizer($value));
            },
            'fields' => function ($value, SearchEngineOptions $options) use ($fieldNormalizer) {
                $options->setFields($fieldNormalizer($value));
            },
            'collections' => function ($value, SearchEngineOptions $options) use ($collectionNormalizer) {
                $options->onCollections($collectionNormalizer($value));
            },
            'business_fields' => function ($value, SearchEngineOptions $options) use ($collectionNormalizer) {
                $options->allowBusinessFieldsOn($collectionNormalizer($value));
            },
            'first_result' => $optionSetter('setFirstResult'),
            'max_results' => $optionSetter('setMaxResults'),
        ];
    }

    /**
     * Resolves field names against the meta structure of each databox.
     *
     * Names that a databox cannot resolve (exception or empty result) are
     * skipped for that databox.
     *
     * @param \databox[] $databoxes
     * @param string[]   $names
     * @return \databox_field[]
     */
    private static function findFieldsByName(array $databoxes, array $names)
    {
        $found = [];

        foreach ($databoxes as $databox) {
            $metaStructure = $databox->get_meta_structure();

            foreach ($names as $name) {
                try {
                    $field = $metaStructure->get_element_by_name($name);
                } catch (\Exception $e) {
                    continue;
                }

                if ($field) {
                    $found[] = $field;
                }
            }
        }

        return $found;
    }

    /**
     * Parses a "Y/m/d" request parameter into a date at the given time of day.
     *
     * @param mixed  $value     Raw request value; empty values mean "no bound"
     * @param string $time      Time of day appended to the date ("H:i:s")
     * @param string $parameter Request parameter name, used in the error message
     * @return \DateTime|null
     *
     * @throws BadRequestHttpException When the value is not a valid "Y/m/d" date
     */
    private static function createDateFromRequest($value, $time, $parameter)
    {
        if (!$value) {
            return null;
        }

        $date = is_scalar($value) ? \DateTime::createFromFormat('Y/m/d H:i:s', $value . ' ' . $time) : false;

        if (false === $date) {
            throw new BadRequestHttpException(sprintf('Invalid `%s` parameter, expected format is Y/m/d', $parameter));
        }

        return $date;
    }

    /** @var string One of the TYPE_* constants */
    protected $record_type = self::TYPE_ALL;

    /** @var int RECORD_RECORD or RECORD_GROUPING (see setSearchType()) */
    protected $search_type = self::RECORD_RECORD;

    /** @var \collection[] */
    protected $collections = [];

    /** @var null|\databox[] Computed lazily by getDataboxes(), reset by onCollections() */
    private $databoxes;

    /** @var \databox_field[] */
    protected $fields = [];

    /** @var array */
    protected $status = [];

    /** @var \DateTime|null */
    protected $date_min;

    /** @var \DateTime|null */
    protected $date_max;

    /** @var \databox_field[] */
    protected $date_fields = [];

    /** @var string */
    protected $i18n;

    /** @var bool */
    protected $stemming = true;

    /** @var string */
    protected $sort_by;

    /** @var string */
    protected $sort_ord = self::SORT_MODE_DESC;

    /** @var \collection[] Collections on which business fields may be searched */
    protected $business_fields = [];

    /**
     * @var int
     */
    private $max_results = 10;

    /**
     * @var int
     */
    private $first_result = 0;

    /**
     * Defines locale code to use for query
     *
     * NOTE(review): the validation pattern is not anchored, so any non-empty
     * value containing two consecutive lowercase ASCII letters is accepted.
     * It is left as is because tightening it could reject locales currently
     * passed by callers.
     *
     * @param string $locale An i18n locale code
     * @return $this
     *
     * @throws \InvalidArgumentException When a non-empty locale fails the check
     */
    public function setLocale($locale)
    {
        if ($locale && !preg_match('/[a-z]{2,3}/', $locale)) {
            throw new \InvalidArgumentException('Locale must be a valid i18n code');
        }

        $this->i18n = $locale;

        return $this;
    }

    /**
     * Returns the locale value
     *
     * @return string
     */
    public function getLocale()
    {
        return $this->i18n;
    }

    /**
     * Sets the sort criterion and direction. Values are stored without validation.
     *
     * @param string $sort_by
     * @param string $sort_ord
     * @return $this
     */
    public function setSort($sort_by, $sort_ord = self::SORT_MODE_DESC)
    {
        $this->sort_by = $sort_by;
        $this->sort_ord = $sort_ord;

        return $this;
    }

    /**
     * Allows business fields query on the given collections
     *
     * @param \collection[] $collection An array of collection
     * @return $this
     */
    public function allowBusinessFieldsOn(array $collection)
    {
        $this->business_fields = $collection;

        return $this;
    }

    /**
     * Reset business fields settings
     *
     * @return $this
     */
    public function disallowBusinessFields()
    {
        $this->business_fields = [];

        return $this;
    }

    /**
     * Returns an array of collection on which business fields are allowed to
     * search on
     *
     * @return \collection[] An array of collection
     */
    public function getBusinessFieldsOn()
    {
        return $this->business_fields;
    }

    /**
     * Returns the sort criteria
     *
     * @return string
     */
    public function getSortBy()
    {
        return $this->sort_by;
    }

    /**
     * Returns the sort order
     *
     * @return string
     */
    public function getSortOrder()
    {
        return $this->sort_ord;
    }

    /**
     * Tells whether to use stemming or not
     *
     * @param boolean $boolean Any value; it is cast to a boolean
     * @return $this
     */
    public function setStemming($boolean)
    {
        $this->stemming = (bool) $boolean;

        return $this;
    }

    /**
     * Returns whether the use of stemming is enabled or not
     *
     * @return boolean
     */
    public function isStemmed()
    {
        return $this->stemming;
    }

    /**
     * Set document type to search for
     *
     * RECORD_GROUPING and RECORD_STORY are both stored as RECORD_GROUPING;
     * every other value is stored as RECORD_RECORD. The switch compares
     * loosely, so numeric strings coming from a request are matched too.
     *
     * @param int $search_type
     * @return $this
     */
    public function setSearchType($search_type)
    {
        switch ($search_type) {
            case self::RECORD_RECORD:
            default:
                $this->search_type = self::RECORD_RECORD;
                break;
            case self::RECORD_GROUPING:
            case self::RECORD_STORY:
                $this->search_type = self::RECORD_GROUPING;
                break;
        }

        return $this;
    }

    /**
     * Returns the type of documents type to search for
     *
     * @return int
     */
    public function getSearchType()
    {
        return $this->search_type;
    }

    /**
     * Set the collections where to search for
     *
     * @param \collection[] $collections An array of collection
     * @return $this
     */
    public function onCollections(array $collections)
    {
        $this->collections = $collections;
        // Defer databox retrieval
        $this->databoxes = null;

        return $this;
    }

    /**
     * Returns the collections on which the search occurs
     *
     * @return \collection[] An array of collection
     */
    public function getCollections()
    {
        return $this->collections;
    }

    /**
     * Returns an array containing all the databoxes where the search will
     * happen
     *
     * The list is derived from the current collections (one entry per
     * distinct sbas id) and cached until onCollections() is called again.
     *
     * @return \databox[]
     */
    public function getDataboxes()
    {
        if (null === $this->databoxes) {
            $databoxes = [];

            foreach ($this->collections as $collection) {
                $databoxes[$collection->get_databox()->get_sbas_id()] = $collection->get_databox();
            }

            $this->databoxes = array_values($databoxes);
        }

        return $this->databoxes;
    }

    /**
     * @param \databox_field[] $fields An array of Databox fields
     * @return $this
     */
    public function setFields(array $fields)
    {
        $this->fields = $fields;

        return $this;
    }

    /**
     * @return \databox_field[]
     */
    public function getFields()
    {
        return $this->fields;
    }

    /**
     * @param array $status
     * @return $this
     */
    public function setStatus(array $status)
    {
        $this->status = $status;

        return $this;
    }

    /**
     * @return array
     */
    public function getStatus()
    {
        return $this->status;
    }

    /**
     * Sets the record type filter; unrecognised values fall back to TYPE_ALL.
     *
     * @param string $record_type One of the TYPE_* constants
     * @return $this
     */
    public function setRecordType($record_type)
    {
        switch ($record_type) {
            case self::TYPE_ALL:
            default:
                $this->record_type = self::TYPE_ALL;
                break;
            case self::TYPE_AUDIO:
                $this->record_type = self::TYPE_AUDIO;
                break;
            case self::TYPE_VIDEO:
                $this->record_type = self::TYPE_VIDEO;
                break;
            case self::TYPE_DOCUMENT:
                $this->record_type = self::TYPE_DOCUMENT;
                break;
            case self::TYPE_FLASH:
                $this->record_type = self::TYPE_FLASH;
                break;
            case self::TYPE_IMAGE:
                $this->record_type = self::TYPE_IMAGE;
                break;
            case self::TYPE_UNKNOWN:
                $this->record_type = self::TYPE_UNKNOWN;
                break;
        }

        return $this;
    }

    /** @return string */
    public function getRecordType()
    {
        return $this->record_type;
    }

    /**
     * Sets the lower bound of the date range; null removes it.
     *
     * @param \DateTime|null $min_date
     * @return $this
     *
     * @throws \LogicException When the date is after the current max date
     */
    public function setMinDate(\DateTime $min_date = null)
    {
        if ($min_date && $this->date_max && $min_date > $this->date_max) {
            throw new \LogicException('Min-date should be before max-date');
        }

        $this->date_min = $min_date;

        return $this;
    }

    /**
     * @return \DateTime|null
     */
    public function getMinDate()
    {
        return $this->date_min;
    }

    /**
     * Sets the upper bound of the date range; null removes it.
     *
     * @param \DateTime|null $max_date
     * @return $this
     *
     * @throws \LogicException When the date is before the current min date
     */
    public function setMaxDate(\DateTime $max_date = null)
    {
        // The guard must look at the current *min* date: checking date_max here
        // let an inverted range through whenever no max date had been set yet.
        if ($max_date && $this->date_min && $max_date < $this->date_min) {
            throw new \LogicException('Min-date should be before max-date');
        }

        $this->date_max = $max_date;

        return $this;
    }

    /** @return \DateTime|null */
    public function getMaxDate()
    {
        return $this->date_max;
    }

    /**
     * @param \databox_field[] $fields
     * @return $this
     */
    public function setDateFields(array $fields)
    {
        $this->date_fields = $fields;

        return $this;
    }

    /** @return \databox_field[] */
    public function getDateFields()
    {
        return $this->date_fields;
    }

    /**
     * Serializes the options listed in $serializable_properties.
     *
     * Dates are written in DATE_ATOM format, fields as "<sbasId>_<fieldId>"
     * and collections as their base id, which is what hydrate() expects.
     *
     * @return string The result of \p4string::jsonencode() on the option map
     */
    public function serialize()
    {
        $ret = [];

        foreach (self::$serializable_properties as $key) {
            $value = $this->{$key};

            if ($value instanceof \DateTime) {
                $value = $value->format(DATE_ATOM);
            }

            if (in_array($key, ['date_fields', 'fields'], true)) {
                $value = array_map(function (\databox_field $field) {
                    return $field->get_databox()->get_sbas_id() . '_' . $field->get_id();
                }, $value);
            }

            if (in_array($key, ['collections', 'business_fields'], true)) {
                $value = array_map(function (\collection $collection) {
                    return $collection->get_base_id();
                }, $value);
            }

            $ret[$key] = $value;
        }

        return \p4string::jsonencode($ret);
    }

    /**
     * Rebuilds options from a string produced by serialize().
     *
     * @param Application $app
     * @param string      $serialized
     *
     * @return static
     *
     * @throws \InvalidArgumentException When the string is not a JSON map or holds an unparsable date
     * @throws \RuntimeException         When the map holds a key that cannot be handled
     * @throws \LogicException           When the stored date range is inverted
     */
    public static function hydrate(Application $app, $serialized)
    {
        $serialized = json_decode($serialized, true);

        if (!is_array($serialized)) {
            throw new \InvalidArgumentException('SearchEngineOptions data are corrupted');
        }

        $options = new static();
        $options->disallowBusinessFields();

        $methods = self::getHydrateMethods($app);

        // Sort criterion and direction are set through a single setter, so both
        // values are collected first and applied once the loop is over.
        $sort_by = null;
        $methods['sort_by'] = function ($value) use (&$sort_by) {
            $sort_by = $value;
        };

        $sort_ord = null;
        $methods['sort_ord'] = function ($value) use (&$sort_ord) {
            $sort_ord = $value;
        };

        // json_decode() ran in associative mode, so values are scalars or arrays.
        foreach ($serialized as $key => $value) {
            if (!isset($methods[$key])) {
                throw new \RuntimeException(sprintf('Unable to handle key `%s`', $key));
            }

            $callable = $methods[$key];
            $callable($value, $options);
        }

        if ($sort_by) {
            if ($sort_ord) {
                $options->setSort($sort_by, $sort_ord);
            } else {
                $options->setSort($sort_by);
            }
        }

        return $options;
    }

    /**
     * Creates options based on a Symfony Request object
     *
     * Request parameters read: bases, status, fields, search_type,
     * record_type, date_min, date_max, date_field, sort, ord, stemme.
     *
     * @param Application $app
     * @param Request     $request
     *
     * @return static
     *
     * @throws BadRequestHttpException When bases were requested but none is usable,
     *                                 or when the date parameters are invalid
     */
    public static function fromRequest(Application $app, Request $request)
    {
        $options = new static();
        $options->disallowBusinessFields();
        $options->setLocale($app['locale']);

        /** @var Authenticator $authenticator */
        $authenticator = $app->getAuthenticator();
        $isAuthenticated = $authenticator->isAuthenticated();

        /** @var ACLProvider $aclProvider */
        $aclProvider = $app['acl'];
        $acl = $isAuthenticated ? $aclProvider->get($authenticator->getUser()) : null;

        $selected_bases = $request->get('bases');

        if (is_array($selected_bases)) {
            $bas = [];

            foreach ($selected_bases as $bas_id) {
                try {
                    $bas[$bas_id] = \collection::getByBaseId($app, $bas_id);
                } catch (\Exception_Databox_CollectionNotFound $e) {
                    // Ignore
                }
            }
        } elseif (!$isAuthenticated) {
            $bas = $app->getOpenCollections();
        } else {
            $bas = $acl->get_granted_base();
        }

        // Filter out not found collections
        $bas = array_filter($bas);

        if ($acl) {
            $filter = function (\collection $collection) use ($acl) {
                return $acl->has_access_to_base($collection->get_base_id());
            };
        } else {
            $openCollections = $app->getOpenCollections();
            // NOTE(review): the comparison is deliberately left loose (object
            // equality); a strict check would require both sources to return
            // the very same instances - confirm before tightening.
            $filter = function (\collection $collection) use ($openCollections) {
                return in_array($collection, $openCollections);
            };
        }

        /** @var \collection[] $bas */
        $bas = array_filter($bas, $filter);

        if (!empty($selected_bases) && empty($bas)) {
            throw new BadRequestHttpException('No collections match your criteria');
        }

        $options->onCollections($bas);

        if ($isAuthenticated && $acl->has_right('modifyrecord')) {
            $bf = array_filter($bas, function (\collection $collection) use ($acl) {
                return $acl->has_right_on_base($collection->get_base_id(), 'canmodifrecord');
            });

            $options->allowBusinessFieldsOn($bf);
        }

        $databoxes = $options->getDataboxes();

        $status = $request->get('status');
        $fields = $request->get('fields');

        if (!is_array($status)) {
            $status = [];
        }
        if (!is_array($fields)) {
            $fields = [];
        }

        if (empty($fields)) {
            // Select all fields (business included)
            foreach ($databoxes as $databox) {
                foreach ($databox->get_meta_structure() as $field) {
                    $fields[] = $field->get_name();
                }
            }

            $fields = array_unique($fields);
        }

        $options->setFields(self::findFieldsByName($databoxes, $fields));
        $options->setStatus($status);
        $options->setSearchType($request->get('search_type'));
        $options->setRecordType($request->get('record_type'));

        // The range covers whole days: from 00:00:00 of the first day to
        // 23:59:59 of the last one.
        $min_date = self::createDateFromRequest($request->get('date_min'), '00:00:00', 'date_min');
        $max_date = self::createDateFromRequest($request->get('date_max'), '23:59:59', 'date_max');

        try {
            $options->setMinDate($min_date);
            $options->setMaxDate($max_date);
        } catch (\LogicException $e) {
            // An inverted range comes from user input: report it as a bad request.
            throw new BadRequestHttpException($e->getMessage(), $e);
        }

        // "date_field" holds field names separated by "|"; the cast keeps
        // explode() from receiving null when the parameter is missing.
        $dateFieldNames = explode('|', (string) $request->get('date_field'));
        $options->setDateFields(self::findFieldsByName($databoxes, $dateFieldNames));

        $options->setSort($request->get('sort'), $request->get('ord', self::SORT_MODE_DESC));
        $options->setStemming((bool) $request->get('stemme'));

        return $options;
    }

    /**
     * Sets the maximum number of results to return.
     *
     * @param int $max_results Must be greater than or equal to 0
     * @return $this
     */
    public function setMaxResults($max_results)
    {
        Assertion::greaterOrEqualThan($max_results, 0);

        $this->max_results = (int) $max_results;

        return $this;
    }

    /**
     * @return int
     */
    public function getMaxResults()
    {
        return $this->max_results;
    }

    /**
     * Sets the offset of the first result to return.
     *
     * @param int $first_result Must be greater than or equal to 0
     * @return $this
     */
    public function setFirstResult($first_result)
    {
        Assertion::greaterOrEqualThan($first_result, 0);

        $this->first_result = (int) $first_result;

        return $this;
    }

    /**
     * @return int
     */
    public function getFirstResult()
    {
        return $this->first_result;
    }
}