502 lines
19 KiB
502 lines
19 KiB
<?php |
|
/** |
|
* @link http://www.yiiframework.com/ |
|
* @copyright Copyright (c) 2008 Yii Software LLC |
|
* @license http://www.yiiframework.com/license/ |
|
*/ |
|
|
|
namespace yii\elasticsearch; |
|
|
|
use Yii; |
|
use yii\base\Component; |
|
use yii\base\NotSupportedException; |
|
use yii\db\QueryInterface; |
|
use yii\db\QueryTrait; |
|
|
|
/** |
|
* Query represents a query to the search API of elasticsearch. |
|
* |
|
* Query provides a set of methods to facilitate the specification of different parameters of the query. |
|
* These methods can be chained together. |
|
* |
|
 * By calling [[createCommand()]], we can get a [[Command]] instance which can be further
 * used to execute the search request against elasticsearch.
|
* |
|
* For example, |
|
* |
|
* ~~~ |
|
* $query = new Query; |
|
 * $query->fields('id', 'name')
|
* ->from('myindex', 'users') |
|
* ->limit(10); |
|
* // build and execute the query |
|
* $command = $query->createCommand(); |
|
* $rows = $command->search(); // this way you get the raw output of elasticsearch. |
|
* ~~~ |
|
* |
|
* You would normally call `$query->search()` instead of creating a command as this method |
|
* adds the `indexBy()` feature and also removes some inconsistencies from the response. |
|
* |
|
* Query also provides some methods to easier get some parts of the result only: |
|
* |
|
* - [[one()]]: returns a single record populated with the first row of data. |
|
* - [[all()]]: returns all records based on the query results. |
|
* - [[count()]]: returns the number of records. |
|
* - [[scalar()]]: returns the value of the first column in the first row of the query result. |
|
* - [[column()]]: returns the value of the first column in the query result. |
|
* - [[exists()]]: returns a value indicating whether the query result has data or not. |
|
* |
|
* @author Carsten Brandt <mail@cebe.cc> |
|
* @since 2.0 |
|
*/ |
|
class Query extends Component implements QueryInterface |
|
{ |
|
use QueryTrait; |
|
|
|
/** |
|
* @var array the fields being retrieved from the documents. For example, `['id', 'name']`. |
|
* If not set, it means retrieving all fields. An empty array will result in no fields being |
|
* retrieved. This means that only the primaryKey of a record will be available in the result. |
|
* @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-fields.html#search-request-fields |
|
* @see fields() |
|
*/ |
|
public $fields; |
|
/**
 * @var string|array The index to retrieve data from. This can be a string representing a single index
 * or an array of multiple indexes. If this is not set, all indexes are being queried.
 * @see from()
 */
|
public $index; |
|
/**
 * @var string|array The type to retrieve data from. This can be a string representing a single type
 * or an array of multiple types. If this is not set, all types are being queried.
 * @see from()
 */
|
public $type; |
|
/** |
|
* @var integer A search timeout, bounding the search request to be executed within the specified time value |
|
* and bail with the hits accumulated up to that point when expired. Defaults to no timeout. |
|
* @see timeout() |
|
* @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-body.html#_parameters_3 |
|
*/ |
|
public $timeout; |
|
/** |
|
* @var array|string The query part of this search query. This is an array or json string that follows the format of |
|
* the elasticsearch [Query DSL](http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/query-dsl.html). |
|
*/ |
|
public $query; |
|
/** |
|
* @var array|string The filter part of this search query. This is an array or json string that follows the format of |
|
* the elasticsearch [Query DSL](http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/query-dsl.html). |
|
*/ |
|
public $filter; |
|
|
|
public $facets = []; |
|
|
|
/**
 * Initializes the query and applies a default page size.
 *
 * When no limit has been configured, the limit is set to 10 to mirror the elasticsearch default.
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-body.html#_parameters_3
 */
public function init()
{
    parent::init();

    // An explicitly configured limit always wins over the default.
    if ($this->limit !== null) {
        return;
    }

    $this->limit = 10;
}
|
|
|
/**
 * Builds a command object that can execute this query.
 *
 * The query is passed through the connection's query builder and the resulting
 * configuration is handed to the connection to create the command.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return Command the created command instance.
 */
public function createCommand($db = null)
{
    // Fall back to the application-wide component when no connection is supplied.
    $connection = ($db === null) ? Yii::$app->getComponent('elasticsearch') : $db;

    $builder = $connection->getQueryBuilder();

    return $connection->createCommand($builder->build($this));
}
|
|
|
/**
 * Executes the query and returns all hits as an array.
 *
 * If [[fields]] is set, the `fields` entry of every hit is moved to `_source`
 * (an empty array is used when the hit has no `fields` entry).
 * If `indexBy` is set, the hits are re-keyed by the given field of `_source` or by
 * the return value of the callable.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return array the query results. If the query results in nothing, an empty array will be returned.
 */
public function all($db = null)
{
    $response = $this->createCommand($db)->search();
    if (empty($response['hits']['hits'])) {
        return [];
    }

    $hits = $response['hits']['hits'];

    // Nothing to normalize or re-key: hand back the raw hits.
    if ($this->fields === null && $this->indexBy === null) {
        return $hits;
    }

    $indexed = [];
    foreach ($hits as $position => $hit) {
        if ($this->fields !== null) {
            $hit['_source'] = isset($hit['fields']) ? $hit['fields'] : [];
            unset($hit['fields']);
        }

        // Without indexBy the original position is kept as the key.
        if ($this->indexBy === null) {
            $indexed[$position] = $hit;
            continue;
        }

        $indexKey = is_string($this->indexBy)
            ? $hit['_source'][$this->indexBy]
            : call_user_func($this->indexBy, $hit);
        $indexed[$indexKey] = $hit;
    }

    return $indexed;
}
|
|
|
/**
 * Executes the query and returns the first hit only.
 *
 * The search is issued with the `size` option set to 1. If [[fields]] is set, the
 * `fields` entry of the hit is moved to `_source`.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return array|boolean the first hit (as an array) of the query result. False is returned if the query
 * results in nothing.
 */
public function one($db = null)
{
    $response = $this->createCommand($db)->search(['size' => 1]);
    if (empty($response['hits']['hits'])) {
        return false;
    }

    $hits = $response['hits']['hits'];
    $first = reset($hits);

    if ($this->fields !== null) {
        $first['_source'] = isset($first['fields']) ? $first['fields'] : [];
        unset($first['fields']);
    }

    return $first;
}
|
|
|
/**
 * Executes the query and returns the complete search result including e.g. hits, facets, totalCount.
 *
 * The hits of the response are post-processed the same way as in [[all()]]:
 * if [[fields]] is set, the `fields` entry of every hit is moved to `_source`, and if
 * `indexBy` is set, the hits are re-keyed accordingly. All other parts of the response are
 * returned untouched.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @param array $options The options given with this query. Possible options are:
 * - [routing](http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search.html#search-routing)
 * - [search_type](http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-search-type.html)
 * @return array the query results.
 */
public function search($db = null, $options = [])
{
    $result = $this->createCommand($db)->search($options);

    // Post-processing is required as soon as EITHER feature is in use. The previous check
    // (`=== null || === null`) skipped it exactly when both indexBy and fields were set.
    $needsProcessing = $this->indexBy !== null || $this->fields !== null;
    if (empty($result['hits']['hits']) || !$needsProcessing) {
        return $result;
    }

    $rows = [];
    foreach ($result['hits']['hits'] as $key => $row) {
        if ($this->fields !== null) {
            $row['_source'] = isset($row['fields']) ? $row['fields'] : [];
            unset($row['fields']);
        }
        if ($this->indexBy !== null) {
            $key = is_string($this->indexBy)
                ? $row['_source'][$this->indexBy]
                : call_user_func($this->indexBy, $row);
        }
        $rows[$key] = $row;
    }
    $result['hits']['hits'] = $rows;

    return $result;
}
|
|
|
// TODO add query stats http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search.html#stats-groups |
|
|
|
// TODO add scroll/scan http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-search-type.html#scan |
|
|
|
/**
 * Intended to execute the query and delete all matching documents.
 *
 * This is not implemented yet; calling this method always throws an exception.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @throws NotSupportedException always, since delete by query is not implemented.
 */
public function delete($db = null)
{
    // TODO implement http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/docs-delete-by-query.html
    $exception = new NotSupportedException('Delete by query is not implemented yet.');

    throw $exception;
}
|
|
|
/**
 * Returns a single field value from the first document of the query result.
 *
 * @param string $field name of the attribute to select
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return string the value of the specified attribute in the first record of the query result.
 * Null is returned if the query result is empty or the field does not exist.
 */
public function scalar($field, $db = null)
{
    // `self::` resolves to this class's one() even if a subclass overrides it.
    // NOTE(review): presumably so that a raw array is always returned here; confirm against subclasses.
    $first = self::one($db); // TODO limit fields to the one required

    if ($first === false || !isset($first['_source'][$field])) {
        return null;
    }

    return $first['_source'][$field];
}
|
|
|
/**
 * Executes the query and returns the values of one field for all hits.
 *
 * The command's `fields` query part is replaced with the requested field before searching.
 * Hits that do not carry the field contribute `null` to the result.
 *
 * @param string $field the field to query over
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return array the values of the field, one entry per hit. An empty array is returned if the query results in nothing.
 */
public function column($field, $db = null)
{
    $command = $this->createCommand($db);
    // Restrict the request to the single field of interest.
    $command->queryParts['fields'] = [$field];

    $response = $command->search();
    if (empty($response['hits']['hits'])) {
        return [];
    }

    $values = [];
    foreach ($response['hits']['hits'] as $hit) {
        if (isset($hit['fields'][$field])) {
            $values[] = $hit['fields'][$field];
        } else {
            $values[] = null;
        }
    }

    return $values;
}
|
|
|
/**
 * Returns the number of records matching the query.
 *
 * The search is issued with `search_type` set to `count` and the `total` of the hits is returned.
 *
 * @param string $q the COUNT expression. This parameter is ignored by this implementation.
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return integer number of records
 */
public function count($q = '*', $db = null)
{
    // TODO consider sending to _count api instead of _search for performance
    // only when no facets are registered.
    // http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-count.html

    $response = $this->createCommand($db)->search(['search_type' => 'count']);

    return $response['hits']['total'];
}
|
|
|
/**
 * Tells whether the query matches at least one document.
 *
 * @param Connection $db the connection used to execute the query.
 * If this parameter is not given, the `elasticsearch` application component will be used.
 * @return boolean whether the query result contains any row of data.
 */
public function exists($db = null)
{
    // `self::` resolves to this class's one(), which returns false when there is no hit.
    $first = self::one($db);

    return $first !== false;
}
|
|
|
/**
 * Registers a facet under the given name, replacing any facet previously stored under that name.
 *
 * @param string $name the name of this facet
 * @param string $type the facet type. e.g. `terms`, `range`, `histogram`...
 * @param string|array $options the configuration options for this facet. Can be an array or a json string.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-query-facet.html
 */
public function addFacet($name, $type, $options)
{
    $definition = [$type => $options];
    $this->facets[$name] = $definition;

    return $this;
}
|
|
|
/**
 * Adds a `terms` facet, which allows to specify field facets that return the N most frequent terms.
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-terms-facet.html
 */
public function addTermFacet($name, $options)
{
    $facetType = 'terms';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `range` facet. A range facet allows to specify a set of ranges and get both the number
 * of docs (count) that fall within each range, and aggregated data either based on the field,
 * or using another field.
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-range-facet.html
 */
public function addRangeFacet($name, $options)
{
    $facetType = 'range';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `histogram` facet. The histogram facet works with numeric data by building a histogram
 * across intervals of the field values. Each value is "rounded" into an interval (or placed in a
 * bucket), and statistics are provided per interval/bucket (count and total).
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-histogram-facet.html
 */
public function addHistogramFacet($name, $options)
{
    $facetType = 'histogram';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `date_histogram` facet, a specific histogram facet that can work with date field types,
 * enhancing it over the regular histogram facet.
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-date-histogram-facet.html
 */
public function addDateHistogramFacet($name, $options)
{
    $facetType = 'date_histogram';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `filter` facet. A filter facet (not to be confused with a facet filter) allows you to
 * return a count of the hits matching the filter. The filter itself can be expressed using the Query DSL.
 *
 * @param string $name the name of this facet
 * @param string $filter the query in Query DSL
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-filter-facet.html
 */
public function addFilterFacet($name, $filter)
{
    $facetType = 'filter';

    return $this->addFacet($name, $facetType, $filter);
}
|
|
|
/**
 * Adds a `query` facet. A facet query allows to return a count of the hits matching the facet query.
 * The query itself can be expressed using the Query DSL.
 *
 * @param string $name the name of this facet
 * @param string $query the query in Query DSL
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-query-facet.html
 */
public function addQueryFacet($name, $query)
{
    $facetType = 'query';

    return $this->addFacet($name, $facetType, $query);
}
|
|
|
/**
 * Adds a `statistical` facet. A statistical facet allows to compute statistical data on numeric
 * fields. The statistical data include count, total, sum of squares, mean (average), minimum,
 * maximum, variance, and standard deviation.
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-statistical-facet.html
 */
public function addStatisticalFacet($name, $options)
{
    $facetType = 'statistical';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `terms_stats` facet. The `terms_stats` facet combines both the terms and statistical
 * facets, allowing to compute stats on a field, per term value driven by another field.
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-terms-stats-facet.html
 */
public function addTermsStatsFacet($name, $options)
{
    $facetType = 'terms_stats';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
/**
 * Adds a `geo_distance` facet. The `geo_distance` facet provides information for ranges of
 * distances from a provided `geo_point`, including the count of hits that fall within each range,
 * and aggregation information (like `total`).
 *
 * @param string $name the name of this facet
 * @param array $options additional option. Please refer to the elasticsearch documentation for details.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-facets-geo-distance-facet.html
 */
public function addGeoDistanceFacet($name, $options)
{
    $facetType = 'geo_distance';

    return $this->addFacet($name, $facetType, $options);
}
|
|
|
// TODO add suggesters http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-suggesters.html |
|
|
|
// TODO add validate query http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-validate.html |
|
|
|
// TODO support multi query via static method http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-multi-search.html |
|
|
|
/**
 * Sets the query part of this search query.
 *
 * @param array|string $query the query, stored as given in [[query]].
 * @return static the query object itself
 */
public function query($query)
{
    $this->query = $query;

    return $this;
}
|
|
|
/**
 * Sets the filter part of this search query.
 *
 * @param array|string $filter the filter, stored as given in [[filter]].
 * @return static the query object itself
 */
public function filter($filter)
{
    $this->filter = $filter;

    return $this;
}
|
|
|
/**
 * Sets the index and type to retrieve documents from.
 *
 * Both values are always overwritten, so omitting `$type` resets [[type]] to `null`.
 *
 * @param string|array $index The index to retrieve data from. This can be a string representing a single index
 * or an array of multiple indexes. If this is `null` it means that all indexes are being queried.
 * @param string|array $type The type to retrieve data from. This can be a string representing a single type
 * or an array of multiple types. If this is `null` it means that all types are being queried.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-search.html#search-multi-index-type
 */
public function from($index, $type = null)
{
    $this->type = $type;
    $this->index = $index;

    return $this;
}
|
|
|
/**
 * Sets the fields to retrieve from the documents.
 *
 * The fields can be given either as a single array (or `null`), or as separate arguments,
 * e.g. `fields('id', 'name')`; in the latter case all arguments passed are used as the field list.
 *
 * @param array|string|null $fields the fields to be selected.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-fields.html
 */
public function fields($fields)
{
    // Arrays and null are stored as given; anything else is treated as a variadic argument list.
    $this->fields = (is_array($fields) || $fields === null) ? $fields : func_get_args();

    return $this;
}
|
|
|
/**
 * Sets the search timeout.
 *
 * @param integer $timeout A search timeout, bounding the search request to be executed within the specified
 * time value and bail with the hits accumulated up to that point when expired. Defaults to no timeout.
 * @return static the query object itself
 * @see http://www.elasticsearch.org/guide/en/elasticsearch/reference/current/search-request-body.html#_parameters_3
 */
public function timeout($timeout)
{
    $this->timeout = $timeout;

    return $this;
}
|
} |