<?php
/*
 * $Id: Hook.php 1939 2007-07-05 23:47:48Z zYne $
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * This software consists of voluntary contributions made by many individuals
 * and is licensed under the LGPL. For more information, see
 * <http://www.phpdoctrine.org>.
 */

/**
 * Doctrine_Search_Query
 *
 * @package     Doctrine
 * @subpackage  Search
 * @author      Konsta Vesterinen <kvesteri@cc.hut.fi>
 * @license     http://www.opensource.org/licenses/lgpl-license.php LGPL
 * @version     $Revision$
 * @link        www.phpdoctrine.org
 * @since       1.0
 */
class Doctrine_Search_Query
{
    /**
     * @var Doctrine_Table $_table          the index table
     */
    protected $_table;

    /**
     * @var string $_sql                    SQL statement built by the last call to query()
     */
    protected $_sql = '';

    /**
     * @var array $_params                  values for the '?' placeholders of the generated
     *                                      SQL, in the order the placeholders were emitted
     */
    protected $_params = array();

    /**
     * @var array $_words                   every word handed to parseWord(), with '*' removed
     */
    protected $_words = array();

    /**
     * @var Doctrine_Query_Tokenizer $_tokenizer    tokenizer used for splitting the search text
     */
    protected $_tokenizer;

    /**
     * @var string $_condition              sprintf() template of the form
     *                                      "<foreignId> %s (SELECT <foreignId> FROM <index table> WHERE ";
     *                                      %s receives 'IN' or 'NOT IN' and the caller appends the
     *                                      condition plus the closing ')'
     */
    protected $_condition;

    /**
     * @param Doctrine_Table|string $table  the index table, or a name that is resolved
     *                                      through Doctrine_Manager::table()
     * @throws Doctrine_Search_Exception    if $table is neither a string nor a Doctrine_Table
     */
    public function __construct($table)
    {
        if (is_string($table)) {
            $table = Doctrine_Manager::table($table);
        } elseif ( ! $table instanceof Doctrine_Table) {
            throw new Doctrine_Search_Exception('Invalid argument type. Expected instance of Doctrine_Table.');
        }

        $this->_tokenizer = new Doctrine_Query_Tokenizer();
        $this->_table     = $table;

        $foreignId = $this->_getForeignIdColumn();

        $this->_condition = $foreignId . ' %s (SELECT ' . $foreignId . ' FROM ' . $this->_table->getTableName() . ' WHERE ';
    }

    /**
     * Returns the first column of the index table that is not one of the
     * fixed index columns 'keyword', 'field' and 'position'. The rest of the
     * class selects and groups by this column.
     *
     * @return string|false     the column name, or false when the table has no other column
     */
    protected function _getForeignIdColumn()
    {
        $fixedColumns = array('keyword', 'field', 'position');

        return current(array_diff($this->_table->getColumnNames(), $fixedColumns));
    }

    /**
     * Parses the given search text and builds the matching SQL statement.
     * The result is available through getSql(), the bound values through
     * getParams() and the searched words through getWords().
     *
     * @param string $text      the search text
     * @return void
     */
    public function query($text)
    {
        $text = trim($text);

        // Each query starts from a clean slate. Without this, a second call on
        // the same instance would leave stale entries in front of the new ones
        // and getParams() would no longer line up with the placeholders of getSql().
        $this->_params = array();
        $this->_words  = array();

        $foreignId = $this->_getForeignIdColumn();

        if (strpos($text, '^') === false) {
            $select = 'SELECT COUNT(keyword) AS relevance, ' . $foreignId;
            $from   = 'FROM ' . $this->_table->getTableName();
        } else {
            // organize terms according weights
            // NOTE(review): this branch emits an empty FROM clause, so the statement
            // built for text containing '^' looks incomplete - confirm where
            // sub_relevance is supposed to come from before relying on it.
            $select = 'SELECT SUM(sub_relevance) AS relevance, ' . $foreignId;
            $from   = 'FROM ' ;
        }

        $where   = 'WHERE ' . $this->parseClause($text);
        $groupby = 'GROUP BY ' . $foreignId;
        $orderby = 'ORDER BY relevance DESC';

        $this->_sql = $select . ' ' . $from . ' ' . $where . ' ' . $groupby . ' ' . $orderby;
    }

    /**
     * Converts a search clause into an SQL condition. The clause is first
     * split on ' OR '; when that yields a single part it is split on spaces
     * and the parts are joined with ' AND '. Parts that are themselves
     * expressions are parsed recursively.
     *
     * As a side effect every parsed word is recorded via parseWord().
     *
     * @param string $originalClause    the clause to parse
     * @param boolean $recursive        true when called for a nested part of a larger clause
     * @return string                   the SQL condition
     */
    public function parseClause($originalClause, $recursive = false)
    {
        // presumably strips the enclosing parentheses - verify against Doctrine_Query_Tokenizer
        $clause = $this->_tokenizer->bracketTrim($originalClause);

        // if trimming changed the clause, the result is wrapped in parentheses again
        $brackets = ($clause !== $originalClause);

        $terms = $this->_tokenizer->sqlExplode($clause, ' OR ', '(', ')');

        $ret = array();

        if (count($terms) > 1) {
            $leavesOnly = true;

            foreach ($terms as $k => $term) {
                if ($this->isExpression($term)) {
                    $ret[$k] = $this->parseClause($term, true);
                    $leavesOnly = false;
                } else {
                    $ret[$k] = $this->parseTerm($term);
                }
            }

            $return = implode(' OR ', $ret);

            if ($leavesOnly && $recursive) {
                // a nested OR of plain terms fits into a single IN sub-select,
                // which already carries its own parentheses
                $return = sprintf($this->_condition, 'IN') . $return . ')';
                $brackets = false;
            }
        } else {
            $terms = $this->_tokenizer->sqlExplode($clause, ' ', '(', ')');

            if (count($terms) === 1 && ! $recursive) {
                $return = $this->parseTerm($clause);
            } else {
                foreach ($terms as $k => $term) {
                    $term = trim($term);

                    // AND is implicit between space separated terms
                    if ($term === 'AND') {
                        continue;
                    }

                    // a leading '-' excludes the term
                    if (substr($term, 0, 1) === '-') {
                        $operator = 'NOT IN';
                        $term = substr($term, 1);
                    } else {
                        $operator = 'IN';
                    }

                    if ($this->isExpression($term)) {
                        // NOTE(review): $operator is not passed on here, so a '-' in
                        // front of a nested expression is stripped without negating it.
                        $ret[$k] = $this->parseClause($term, true);
                    } else {
                        $ret[$k] = sprintf($this->_condition, $operator) . $this->parseTerm($term) . ')';
                    }
                }

                $return = implode(' AND ', $ret);
            }
        }

        if ($brackets) {
            return '(' . $return . ')';
        }

        return $return;
    }

    /**
     * Tells whether the given term has to be parsed as a clause of its own:
     * either it contains an opening parenthesis, or the tokenizer's
     * quoteExplode() splits it into more than one part.
     *
     * @param string $term
     * @return boolean
     */
    public function isExpression($term)
    {
        if (strpos($term, '(') !== false) {
            return true;
        }

        return count($this->_tokenizer->quoteExplode($term)) > 1;
    }

    /**
     * Builds the condition for a single term. A term without single quotes
     * is treated as one word. A quoted term is treated as a phrase: the first
     * word is matched directly and each following word has to be found at the
     * corresponding position offset.
     *
     * @param string $term
     * @return string           the SQL condition for the term
     */
    public function parseTerm($term)
    {
        if (strpos($term, "'") === false) {
            return $this->parseWord($term);
        }

        $term  = trim($term, "' ");
        $terms = $this->_tokenizer->quoteExplode($term);
        $where = $this->parseWord($terms[0]);

        foreach ($terms as $k => $word) {
            if ($k === 0) {
                continue;
            }

            // IN rather than '=': the sub-select returns one row per occurrence of
            // the word in the index, and comparing against a multi-row scalar
            // subquery is a runtime error on e.g. MySQL and PostgreSQL.
            // NOTE(review): the sub-select is not restricted to the same record or
            // field, so phrase matching is only approximate.
            $where .= ' AND (position + ' . $k . ') IN (SELECT position FROM ' . $this->_table->getTableName() . ' WHERE ' . $this->parseWord($word) . ')';
        }

        return $where;
    }

    /**
     * Builds the condition for a single word and records the word (with '*'
     * removed) in the word list and its bound value in the parameter list.
     * Words containing '*' or '?' are matched with LIKE, all others with '='.
     *
     * @param string $word
     * @return string           'keyword LIKE ?' or 'keyword = ?'
     */
    public function parseWord($word)
    {
        $this->_words[] = str_replace('*', '', $word);

        if (strpos($word, '?') !== false ||
            strpos($word, '*') !== false) {

            // NOTE(review): only '*' is translated to a SQL wildcard; '?' switches
            // to LIKE but is bound unchanged - confirm whether it should become '_'.
            $word  = str_replace('*', '%', $word);
            $where = 'keyword LIKE ?';
        } else {
            $where = 'keyword = ?';
        }

        $this->_params[] = $word;

        return $where;
    }

    /**
     * @return array            the words collected while parsing, '*' removed
     */
    public function getWords()
    {
        return $this->_words;
    }

    /**
     * @return array            the values to bind to the placeholders of getSql()
     */
    public function getParams()
    {
        return $this->_params;
    }

    /**
     * @return string           the SQL built by the last call to query(), '' before that
     */
    public function getSql()
    {
        return $this->_sql;
    }
}