1
0
mirror of synced 2025-01-22 08:11:40 +03:00

236 lines
7.2 KiB
PHP
Raw Normal View History

2007-07-12 21:50:31 +00:00
<?php
/*
* $Id: Hook.php 1939 2007-07-05 23:47:48Z zYne $
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
* This software consists of voluntary contributions made by many individuals
* and is licensed under the LGPL. For more information, see
* <http://www.phpdoctrine.com>.
*/
/**
 * Doctrine_Search_Query
 *
 * Translates a free-text search expression into an SQL statement that is run
 * against a keyword index table (a table with 'keyword', 'field' and
 * 'position' columns plus one column referencing the indexed record).
 *
 * The expression syntax handled by this class:
 *  - terms separated by ' OR ' are alternatives
 *  - terms separated by spaces (optionally with a literal 'AND') must all match
 *  - a leading '-' on a term excludes records matching it
 *  - single-quoted text is treated as a phrase (consecutive positions)
 *  - '*' inside a word is a wildcard
 *  - brackets group sub-expressions
 *
 * @package     Doctrine
 * @subpackage  Search
 * @author      Konsta Vesterinen <kvesteri@cc.hut.fi>
 * @license     http://www.opensource.org/licenses/lgpl-license.php LGPL
 * @version     $Revision$
 * @link        www.phpdoctrine.com
 * @since       1.0
 */
class Doctrine_Search_Query
{
    /**
     * @var Doctrine_Table $_table          the index table
     */
    protected $_table;

    /**
     * @var string $_sql                    the SQL built by the last call to query()
     */
    protected $_sql = '';

    /**
     * @var array $_params                  values for the '?' placeholders, in the order they were parsed
     */
    protected $_params = array();

    /**
     * @var array $_words                   the parsed words with every '*' removed
     */
    protected $_words = array();

    /**
     * @var Doctrine_Query_Tokenizer $_tokenizer    tokenizer used to split clauses and terms
     */
    protected $_tokenizer;

    /**
     * @var string $_condition              sprintf() template '<id> %s (SELECT <id> FROM <table> WHERE ';
     *                                      %s receives 'IN' or 'NOT IN' and the caller appends the
     *                                      inner condition followed by ')'
     */
    protected $_condition;

    /**
     * @param Doctrine_Table|string $table  the index table, or a name that is
     *                                      resolved through Doctrine_Manager::table()
     * @throws Doctrine_Search_Exception    if $table is neither a string nor a Doctrine_Table
     */
    public function __construct($table)
    {
        if (is_string($table)) {
            $table = Doctrine_Manager::table($table);
        } elseif ( ! $table instanceof Doctrine_Table) {
            throw new Doctrine_Search_Exception('Invalid argument type. Expected instance of Doctrine_Table.');
        }

        $this->_tokenizer = new Doctrine_Query_Tokenizer();
        $this->_table     = $table;

        $foreignId = $this->_getForeignIdColumn();

        $this->_condition = $foreignId . ' %s (SELECT ' . $foreignId . ' FROM ' . $this->_table->getTableName() . ' WHERE ';
    }

    /**
     * Builds the SQL for the given search text. The result is available
     * through getSql(), the placeholder values through getParams() and the
     * parsed words through getWords().
     *
     * @param string $text      the search expression
     * @return void
     */
    public function query($text)
    {
        $text = trim($text);

        // Start from a clean state: parseWord() only appends, so without this
        // a second query() on the same instance would leave parameters of the
        // previous search in front of the ones matching the new SQL.
        $this->_params = array();
        $this->_words  = array();

        $foreignId = $this->_getForeignIdColumn();

        if (strpos($text, '^') === false) {
            $select = 'SELECT COUNT(keyword) AS relevance, ' . $foreignId;
            $from   = 'FROM ' . $this->_table->getTableName();
        } else {
            // organize terms according weights
            // NOTE(review): this branch emits 'FROM ' without any table or
            // sub-select, so weighted ('^') searches look unfinished - confirm.
            $select = 'SELECT SUM(sub_relevance) AS relevance, ' . $foreignId;
            $from   = 'FROM ' ;
        }

        $where   = 'WHERE ' . $this->parseClause($text);
        $groupby = 'GROUP BY ' . $foreignId;
        $orderby = 'ORDER BY relevance DESC';

        $this->_sql = $select . ' ' . $from . ' ' . $where . ' ' . $groupby . ' ' . $orderby;
    }

    /**
     * Parses a clause (a possibly bracketed combination of terms) into an SQL
     * condition. Placeholder values are collected as a side effect.
     *
     * @param string $originalClause    the clause to parse
     * @param boolean $recursive        true when called for a sub-expression;
     *                                  leaf terms are then wrapped in IN / NOT IN sub-selects
     * @return string                   the SQL condition
     */
    public function parseClause($originalClause, $recursive = false)
    {
        $clause = $this->_tokenizer->bracketTrim($originalClause);

        // if trimming changed the clause it was bracketed, so the result is
        // bracketed again on the way out
        $brackets = ($clause !== $originalClause);

        $terms = $this->_tokenizer->sqlExplode($clause, ' OR ', '(', ')');

        $ret = array();

        if (count($terms) > 1) {
            $leavesOnly = true;

            foreach ($terms as $k => $term) {
                if ($this->isExpression($term)) {
                    $ret[$k] = $this->parseClause($term, true);
                    $leavesOnly = false;
                } else {
                    $ret[$k] = $this->parseTerm($term);
                }
            }

            $return = implode(' OR ', $ret);

            if ($leavesOnly && $recursive) {
                // plain alternatives inside a sub-expression share one
                // sub-select; its parentheses replace the original brackets
                $return = sprintf($this->_condition, 'IN') . $return . ')';
                $brackets = false;
            }
        } else {
            $terms = $this->_tokenizer->sqlExplode($clause, ' ', '(', ')');

            if (count($terms) === 1 && ! $recursive) {
                $return = $this->parseTerm($clause);
            } else {
                foreach ($terms as $k => $term) {
                    $term = trim($term);

                    // a literal AND is redundant, terms are AND-ed anyway
                    if ($term === 'AND') {
                        continue;
                    }

                    if (substr($term, 0, 1) === '-') {
                        $operator = 'NOT IN';
                        $term = substr($term, 1);
                    } else {
                        $operator = 'IN';
                    }

                    if ($this->isExpression($term)) {
                        $ret[$k] = $this->parseClause($term, true);
                    } else {
                        $ret[$k] = sprintf($this->_condition, $operator) . $this->parseTerm($term) . ')';
                    }
                }

                $return = implode(' AND ', $ret);
            }
        }

        if ($brackets) {
            return '(' . $return . ')';
        }

        return $return;
    }

    /**
     * Tells whether the given term needs to be parsed as a clause of its own:
     * it either contains a bracket or splits into more than one part.
     *
     * @param string $term
     * @return boolean
     */
    public function isExpression($term)
    {
        if (strpos($term, '(') !== false) {
            return true;
        }

        $terms = $this->_tokenizer->quoteExplode($term);

        return (count($terms) > 1);
    }

    /**
     * Parses a single term: either one word or a single-quoted phrase. For a
     * phrase every word after the first is tied to the position of the first
     * word plus its offset within the phrase.
     *
     * @param string $term
     * @return string           the SQL condition for the term
     */
    public function parseTerm($term)
    {
        if (strpos($term, "'") === false) {
            return $this->parseWord($term);
        }

        $term  = trim($term, "' ");
        $terms = $this->_tokenizer->quoteExplode($term);
        $where = $this->parseWord($terms[0]);

        foreach ($terms as $k => $word) {
            if ($k === 0) {
                continue;
            }
            $where .= ' AND (position + ' . $k . ') = (SELECT position FROM ' . $this->_table->getTableName() . ' WHERE ' . $this->parseWord($word) . ')';
        }

        return $where;
    }

    /**
     * Parses a single word into a keyword condition, registering the word
     * (with '*' removed) and its placeholder value.
     *
     * @param string $word
     * @return string           'keyword LIKE ?' for wildcard words, 'keyword = ?' otherwise
     */
    public function parseWord($word)
    {
        $this->_words[] = str_replace('*', '', $word);

        if (strpos($word, '?') !== false ||
            strpos($word, '*') !== false) {

            // NOTE(review): '?' selects the LIKE branch but is passed on
            // unchanged, only '*' becomes the SQL wildcard '%' - confirm
            // whether '?' was meant to be translated as well.
            $word  = str_replace('*', '%', $word);
            $where = 'keyword LIKE ?';
        } else {
            $where = 'keyword = ?';
        }

        $this->_params[] = $word;

        return $where;
    }

    /**
     * @return array            the words parsed so far, with '*' removed
     */
    public function getWords()
    {
        return $this->_words;
    }

    /**
     * @return array            the placeholder values collected so far
     */
    public function getParams()
    {
        return $this->_params;
    }

    /**
     * @return string           the SQL built by the last call to query()
     */
    public function getSql()
    {
        return $this->_sql;
    }

    /**
     * Returns the first column of the index table that is not one of
     * 'keyword', 'field' or 'position'; this class uses it as the column
     * identifying the indexed record.
     *
     * @return string|false     the column name, false if there is no such column
     */
    protected function _getForeignIdColumn()
    {
        return current(array_diff($this->_table->getColumnNames(), array('keyword', 'field', 'position')));
    }
}