<?php
/*
 *  $Id: Hook.php 1939 2007-07-05 23:47:48Z zYne $
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * This software consists of voluntary contributions made by many individuals
 * and is licensed under the LGPL. For more information, see
 * <http://www.phpdoctrine.com>.
 */

/**
 * Doctrine_Search_Query
 *
 * Turns a free-text search expression into an SQL statement that runs against
 * a keyword index table. The index table is expected to expose the columns
 * 'keyword', 'field' and 'position'; the first remaining column is used as the
 * foreign id that results are grouped by.
 *
 * @package     Doctrine
 * @license     http://www.opensource.org/licenses/lgpl-license.php LGPL
 * @category    Object Relational Mapping
 * @link        www.phpdoctrine.com
 * @since       1.0
 * @version     $Revision: 1939 $
 * @author      Konsta Vesterinen <kvesteri@cc.hut.fi>
 */
class Doctrine_Search_Query
{
    const OPERATOR_OR = 0;
    const OPERATOR_AND = 1;

    /**
     * @var Doctrine_Query $_query      the base query
     */
    protected $_query;

    /**
     * @var Doctrine_Table $_table      the index table (always replaced by the constructor)
     */
    protected $_table = array();

    /**
     * @var string $_sql                the SQL built by the last successful search() call
     */
    protected $_sql = '';

    /**
     * @var array $_params              values for the '?' placeholders of $_sql, in order
     */
    protected $_params = array();

    /**
     * @param Doctrine_Table|string $table  the index table, or a name that is
     *                                      resolved through Doctrine_Manager::table()
     */
    public function __construct($table)
    {
        if (is_string($table)) {
            $table = Doctrine_Manager::table($table);
        }

        $this->_table = $table;
        $this->_query = new Doctrine_Query();
    }

    /**
     * getQuery
     *
     * @return Doctrine_Query       returns the query object associated with this object
     */
    public function getQuery()
    {
        return $this->_query;
    }

    /**
     * search
     *
     * Builds the SQL for the given search text and stores it together with its
     * placeholder values; read them back with getSql() and getParams().
     * Terms separated by an upper-case ' AND ' must all match.
     *
     * @param string $text          the search expression
     * @return boolean|null         false when the text yields no terms, otherwise nothing
     */
    public function search($text)
    {
        $text = trim($text);

        // Split before lower-casing: the ' AND ' delimiter is upper case, so
        // lower-casing the whole text first would leave nothing for a
        // case-sensitive split to match.
        $terms = array_map('strtolower', Doctrine_Tokenizer::sqlExplode($text, ' AND ', '(', ')'));

        $numTerms = count($terms);

        if ($numTerms === 0) {
            return false;
        }

        $foreignId = $this->getForeignIdColumn();

        if (strpos($text, '^') === false) {
            $select = 'SELECT COUNT(keyword) AS relevance, ' . $foreignId;
            $from   = 'FROM ' . $this->_table->getTableName();
        } else {
            // NOTE(review): weighted terms ("term^N") are only detected here.
            // Nothing produces the sub_relevance column yet and the FROM
            // clause is left empty, so the statement built for weighted input
            // is incomplete -- confirm the intended sub-query design.
            $select = 'SELECT SUM(sub_relevance) AS relevance, ' . $foreignId;
            $from   = 'FROM ';
        }

        $params = array();

        if ($numTerms === 1) {
            // only one term found, use fast and simple query
            list($condition, $params) = $this->parseTerm(reset($terms));

            // parseTerm() returns a bare condition, the keyword is added here
            $where = 'WHERE ' . $condition;
        } else {
            $cond = array();

            foreach ($terms as $term) {
                list($condition, $termParams) = $this->parseTerm($term);

                $params = array_merge($params, $termParams);
                $cond[] = $this->buildSubselect($foreignId, $condition);
            }

            $where = 'WHERE ' . implode(' AND ', $cond);
        }

        $groupby = 'GROUP BY ' . $foreignId;
        $orderby = 'ORDER BY relevance';

        $this->_sql    = $select . ' ' . $from . ' ' . $where . ' ' . $groupby . ' ' . $orderby;
        $this->_params = $params;
    }

    /**
     * tokenizeClause
     *
     * Splits a clause on spaces (outside brackets) and groups its terms.
     * Each element of the result is either a single term (string) or an array
     * of terms that were joined by 'OR'. Consecutive elements are implicitly
     * joined by AND; 'AND' and 'OR' are only recognised in upper case.
     *
     * @param string $clause
     * @return array
     */
    public function tokenizeClause($clause)
    {
        $clause = Doctrine_Tokenizer::bracketTrim($clause);

        $terms = Doctrine_Tokenizer::sqlExplode($clause, ' ', '(', ')');

        $operator = self::OPERATOR_AND;
        $ret = array();
        $i = 0;

        foreach ($terms as $term) {
            $term = trim($term);

            if ($term === 'AND') {
                $operator = self::OPERATOR_AND;
                continue;
            }
            if ($term === 'OR') {
                $operator = self::OPERATOR_OR;
                continue;
            }

            // A leading 'OR' has no previous term to attach to; the term that
            // follows it is then treated as the first ordinary term.
            if ($operator === self::OPERATOR_OR && $i > 0) {
                $last = $i - 1;

                if (is_array($ret[$last])) {
                    $ret[$last][] = $term;
                } else {
                    $ret[$last] = array($ret[$last], $term);
                }
            } else {
                $ret[$i] = $term;
                $i++;
            }

            // an operator applies to the next term only
            $operator = self::OPERATOR_AND;
        }

        return $ret;
    }

    /**
     * parseClause
     *
     * Converts a clause into an SQL condition. A clause with several AND-joined
     * parts becomes one "foreign id IN (sub-select)" condition per part; a
     * clause with a single part is handed to parseTerms().
     *
     * @param string $clause
     * @return string               SQL condition without the WHERE keyword
     */
    public function parseClause($clause)
    {
        $clause = Doctrine_Tokenizer::bracketTrim($clause);

        $terms = $this->tokenizeClause($clause);

        if (count($terms) <= 1) {
            // guard against an empty token list (e.g. a clause made of operators only)
            $single = isset($terms[0]) ? $terms[0] : '';

            return $this->parseTerms(is_array($single) ? $single : array($single));
        }

        $foreignId = $this->getForeignIdColumn();
        $ret = array();

        foreach ($terms as $term) {
            if (is_array($term)) {
                $parsed = $this->parseTerms($term);
            } else {
                $parsed = $this->parseClause($term);
            }

            $ret[] = $this->buildSubselect($foreignId, $parsed);
        }

        return implode(' AND ', $ret);
    }

    /**
     * parseTerms
     *
     * Converts a list of alternative terms into one SQL condition joined by OR.
     *
     * @param array $terms          the alternatives
     * @return string               SQL condition without the WHERE keyword
     */
    public function parseTerms(array $terms)
    {
        if (count($terms) <= 1) {
            $single = reset($terms);
            $data   = $this->parseTerm($single === false ? '' : $single);

            return $data[0];
        }

        $ret = array();

        foreach ($terms as $term) {
            $parsed = $this->parseClause($term);

            // A plain 'keyword = ?' (11 characters) stays bare; anything longer
            // than 20 characters is treated as compound and gets parentheses
            // so it cannot mix with the surrounding OR.
            $ret[] = (strlen($parsed) > 20) ? '(' . $parsed . ')' : $parsed;
        }

        return implode(' OR ', $ret);
    }

    /**
     * parseAndSeparatedTerms
     *
     * Builds one "foreign id IN (sub-select)" condition per term and joins
     * them with AND.
     *
     * @param array $terms          clauses that must all match
     * @param string $foreignId     name of the foreign id column
     * @return string               SQL condition, empty string for no terms
     */
    public function parseAndSeparatedTerms($terms, $foreignId)
    {
        $ret = array();

        foreach ($terms as $term) {
            $ret[] = $this->buildSubselect($foreignId, $this->parseClause($term));
        }

        return implode(' AND ', $ret);
    }

    /**
     * parseTerm
     *
     * Converts a single term into a condition and its placeholder values.
     * A term containing a single quote is treated as a phrase: it is split
     * with Doctrine_Tokenizer::quoteExplode() and every word after the first
     * must be found at the matching offset from the first word's position.
     *
     * @param string $term
     * @return array                array(string $condition, array $params)
     */
    public function parseTerm($term)
    {
        $where = 'keyword = ?';

        if (strpos($term, "'") === false) {
            return array($where, array($term));
        }

        $term  = trim($term, "' ");
        $terms = Doctrine_Tokenizer::quoteExplode($term);

        $tableName = $this->_table->getTableName();

        // NOTE(review): the sub-select is compared with '=' and is not limited
        // to the current row's foreign id, so it may yield several rows --
        // confirm against the target databases.
        foreach ($terms as $k => $word) {
            if ($k === 0) {
                continue;
            }
            $where .= ' AND (position + ' . $k . ') = (SELECT position FROM ' . $tableName . ' WHERE keyword = ?)';
        }

        return array($where, $terms);
    }

    /**
     * getSql
     *
     * @return string               the SQL built by the last successful search() call
     */
    public function getSql()
    {
        return $this->_sql;
    }

    /**
     * getParams
     *
     * @return array                placeholder values for getSql(), in placeholder order
     */
    public function getParams()
    {
        return $this->_params;
    }

    /**
     * execute
     *
     * Executes the base query object.
     * NOTE(review): this runs the base query, not the SQL built by search();
     * confirm how the two are meant to be connected.
     *
     * @return mixed                whatever the base query's execute() returns
     */
    public function execute()
    {
        return $this->_query->execute();
    }

    /**
     * Returns the first index table column that is not one of the fixed
     * index columns (keyword, field, position).
     *
     * @return string|false         column name, or false when no column is left
     */
    protected function getForeignIdColumn()
    {
        return current(array_diff($this->_table->getColumnNames(), array('keyword', 'field', 'position')));
    }

    /**
     * Wraps a condition into a "foreign id IN (SELECT ...)" sub-select on the
     * index table.
     *
     * @param string $foreignId     name of the foreign id column
     * @param string $condition     SQL condition without the WHERE keyword
     * @return string
     */
    protected function buildSubselect($foreignId, $condition)
    {
        return $foreignId . ' IN (SELECT ' . $foreignId . ' FROM ' . $this->_table->getTableName() . ' WHERE ' . $condition . ')';
    }
}
|