303 lines
10 KiB
PHP
303 lines
10 KiB
PHP
|
<?php
|
||
|
/*
|
||
|
* $Id$
|
||
|
*
|
||
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
||
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
||
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
||
|
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
||
|
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
||
|
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
||
|
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
||
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
||
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
||
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
*
|
||
|
* This software consists of voluntary contributions made by many individuals
|
||
|
* and is licensed under the LGPL. For more information, see
|
||
|
* <http://www.phpdoctrine.org>.
|
||
|
*/
|
||
|
|
||
|
/**
|
||
|
* Doctrine_Search
|
||
|
*
|
||
|
* @package Doctrine
|
||
|
* @subpackage Search
|
||
|
* @author Konsta Vesterinen <kvesteri@cc.hut.fi>
|
||
|
* @license http://www.opensource.org/licenses/lgpl-license.php LGPL
|
||
|
* @version $Revision$
|
||
|
* @link www.phpdoctrine.org
|
||
|
* @since 1.0
|
||
|
*/
|
||
|
class Doctrine_Search extends Doctrine_Record_Generator
|
||
|
{
|
||
|
const INDEX_FILES = 0;
|
||
|
|
||
|
const INDEX_TABLES = 1;
|
||
|
|
||
|
protected $_options = array('generateFiles' => false,
|
||
|
'analyzer' => 'Doctrine_Search_Analyzer_Standard',
|
||
|
'analyzer_options' => array(),
|
||
|
'type' => self::INDEX_TABLES,
|
||
|
'className' => '%CLASS%Index',
|
||
|
'generatePath' => false,
|
||
|
'table' => null,
|
||
|
'batchUpdates' => false,
|
||
|
'pluginTable' => false,
|
||
|
'fields' => array(),
|
||
|
'connection' => null,
|
||
|
'children' => array());
|
||
|
/**
|
||
|
* __construct
|
||
|
*
|
||
|
* @param array $options
|
||
|
* @return void
|
||
|
*/
|
||
|
public function __construct(array $options)
|
||
|
{
|
||
|
$this->_options = Doctrine_Lib::arrayDeepMerge($this->_options, $options);
|
||
|
|
||
|
if ( ! isset($this->_options['analyzer'])) {
|
||
|
$this->_options['analyzer'] = 'Doctrine_Search_Analyzer_Standard';
|
||
|
}
|
||
|
|
||
|
if ( ! isset($this->_options['analyzer_options'])) {
|
||
|
$this->_options['analyzer_options'] = array();
|
||
|
}
|
||
|
|
||
|
$this->_options['analyzer'] = new $this->_options['analyzer']($this->_options['analyzer_options']);
|
||
|
|
||
|
if ( ! isset($this->_options['connection'])) {
|
||
|
$this->_options['connection'] = Doctrine_Manager::connection();
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* Searchable keyword search
|
||
|
*
|
||
|
* @param string $string Keyword string to search for
|
||
|
* @param Doctrine_Query $query Query object to alter. Adds where condition to limit the results using the search index
|
||
|
* @return array ids and relevancy
|
||
|
*/
|
||
|
public function search($string, $query = null)
|
||
|
{
|
||
|
$q = new Doctrine_Search_Query($this->_table);
|
||
|
|
||
|
if ($query instanceof Doctrine_Query) {
|
||
|
$q->query($string, false);
|
||
|
|
||
|
$newQuery = $query->copy();
|
||
|
$query->getSql();
|
||
|
$key = (array) $this->getOption('table')->getIdentifier();
|
||
|
$newQuery->addWhere($query->getRootAlias() . '.'.current($key).' IN (SQL:' . $q->getSql() . ')', $q->getParams());
|
||
|
|
||
|
return $newQuery;
|
||
|
} else {
|
||
|
$q->query($string);
|
||
|
return $this->_options['connection']->fetchAll($q->getSql(), $q->getParams());
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* analyze a text in the encoding format
|
||
|
*
|
||
|
* @param string $text
|
||
|
* @param string $encoding
|
||
|
* @return void
|
||
|
*/
|
||
|
public function analyze($text, $encoding = null)
|
||
|
{
|
||
|
return $this->_options['analyzer']->analyze($text, $encoding);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* updateIndex
|
||
|
* updates the index
|
||
|
*
|
||
|
* @param Doctrine_Record $record
|
||
|
* @return integer
|
||
|
*/
|
||
|
public function updateIndex(array $data, $encoding = null)
|
||
|
{
|
||
|
$this->initialize($this->_options['table']);
|
||
|
|
||
|
$fields = $this->getOption('fields');
|
||
|
$class = $this->getOption('className');
|
||
|
$name = $this->getOption('table')->getComponentName();
|
||
|
$conn = $this->getOption('table')->getConnection();
|
||
|
$identifier = $this->_options['table']->getIdentifier();
|
||
|
|
||
|
$q = Doctrine_Query::create()->delete()
|
||
|
->from($class);
|
||
|
foreach ((array) $identifier as $id) {
|
||
|
$q->addWhere($id . ' = ?', array($data[$id]));
|
||
|
}
|
||
|
$q->execute();
|
||
|
|
||
|
if ($this->_options['batchUpdates'] === true) {
|
||
|
$index = new $class();
|
||
|
|
||
|
foreach ((array) $this->_options['table']->getIdentifier() as $id) {
|
||
|
$index->$id = $data[$id];
|
||
|
}
|
||
|
|
||
|
$index->save();
|
||
|
} else {
|
||
|
foreach ($fields as $field) {
|
||
|
|
||
|
$value = isset($data[$field]) ? $data[$field] : null;
|
||
|
|
||
|
$terms = $this->analyze($value, $encoding);
|
||
|
|
||
|
foreach ($terms as $pos => $term) {
|
||
|
$index = new $class();
|
||
|
|
||
|
$index->keyword = $term;
|
||
|
$index->position = $pos;
|
||
|
$index->field = $field;
|
||
|
foreach ((array) $this->_options['table']->getIdentifier() as $id) {
|
||
|
$index->$id = $data[$id];
|
||
|
}
|
||
|
|
||
|
$index->save();
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* readTableData
|
||
|
*
|
||
|
* @param mixed $limit
|
||
|
* @param mixed $offset
|
||
|
* @return Doctrine_Collection The collection of results
|
||
|
*/
|
||
|
public function readTableData($limit = null, $offset = null)
|
||
|
{
|
||
|
$this->initialize($this->_options['table']);
|
||
|
|
||
|
$conn = $this->_options['table']->getConnection();
|
||
|
$tableName = $this->_options['table']->getTableName();
|
||
|
$id = current($this->_options['table']->getIdentifierColumnNames());
|
||
|
|
||
|
$query = 'SELECT * FROM ' . $conn->quoteIdentifier($tableName)
|
||
|
. ' WHERE ' . $conn->quoteIdentifier($id)
|
||
|
. ' IN (SELECT ' . $conn->quoteIdentifier('id')
|
||
|
. ' FROM ' . $conn->quoteIdentifier($this->_table->getTableName())
|
||
|
. ' WHERE keyword = \'\') OR ' . $conn->quoteIdentifier($id)
|
||
|
. ' NOT IN (SELECT ' . $conn->quoteIdentifier('id')
|
||
|
. ' FROM ' . $conn->quoteIdentifier($this->_table->getTableName()) . ')';
|
||
|
|
||
|
$query = $conn->modifyLimitQuery($query, $limit, $offset);
|
||
|
|
||
|
return $conn->fetchAll($query);
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* batchUpdateIndex
|
||
|
*
|
||
|
* @param mixed $limit
|
||
|
* @param mixed $offset
|
||
|
* @return void
|
||
|
*/
|
||
|
public function batchUpdateIndex($limit = null, $offset = null, $encoding = null)
|
||
|
{
|
||
|
$table = $this->_options['table'];
|
||
|
|
||
|
$this->initialize($table);
|
||
|
|
||
|
$id = current($table->getIdentifierColumnNames());
|
||
|
$class = $this->_options['className'];
|
||
|
$fields = $this->_options['fields'];
|
||
|
$conn = $this->_options['connection'];
|
||
|
|
||
|
for ($i = 0; $i < count($fields); $i++) {
|
||
|
$fields[$i] = $table->getColumnName($fields[$i], $fields[$i]);
|
||
|
}
|
||
|
|
||
|
$rows = $this->readTableData($limit, $offset);
|
||
|
|
||
|
$ids = array();
|
||
|
foreach ($rows as $row) {
|
||
|
$ids[] = $row[$id];
|
||
|
}
|
||
|
|
||
|
if (count($ids) > 0)
|
||
|
{
|
||
|
$placeholders = str_repeat('?, ', count($ids));
|
||
|
$placeholders = substr($placeholders, 0, strlen($placeholders) - 2);
|
||
|
|
||
|
$sql = 'DELETE FROM '
|
||
|
. $conn->quoteIdentifier($this->_table->getTableName())
|
||
|
. ' WHERE ' . $conn->quoteIdentifier($table->getIdentifier()) . ' IN (' . substr($placeholders, 0) . ')';
|
||
|
|
||
|
$conn->exec($sql, $ids);
|
||
|
}
|
||
|
|
||
|
foreach ($rows as $row) {
|
||
|
$conn->beginTransaction();
|
||
|
try {
|
||
|
foreach ($fields as $field) {
|
||
|
$data = $row[$field];
|
||
|
|
||
|
$terms = $this->analyze($data, $encoding);
|
||
|
|
||
|
foreach ($terms as $pos => $term) {
|
||
|
$index = new $class();
|
||
|
|
||
|
$index->keyword = $term;
|
||
|
$index->position = $pos;
|
||
|
$index->field = $field;
|
||
|
|
||
|
foreach ((array) $table->getIdentifier() as $identifier) {
|
||
|
$index->$identifier = $row[$table->getColumnName($identifier, $identifier)];
|
||
|
}
|
||
|
|
||
|
$index->save();
|
||
|
}
|
||
|
}
|
||
|
$conn->commit();
|
||
|
} catch (Doctrine_Exception $e) {
|
||
|
$conn->rollback();
|
||
|
throw $e;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/**
|
||
|
* buildDefinition
|
||
|
*
|
||
|
* @return void
|
||
|
*/
|
||
|
public function setTableDefinition()
|
||
|
{
|
||
|
if ( ! isset($this->_options['table'])) {
|
||
|
throw new Doctrine_Record_Exception("Unknown option 'table'.");
|
||
|
}
|
||
|
|
||
|
$componentName = $this->_options['table']->getComponentName();
|
||
|
|
||
|
$className = $this->getOption('className');
|
||
|
|
||
|
$autoLoad = (bool) ($this->_options['generateFiles']);
|
||
|
if (class_exists($className, $autoLoad)) {
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
$columns = array('keyword' => array('type' => 'string',
|
||
|
'length' => 200,
|
||
|
'primary' => true,
|
||
|
),
|
||
|
'field' => array('type' => 'string',
|
||
|
'length' => 50,
|
||
|
'primary' => true),
|
||
|
'position' => array('type' => 'integer',
|
||
|
'length' => 8,
|
||
|
'primary' => true,
|
||
|
));
|
||
|
|
||
|
$this->hasColumns($columns);
|
||
|
}
|
||
|
}
|