157 lines
5.2 KiB
PHP
157 lines
5.2 KiB
PHP
<?php
|
|
|
|
//
|
|
// $Id: test.php 1103 2008-01-24 18:42:57Z shodan $
|
|
//
|
|
|
|
require ( "sphinxapi.php" );
|
|
|
|
//////////////////////
|
|
// parse command line
|
|
//////////////////////
|
|
|
|
// for very old PHP versions, like at my home test server
|
|
if ( is_array($argv) && !isset($_SERVER["argv"]) )
|
|
$_SERVER["argv"] = $argv;
|
|
unset ( $_SERVER["argv"][0] );
|
|
|
|
// build query
|
|
if ( !is_array($_SERVER["argv"]) || empty($_SERVER["argv"]) )
|
|
{
|
|
print ( "Usage: php -f test.php [OPTIONS] query words\n\n" );
|
|
print ( "Options are:\n" );
|
|
print ( "-h, --host <HOST>\tconnect to searchd at host HOST\n" );
|
|
print ( "-p, --port\t\tconnect to searchd at port PORT\n" );
|
|
print ( "-i, --index <IDX>\tsearch through index(es) specified by IDX\n" );
|
|
print ( "-s, --sortby <CLAUSE>\tsort matches by 'CLAUSE' in sort_extended mode\n" );
|
|
print ( "-S, --sortexpr <EXPR>\tsort matches by 'EXPR' DESC in sort_expr mode\n" );
|
|
print ( "-a, --any\t\tuse 'match any word' matching mode\n" );
|
|
print ( "-b, --boolean\t\tuse 'boolean query' matching mode\n" );
|
|
print ( "-e, --extended\t\tuse 'extended query' matching mode\n" );
|
|
print ( "-ph,--phrase\t\tuse 'exact phrase' matching mode\n" );
|
|
print ( "-f, --filter <ATTR>\tfilter by attribute 'ATTR' (default is 'group_id')\n" );
|
|
print ( "-v, --value <VAL>\tadd VAL to allowed 'group_id' values list\n" );
|
|
print ( "-g, --groupby <EXPR>\tgroup matches by 'EXPR'\n" );
|
|
print ( "-gs,--groupsort <EXPR>\tsort groups by 'EXPR'\n" );
|
|
print ( "-d, --distinct <ATTR>\tcount distinct values of 'ATTR''\n" );
|
|
print ( "-l, --limit <COUNT>\tretrieve COUNT matches (default: 20)\n" );
|
|
exit;
|
|
}
|
|
|
|
$args = array();
|
|
foreach ( $_SERVER["argv"] as $arg )
|
|
$args[] = $arg;
|
|
|
|
$q = "";
|
|
$mode = SPH_MATCH_ALL;
|
|
$host = "localhost";
|
|
$port = 3312;
|
|
$index = "*";
|
|
$groupby = "";
|
|
$groupsort = "@group desc";
|
|
$filter = "group_id";
|
|
$filtervals = array();
|
|
$distinct = "";
|
|
$sortby = "";
|
|
$limit = 20;
|
|
$ranker = SPH_RANK_PROXIMITY_BM25;
|
|
for ( $i=0; $i<count($args); $i++ )
|
|
{
|
|
$arg = $args[$i];
|
|
|
|
if ( $arg=="-h" || $arg=="--host" ) $host = $args[++$i];
|
|
else if ( $arg=="-p" || $arg=="--port" ) $port = (int)$args[++$i];
|
|
else if ( $arg=="-i" || $arg=="--index" ) $index = $args[++$i];
|
|
else if ( $arg=="-s" || $arg=="--sortby" ) { $sortby = $args[++$i]; $sortexpr = ""; }
|
|
else if ( $arg=="-S" || $arg=="--sortexpr" ) { $sortexpr = $args[++$i]; $sortby = ""; }
|
|
else if ( $arg=="-a" || $arg=="--any" ) $mode = SPH_MATCH_ANY;
|
|
else if ( $arg=="-b" || $arg=="--boolean" ) $mode = SPH_MATCH_BOOLEAN;
|
|
else if ( $arg=="-e" || $arg=="--extended" ) $mode = SPH_MATCH_EXTENDED;
|
|
else if ( $arg=="-e2" ) $mode = SPH_MATCH_EXTENDED2;
|
|
else if ( $arg=="-ph"|| $arg=="--phrase" ) $mode = SPH_MATCH_PHRASE;
|
|
else if ( $arg=="-f" || $arg=="--filter" ) $filter = $args[++$i];
|
|
else if ( $arg=="-v" || $arg=="--value" ) $filtervals[] = $args[++$i];
|
|
else if ( $arg=="-g" || $arg=="--groupby" ) $groupby = $args[++$i];
|
|
else if ( $arg=="-gs"|| $arg=="--groupsort" ) $groupsort = $args[++$i];
|
|
else if ( $arg=="-d" || $arg=="--distinct" ) $distinct = $args[++$i];
|
|
else if ( $arg=="-l" || $arg=="--limit" ) $limit = (int)$args[++$i];
|
|
else if ( $arg=="-r" )
|
|
{
|
|
$arg = strtolower($args[++$i]);
|
|
if ( $arg=="bm25" ) $ranker = SPH_RANK_BM25;
|
|
if ( $arg=="none" ) $ranker = SPH_RANK_NONE;
|
|
if ( $arg=="wordcount" )$ranker = SPH_RANK_WORDCOUNT;
|
|
}
|
|
else
|
|
$q .= $args[$i] . " ";
|
|
}
|
|
|
|
////////////
|
|
// do query
|
|
////////////
|
|
|
|
$cl = new SphinxClient ();
|
|
$cl->SetServer ( $host, $port );
|
|
$cl->SetWeights ( array ( 100, 1 ) );
|
|
$cl->SetMatchMode ( $mode );
|
|
if ( count($filtervals) ) $cl->SetFilter ( $filter, $filtervals );
|
|
if ( $groupby ) $cl->SetGroupBy ( $groupby, SPH_GROUPBY_ATTR, $groupsort );
|
|
if ( $sortby ) $cl->SetSortMode ( SPH_SORT_EXTENDED, $sortby );
|
|
if ( $sortexpr ) $cl->SetSortMode ( SPH_SORT_EXPR, $sortexpr );
|
|
if ( $distinct ) $cl->SetGroupDistinct ( $distinct );
|
|
if ( $limit ) $cl->SetLimits ( 0, $limit, ( $limit>1000 ) ? $limit : 1000 );
|
|
$cl->SetRankingMode ( $ranker );
|
|
$cl->SetArrayResult ( true );
|
|
$res = $cl->Query ( $q, $index );
|
|
|
|
////////////////
|
|
// print me out
|
|
////////////////
|
|
|
|
if ( $res===false )
|
|
{
|
|
print "Query failed: " . $cl->GetLastError() . ".\n";
|
|
|
|
} else
|
|
{
|
|
if ( $cl->GetLastWarning() )
|
|
print "WARNING: " . $cl->GetLastWarning() . "\n\n";
|
|
|
|
print "Query '$q' retrieved $res[total] of $res[total_found] matches in $res[time] sec.\n";
|
|
print "Query stats:\n";
|
|
if ( is_array($res["words"]) )
|
|
foreach ( $res["words"] as $word => $info )
|
|
print " '$word' found $info[hits] times in $info[docs] documents\n";
|
|
print "\n";
|
|
|
|
if ( is_array($res["matches"]) )
|
|
{
|
|
$n = 1;
|
|
print "Matches:\n";
|
|
foreach ( $res["matches"] as $docinfo )
|
|
{
|
|
print "$n. doc_id=$docinfo[id], weight=$docinfo[weight]";
|
|
foreach ( $res["attrs"] as $attrname => $attrtype )
|
|
{
|
|
$value = $docinfo["attrs"][$attrname];
|
|
if ( $attrtype & SPH_ATTR_MULTI )
|
|
{
|
|
$value = "(" . join ( ",", $value ) .")";
|
|
} else
|
|
{
|
|
if ( $attrtype==SPH_ATTR_TIMESTAMP )
|
|
$value = date ( "Y-m-d H:i:s", $value );
|
|
}
|
|
print ", $attrname=$value";
|
|
}
|
|
print "\n";
|
|
$n++;
|
|
}
|
|
}
|
|
}
|
|
|
|
//
|
|
// $Id: test.php 1103 2008-01-24 18:42:57Z shodan $
|
|
//
|
|
|
|
?>
|