From 2e8d866b9d36d1d84dde4dd7a88f650ad6a4262c Mon Sep 17 00:00:00 2001 From: Domas Mituzas Date: Thu, 25 Nov 2004 14:20:35 +0000 Subject: [PATCH] PostgreSQL/Tsearch2 full-text-index initial support --- includes/SearchTsearch2.php | 85 +++++++++++++++++++++++++++++++++++++ includes/SpecialSearch.php | 3 ++ 2 files changed, 88 insertions(+) create mode 100644 includes/SearchTsearch2.php diff --git a/includes/SearchTsearch2.php b/includes/SearchTsearch2.php new file mode 100644 index 0000000000..53b9523442 --- /dev/null +++ b/includes/SearchTsearch2.php @@ -0,0 +1,85 @@ +, Domas Mituzas +# http://www.mediawiki.org/ +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. +# http://www.gnu.org/copyleft/gpl.html + +/** + * Search engine hook for PostgreSQL / Tsearch2 + * @package MediaWiki + * @subpackage Search + */ + +require_once( 'SearchEngine.php' ); + +class SearchTsearch2 extends SearchEngine { + var $strictMatching = false; + + function SearchTsearch2( &$db ) { + $this->db =& $db; + $this->db->setSchema('tsearch'); + } + + function getIndexField( $fulltext ) { + return $fulltext ? 'si_text' : 'si_title'; + } + + function parseQuery( $filteredText, $fulltext ) { + global $wgContLang; + $lc = SearchEngine::legalSearchChars(); + $searchon = ''; + $this->searchTerms = array(); + + # FIXME: This doesn't handle parenthetical expressions. + if( preg_match_all( '/([-+<>~]?)(([' . $lc . ']+)(\*?)|"[^"]*")/', + $filteredText, $m, PREG_SET_ORDER ) ) { + foreach( $m as $terms ) { + if( $searchon !== '' ) $searchon .= ' '; + if( $this->strictMatching && ($terms[1] == '') ) { + $terms[1] = '+'; + } + $searchon .= $terms[1] . $wgContLang->stripForSearch( $terms[2] ); + if( !empty( $terms[3] ) ) { + $regexp = preg_quote( $terms[3], '/' ); + if( $terms[4] ) $regexp .= "[0-9A-Za-z_]+"; + } else { + $regexp = preg_quote( str_replace( '"', '', $terms[2] ), '/' ); + } + $this->searchTerms[] = $regexp; + } + wfDebug( "Would search with '$searchon'\n" ); + wfDebug( "Match with /\b" . implode( '\b|\b', $this->searchTerms ) . "\b/\n" ); + } else { + wfDebug( "Can't understand search query '{$this->filteredText}'\n" ); + } + + $searchon = preg_replace('/(\s+)/','&',$searchon); + $searchon = $this->db->strencode( $searchon ); + $field = $this->getIndexField( $fulltext ); + return " $field @@ to_tsquery('$searchon')"; + } + + function queryMain( $filteredTerm, $fulltext ) { + $match = $this->parseQuery( $filteredTerm, $fulltext ); + $cur = $this->db->tableName( 'cur' ); + $searchindex = $this->db->tableName( 'searchindex' ); + return 'SELECT cur_id, cur_namespace, cur_title, cur_text ' . + "FROM $cur,$searchindex " . + 'WHERE cur_id=si_page AND ' . $match; + } +} + +?> diff --git a/includes/SpecialSearch.php b/includes/SpecialSearch.php index f3fa3e615c..d390fb3579 100644 --- a/includes/SpecialSearch.php +++ b/includes/SpecialSearch.php @@ -220,6 +220,9 @@ class SpecialSearch { $class = 'SearchMysql3'; require_once( 'SearchMySQL3.php' ); } + } else if ( $wgDBtype == 'PostgreSQL' ) { + $class = 'SearchTsearch2'; + require_once( 'SearchTsearch2.php' ); } else { $class = 'SearchEngineDummy'; } -- 2.20.1