/*
* Nucleus: PHP/MySQL Weblog CMS (http://nucleuscms.org/)
- * Copyright (C) 2003-2007 The Nucleus Group
+ * Copyright (C) 2003-2009 The Nucleus Group
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* http://davidaltherr.net/web/php_functions/boolean/funcs.mysql.boolean.txt
*
* @license http://nucleuscms.org/license.txt GNU General Public License
- * @copyright Copyright (C) 2002-2007 The Nucleus Group
- * @version $Id: SEARCH.php,v 1.8 2007-02-04 06:28:46 kimitake Exp $
+ * @copyright Copyright (C) 2002-2011 The Nucleus Group
+ * @version $Id$
* @version $NucleusJP: SEARCH.php,v 1.7 2006/07/20 08:01:52 kimitake Exp $
*/
-
-
class SEARCH {
var $querystring;
var $inclusive;
var $blogs;
-
+ /**
+  * Constructor: normalises the search text and precomputes what the query
+  * builders read later ($this->jpmarked, $this->querystring,
+  * $this->inclusive), then stores the bnumber of every blog with
+  * bincludesearch=1 in $this->blogs.
+  *
+  * @param string $text search text; it is treated as being in the charset
+  *                     named by _CHARSET and is converted to UTF-8 first
+  */
function SEARCH($text) {
global $blogid;
+ // NOTE(review): $blogid is declared global but is not read in this constructor.
// $text = preg_replace ("/[<,>,=,?,!,#,^,(,),[,\],:,;,\\\,%]/","",$text);
+ /* * * for jp * * * * * * * * * * */
+ // Reduce _CHARSET to a lower-case name made only of [a-z0-9-_] for the 'utf-8' comparisons.
+ $this->encoding = strtolower(preg_replace('|[^a-z0-9-_]|i', '', _CHARSET));
+ if ($this->encoding != 'utf-8') {
+ $text = mb_convert_encoding($text, "UTF-8", $this->encoding);
+ }
+ // "\xE3\x80\x80" is U+3000 (ideographic space) in UTF-8; turn it into an ASCII space.
+ $text = str_replace ("\xE3\x80\x80",' ',$text);
+ // Remove the characters < > = ? ! # ^ ( ) [ ] : ; and % from the query.
+ $text = preg_replace ("/[<>=?!#^()[\]:;\\%]/","",$text);
+
+ // Byte-level regex fragments for single-byte, 2-byte and 3-byte UTF-8 sequences;
+ // "two" and "three" are interpolated into the pattern in boolean_inclusive_atoms().
+ $this->ascii = '[\x00-\x7F]';
+ $this->two = '[\xC0-\xDF][\x80-\xBF]';
+ $this->three = '[\xE0-\xEF][\x80-\xBF][\x80-\xBF]';
+
+ $this->jpmarked = $this->boolean_mark_atoms_jp($text);
+ /* * * * * * * * * * * * * * * * */
+ $this->querystring = $text;
+// $this->marked = $this->boolean_mark_atoms($text);
+ $this->inclusive = $this->boolean_inclusive_atoms($text);
+ $this->blogs = array();
- /* * * for jp * * * * * * * * * * */
- $text = str_replace ("\xE3\x80\x80",' ',$text);
- $text = preg_replace ("/[<>=?!#^()[\]:;\\%]/","",$text);
-
- $this->ascii = '[\x00-\x7F]';
- $this->two = '[\xC0-\xDF][\x80-\xBF]';
- $this->three = '[\xE0-\xEF][\x80-\xBF][\x80-\xBF]';
-
- $this->jpmarked = $this->boolean_mark_atoms_jp($text);
- /* * * * * * * * * * * * * * * * */
-
- $this->querystring = $text;
-// $this->marked = $this->boolean_mark_atoms($text);
- $this->inclusive = $this->boolean_inclusive_atoms($text);
- $this->blogs = array();
-
- // get all public searchable blogs, no matter what, include the current blog allways.
- $res = sql_query('SELECT bnumber FROM '.sql_table('blog').' WHERE bincludesearch=1 ');
- while ($obj = mysql_fetch_object($res))
- $this->blogs[] = intval($obj->bnumber);
- }
-
- function boolean_sql_select($match){
-// if (strlen($this->inclusive) > 0) {
- /* build sql for determining score for each record */
-/* $result=explode(" ",$this->inclusive);
- for($cth=0;$cth<count($result);$cth++){
- if(strlen($result[$cth])>=4){
- $stringsum_long .= " $result[$cth] ";
- }else{
- $stringsum_a[] = ' '.$this->boolean_sql_select_short($result[$cth],$match).' ';
- }
- }
-
- if(strlen($stringsum_long)>0){
- $stringsum_long = addslashes($stringsum_long);
- $stringsum_a[] = " match ($match) against ('$stringsum_long') ";
- }
-
- $stringsum .= implode("+",$stringsum_a);
- return $stringsum;
+ // get all public searchable blogs, no matter what, include the current blog always.
+ // NOTE(review): the query below only selects blogs with bincludesearch=1; nothing here adds the current blog explicitly - confirm.
+ $res = sql_query('SELECT bnumber FROM ' . sql_table('blog') . ' WHERE bincludesearch=1 ');
+ while ($obj = sql_fetch_object($res)) {
+ $this->blogs[] = intval($obj->bnumber);
}
-*/ }
+ }
-
+ /**
+  * Build the SQL expression that scores each row for the inclusive atoms
+  * held in $this->inclusive.
+  *
+  * Atoms of four or more bytes are collected into a single
+  * "match (...) against ('...')" term; shorter atoms are scored one by one
+  * through boolean_sql_select_short(). The partial scores are joined with "+".
+  *
+  * @param string $match comma-separated column list, inserted verbatim into the SQL
+  * @return string the score expression, or '' when there is nothing to score
+  */
+ function boolean_sql_select($match) {
+     $score_terms = array();
+     $long_atoms = '';
+
+     foreach (explode(' ', $this->inclusive) as $atom) {
+         // Consecutive spaces in $this->inclusive yield empty atoms. Passing one
+         // on would emit ".../LENGTH('')", a division by zero that turns the
+         // whole score into NULL, so they are skipped.
+         if ($atom === '') {
+             continue;
+         }
+         if (strlen($atom) >= 4) {
+             $long_atoms .= " $atom ";
+         } else {
+             $score_terms[] = ' ' . $this->boolean_sql_select_short($atom, $match) . ' ';
+         }
+     }
+
+     if (strlen($long_atoms) > 0) {
+         $long_atoms = sql_real_escape_string($long_atoms);
+         $score_terms[] = " match ($match) against ('$long_atoms') ";
+     }
+
+     // Always return a string; with no atoms this is '' (falsy, like the
+     // missing return value it replaces).
+     return implode("+", $score_terms);
+ }
- function boolean_inclusive_atoms($string){
- $result=trim($string);
- $result=preg_replace("/([[:space:]]{2,})/",' ',$result);
+
+ /**
+  * Reduce a search string to the space-separated atoms that should count
+  * towards the score: boolean keywords are converted to their short form,
+  * exclusive ("-...") atoms are removed, and "(", ")" and "," become spaces.
+  *
+  * @param string $string search text, expected to be UTF-8 (the result is
+  *                       converted from UTF-8 at the end)
+  * @return string the inclusive atoms, converted to the site charset when
+  *                that charset is not UTF-8
+  */
+ function boolean_inclusive_atoms($string) {
+ $result = trim($string);
+ $result = preg_replace("#([[:space:]]{2,})#", ' ', $result);
+
+ # replaced eregi_replace() below with preg_replace(). ereg* functions are deprecated in PHP 5.3.0
+ # just added delimiters to regex and the 'i' for case-insensitive matching
+
/* convert normal boolean operators to shortened syntax */
- $result=eregi_replace(' not ',' -',$result);
- $result=eregi_replace(' and ',' ',$result);
- $result=eregi_replace(' or ',',',$result);
-
+ $result = preg_replace('# not #i', ' -', $result);
+ $result = preg_replace('# and #i', ' ', $result);
+ $result = preg_replace('# or #i', ',', $result);
+
/* drop unnecessary spaces */
- $result=str_replace(' ,',',',$result);
- $result=str_replace(', ',',',$result);
- $result=str_replace('- ','-',$result);
- $result=str_replace('+','',$result);
-
+ $result = str_replace(' ,', ',', $result);
+ $result = str_replace(', ', ',', $result);
+ $result = str_replace('- ', '-', $result);
+ $result = str_replace('+', '', $result);
+
/* strip exlusive atoms */
- $result=preg_replace(
-// "(\-\([A-Za-z0-9]{1,}[A-Za-z0-9\-\.\_\,]{0,}\))",
- "(\-\(([A-Za-z0-9]|$this->two|$this->three){1,}([A-Za-z0-9\-\.\_\,]|$this->two|$this->three){0,}\))",
- '',
- $result);
-
- $result=preg_replace(
-// "(\-[A-Za-z0-9]{1,}[A-Za-z0-9\-\.\_]{0,})",
- "(\-([A-Za-z0-9]|$this->two|$this->three){1,}([A-Za-z0-9\-\.\_\,]|$this->two|$this->three){0,})",
+ $result = preg_replace(
+ "#\-\(([A-Za-z0-9]|$this->two|$this->three){1,}([A-Za-z0-9\-\.\_\,]|$this->two|$this->three){0,}\)#",
'',
$result);
+
+ # The un-parenthesised form ("-word") must be stripped as well: the pattern
+ # above only matches "-(...)". The trailing class leaves out "," so that in
+ # "-foo,bar" only "-foo" is removed and the OR-ed atom "bar" stays inclusive.
+ $result = preg_replace(
+ "#\-([A-Za-z0-9]|$this->two|$this->three){1,}([A-Za-z0-9\-\.\_]|$this->two|$this->three){0,}#",
+ '',
+ $result);
-
- $result=str_replace('(',' ',$result);
- $result=str_replace(')',' ',$result);
- $result=str_replace(',',' ',$result);
-
+
+ $result = str_replace('(', ' ', $result);
+ $result = str_replace(')', ' ', $result);
+ $result = str_replace(',', ' ', $result);
+ if ($this->encoding != 'utf-8') {
+ $result = mb_convert_encoding($result, $this->encoding, "UTF-8");
+ }
return $result;
}
- function boolean_sql_where($match){
+ /**
+  * Build the SQL WHERE condition for the current search.
+  *
+  * Hands the atoms prepared by the constructor ($this->jpmarked) to
+  * boolean_sql_where_jp_short() and, when the site charset is not UTF-8,
+  * converts the resulting SQL text from UTF-8 to that charset.
+  *
+  * @param string $match comma-separated list of columns to search
+  * @return string the WHERE condition
+  */
+ function boolean_sql_where($match) {
/*
$result = $this->marked;
$result = preg_replace(
"/foo\[\(\'([^\)]{4,})\'\)\]bar/e",
" 'match ('.\$match.') against (\''.\$this->copyvalue(\"$1\").'\') > 0 ' ",
$result);
-
$result = preg_replace(
"/foo\[\(\'([^\)]{1,3})\'\)\]bar/e",
" '('.\$this->boolean_sql_where_short(\"$1\",\"$match\").')' ",
$result);
*/
$result = $this->jpmarked; /* for jp */
- $result = $this->boolean_sql_where_jp_short($result,$match);/* for jp */
+ $result = $this->boolean_sql_where_jp_short($result, $match);/* for jp */
+ if ($this->encoding != 'utf-8') {
+ $result = mb_convert_encoding($result, $this->encoding, "UTF-8");
+ }
return $result;
}
+ /**
+  * Return the argument unchanged.
+  *
+  * The only reference visible nearby is inside the disabled (commented-out)
+  * preg_replace() call in boolean_sql_where().
+  */
function copyvalue($foo) {
return $foo;
}
-
-
/*
function boolean_mark_atoms($string){
$result=trim($string);
$result=preg_replace("/([[:space:]]{2,})/",' ',$result);
- // convert normal boolean operators to shortened syntax
- $result=eregi_replace(' not ',' -',$result);
- $result=eregi_replace(' and ',' ',$result);
- $result=eregi_replace(' or ',',',$result);
+ # replaced eregi_replace() below with preg_replace(). ereg* functions are deprecated in PHP 5.3.0
+ # just added delimiters to regex and the 'i' for case-insensitive matching
+ $result = preg_replace('# not #i', ' -', $result);
+ $result = preg_replace('# and #i', ' ', $result);
+ $result = preg_replace('# or #i', ',', $result);
// strip excessive whitespace
$result=str_replace('( ','(',$result);
// remove double spaces (we might have introduced some new ones above)
$result=trim($result);
- $result=preg_replace("/([[:space:]]{2,})/",' ',$result);
+ $result=preg_replace("#([[:space:]]{2,})#",' ',$result);
- // apply arbitrary function to all 'word' atoms
+ // apply arbitrary function to all 'word' atoms
- $result_a = explode(" ",$result);
- for($word=0;$word<count($result_a);$word++){
+ $result_a = explode(' ',$result);
+ for($word=0;$word<count($result_a);$word++)
+ {
$result_a[$word] = "foo[('".$result_a[$word]."')]bar";
}
$result = implode(" ",$result_a);
return $like;
}
- function boolean_sql_select_short($string,$match){
- $match_a = explode(',',$match);
+*/
+
+ /**
+  * Build the SQL score expression for one short search atom.
+  *
+  * For every column in $match it emits
+  *   .2 * (LENGTH(col) - LENGTH(REPLACE(LOWER(col), LOWER(atom), ''))) / LENGTH(atom)
+  * i.e. .2 times the number of case-insensitive occurrences of the atom in
+  * that column, and joins the per-column terms with " + ".
+  *
+  * @param string $string the search atom; an empty atom makes the generated
+  *                       SQL divide by LENGTH('')
+  * @param string $match  comma-separated column list
+  * @return string SQL score expression
+  */
+ function boolean_sql_select_short($string, $match) {
+ $match_a = explode(',', $match);
$score_unit_weight = .2;
- for($ith=0;$ith<count($match_a);$ith++){
+ for ($ith = 0; $ith< count($match_a); $ith++){
$score_a[$ith] =
- " $score_unit_weight*(
- LENGTH(" . addslashes($match_a[$ith]) . ") -
- LENGTH(REPLACE(LOWER(" . addslashes($match_a[$ith]) . "),LOWER('" . addslashes($string) . "'),'')))
- /LENGTH('" . addslashes($string) . "') ";
+ " $score_unit_weight*(
+ LENGTH(" . sql_real_escape_string($match_a[$ith]) . ") -
+ LENGTH(REPLACE(LOWER(" . sql_real_escape_string($match_a[$ith]) . "),LOWER('" . sql_real_escape_string($string) . "'),'')))
+ /LENGTH('" . sql_real_escape_string($string) . "') ";
}
- $score = implode(" + ",$score_a);
+ $score = implode(" + ", $score_a);
return $score;
}
-*/
/***********************************************
- Make "WHERE" (jp)
+ Make "WHERE" (jp)
***********************************************/
- function boolean_mark_atoms_jp($string){
-
- $result=trim($string);
- $result=preg_replace("/([[:space:]]{2,})/",' ',$result);
-
- /* convert normal boolean operators to shortened syntax */
- $result=eregi_replace(' not ',' -',$result);
- $result=eregi_replace(' and ',' ',$result);
- $result=eregi_replace(' or ',',',$result);
-
- /* strip excessive whitespace */
- $result=str_replace(', ',',',$result);
- $result=str_replace(' ,',',',$result);
- $result=str_replace('- ','-',$result);
- $result=str_replace('+','',$result);
-
- $result=str_replace(',',' ,',$result);
-
- return $result;
- }
-
-
- function boolean_sql_where_jp_short($string,$match){
- $match_a = explode(',',$match);
- $key_a = explode(' ',$string);
-
- for($ith=0;$ith<count($match_a);$ith++){
- $temp_a[$ith] = "(i.$match_a[$ith] LIKE '%" . addslashes($key_a[0]) . "%') ";
- }
- $like = '('.implode(' or ',$temp_a).')';
-
- for($kn=1; $kn<count($key_a); $kn++){
- if(substr($key_a[$kn],0,1) == ","){
- for($ith=0;$ith<count($match_a);$ith++){
- $temp_a[$ith] = " (i.$match_a[$ith] LIKE '%" . addslashes(substr($key_a[$kn],1)) . "%') ";
- }
- $like .=' OR ('. implode(' or ',$temp_a).')';
- }elseif(substr($key_a[$kn],0,1) != '-'){
- for($ith=0;$ith<count($match_a);$ith++){
- $temp_a[$ith] = " (i.$match_a[$ith] LIKE '%" . addslashes($key_a[$kn]) . "%') ";
- }
- $like .=' AND ('. implode(' or ',$temp_a).')';
- }else{
- for($ith=0;$ith<count($match_a);$ith++){
- $temp_a[$ith] = " NOT(i.$match_a[$ith] LIKE '%" . addslashes(substr($key_a[$kn],1)) . "%') ";
- }
- $like .=' AND ('. implode(' and ',$temp_a).')';
- }
- }
-
- $like = '('.$like.')';
- return $like;
- }
-
-/***********************************************/
+ /**
+  * Normalise a search string into the atom list consumed by
+  * boolean_sql_where_jp_short(): atoms are separated by single spaces,
+  * " not " becomes a "-" prefix on the next atom, " and " becomes a space,
+  * and " or " becomes a "," prefix on the next atom.
+  *
+  * @param string $string search text
+  * @return string normalised atom string
+  */
+ function boolean_mark_atoms_jp($string) {
+     $atoms = trim($string);
+     $atoms = preg_replace("/([[:space:]]{2,})/", ' ', $atoms);
+
+     /* convert normal boolean operators to shortened syntax */
+     // preg_replace() with the 'i' modifier stands in for eregi_replace(),
+     // which is deprecated as of PHP 5.3 and removed in PHP 7; this matches
+     // what boolean_inclusive_atoms() already does.
+     $atoms = preg_replace('# not #i', ' -', $atoms);
+     $atoms = preg_replace('# and #i', ' ', $atoms);
+     $atoms = preg_replace('# or #i', ',', $atoms);
+
+     /* strip excessive whitespace */
+     $atoms = str_replace(', ', ',', $atoms);
+     $atoms = str_replace(' ,', ',', $atoms);
+     $atoms = str_replace('- ', '-', $atoms);
+     $atoms = str_replace('+', '', $atoms);
+     // put a space in front of every "," so that explode(' ') yields ",atom" tokens
+     $atoms = str_replace(',', ' ,', $atoms);
+
+     return $atoms;
+ }
+
+ /**
+  * Build the LIKE-based WHERE condition from the atom string produced by
+  * boolean_mark_atoms_jp().
+  *
+  * The first atom is always a plain inclusive term. Each later atom is
+  * combined according to its prefix: ",atom" is OR-ed in, "-atom" is AND-ed
+  * in as a NOT LIKE on every column, and an unprefixed atom is AND-ed in.
+  *
+  * @param string $string space-separated atoms
+  * @param string $match  comma-separated column names (referenced as i.<column>)
+  * @return string parenthesised SQL condition
+  */
+ function boolean_sql_where_jp_short($string, $match) {
+     $match_a = explode(',', $match);
+     $key_a = explode(' ', $string);
+
+     $like = $this->_jp_like_group($key_a[0], $match_a, false);
+
+     for ($kn = 1; $kn < count($key_a); $kn++) {
+         $atom = $key_a[$kn];
+         $prefix = substr($atom, 0, 1);
+         $has_operator = ($prefix == ',' || $prefix == '-');
+         $term = $has_operator ? (string) substr($atom, 1) : $atom;
+
+         // A bare "," or "-" (or an empty atom) would produce LIKE '%%', which
+         // ORs in every row or ANDs "NOT everything"; ignore such atoms.
+         if ($term === '') {
+             continue;
+         }
+
+         if ($prefix == ',') {
+             $like .= ' OR ' . $this->_jp_like_group($term, $match_a, false);
+         } elseif ($prefix == '-') {
+             $like .= ' AND ' . $this->_jp_like_group($term, $match_a, true);
+         } else {
+             $like .= ' AND ' . $this->_jp_like_group($term, $match_a, false);
+         }
+     }
+
+     return '(' . $like . ')';
+ }
+
+ /**
+  * Helper for boolean_sql_where_jp_short(): one parenthesised group testing
+  * $term against every column, joined with "or" (or with "and" when negated).
+  *
+  * @param string $term    search term without operator prefix
+  * @param array  $match_a column names
+  * @param bool   $negate  true to emit NOT(... LIKE ...) clauses
+  * @return string SQL group
+  */
+ function _jp_like_group($term, $match_a, $negate) {
+     // LIKE BINARY is used only when the term contains no ASCII letter.
+     $binKey = preg_match('/[a-zA-Z]/', $term) ? '' : 'BINARY';
+     $escaped = sql_real_escape_string($term);
+
+     $clauses = array();
+     foreach ($match_a as $column) {
+         $clauses[] = ($negate ? ' NOT' : ' ') . "(i.$column LIKE " . $binKey . " '%" . $escaped . "%') ";
+     }
+
+     return '(' . implode($negate ? ' and ' : ' or ', $clauses) . ')';
+ }
}
-?>
+?>
\ No newline at end of file