<?php

/*
 * Nucleus: PHP/MySQL Weblog CMS (http://nucleuscms.org/)
 * Copyright (C) 2003-2007 The Nucleus Group
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 * (see nucleus/documentation/index.html#license for more info)
 */
/**
 * SEARCH(querystring) turns a boolean search string into SQL fragments
 * that can be used to find items (and comments).
 *
 * Recognised operators, matched case-insensitively when surrounded by
 * spaces: "and" (same as a plain space), "or" (same as a comma) and
 * "not" (same as a leading minus sign).
 *
 * This is the Japanese variant: full-width spaces are converted to ASCII
 * spaces and the WHERE clause is built from plain LIKE comparisons.
 * NOTE(review): the byte ranges used below look like EUC-JP; confirm the
 * encoding the caller actually passes in.
 *
 * based on code by David Altherr:
 * http://www.evolt.org/article/Boolean_Fulltext_Searching_with_PHP_and_MySQL/18/15665/
 * http://davidaltherr.net/web/php_functions/boolean/funcs.mysql.boolean.txt
 *
 * @license http://nucleuscms.org/license.txt GNU General Public License
 * @copyright Copyright (C) 2002-2007 The Nucleus Group
 * @version $Id: SEARCH.php,v 1.6 2007-03-27 12:13:56 kimitake Exp $
 * @version $NucleusJP: SEARCH.php,v 1.8 2007/02/04 06:28:46 kimitake Exp $
 */
class SEARCH {

    /** Cleaned-up query text (after space conversion and character stripping). */
    var $querystring;

    /** Never assigned by this class; kept so existing readers of the property still work. */
    var $marked;

    /** Query text reduced to its non-excluded atoms, separated by spaces. */
    var $inclusive;

    /** Blog numbers (integers) of every blog flagged bincludesearch=1. */
    var $blogs;

    /** Query in shorthand form ("a b ,c -d") as consumed by boolean_sql_where(). */
    var $jpmarked;

    /** PCRE fragment matching one single-byte character. */
    var $ascii = '[\x00-\x7F]';

    /** PCRE fragment matching one two-byte character. */
    var $two = '[\x8E\xA1-\xFE][\xA1-\xFE]';

    /** PCRE fragment matching one three-byte character. */
    var $three = '\x8F[\xA1-\xFE][\xA1-\xFE]';

    /**
     * Parses the query and loads the list of searchable blogs.
     *
     * @param string $text raw query string as entered by the visitor
     */
    function __construct($text) {
        $text = $this->zenspace_replace($text);
        // Strips < > = ? ! # ^ ( ) [ ] : ; and % from the query.
        $text = preg_replace("/[<>=?!#^()[\]:;\\%]/", "", $text);

        $this->jpmarked    = $this->boolean_mark_atoms_jp($text);
        $this->querystring = $text;
        $this->inclusive   = $this->boolean_inclusive_atoms($text);
        $this->blogs       = array();

        // Collect every blog that is flagged as searchable.
        // NOTE(review): mysql_fetch_object() needs ext/mysql, which was removed
        // in PHP 7; switch to the project's own fetch wrapper if one exists.
        $res = sql_query('SELECT bnumber FROM '.sql_table('blog').' WHERE bincludesearch=1 ');
        if ($res) {
            while ($obj = mysql_fetch_object($res)) {
                $this->blogs[] = intval($obj->bnumber);
            }
        }
    }

    /**
     * PHP 4 style constructor, kept for callers that invoke it explicitly.
     * PHP 8 no longer treats a method named after the class as the
     * constructor, so the real work lives in __construct().
     *
     * @param string $text raw query string
     */
    function SEARCH($text) {
        $this->__construct($text);
    }

    /**
     * Converts full-width (zenkaku) spaces, byte pair A1 A1, to ASCII spaces.
     *
     * The string is walked character by character so that the pair is only
     * replaced when it forms a complete two-byte character, never when it
     * straddles two neighbouring characters.
     *
     * @param string $text input bytes
     * @return string the text with every full-width space replaced by " "
     */
    function zenspace_replace($text) {
        $text   = (string) $text;
        $length = strlen($text);
        $out    = '';
        $pos    = 0;

        while ($pos < $length) {
            $lead = ord($text[$pos]);

            if ($lead < 0x8e) {
                // single-byte character
                $out .= $text[$pos];
                $pos++;
                continue;
            }

            // Lead byte 0x8E or above 0xA0 starts a two-byte character;
            // anything else in 0x8F..0xA0 is treated as a three-byte one.
            $width = ($lead > 0xa0 || $lead < 0x8f) ? 2 : 3;

            // substr() returns only the bytes that exist, so a character
            // truncated at the end of the input is copied as-is.
            $char = substr($text, $pos, $width);
            if ($char === "\xA1\xA1") {
                $char = "\x20";
            }
            $out .= $char;
            $pos += $width;
        }

        return $out;
    }

    /**
     * Relevance-score expression for the SELECT list.
     *
     * Scoring is disabled in this variant, so nothing is returned.
     *
     * @param string $match comma-separated column names (unused)
     * @return null
     */
    function boolean_sql_select($match) {
        return null;
    }

    /**
     * Reduces a query to the atoms that must or may be present.
     *
     * Excluded atoms ("-word" and "-(group)") are dropped; parentheses and
     * commas are turned into spaces.
     *
     * @param string $string query string
     * @return string remaining atoms, separated by spaces
     */
    function boolean_inclusive_atoms($string) {
        $result = $this->_normalize_operators($string);

        /* drop unnecessary spaces (replacements are applied in order) */
        $result = str_replace(
            array(' ,', ', ', '- ', '+'),
            array(',',  ',',  '-',  ''),
            $result
        );

        /* strip exclusive atoms */
        $first = '(?:[A-Za-z0-9]|' . $this->two . '|' . $this->three . ')';
        $rest  = '(?:[A-Za-z0-9\-\.\_\,]|' . $this->two . '|' . $this->three . ')';
        $result = preg_replace('/\-\(' . $first . '+' . $rest . '*\)/', '', $result);
        $result = preg_replace('/\-' . $first . '+' . $rest . '*/', '', $result);

        return str_replace(array('(', ')', ','), ' ', $result);
    }

    /**
     * Builds the WHERE condition for the parsed query.
     *
     * @param string $match comma-separated column names of the table aliased "i"
     * @return string parenthesised SQL condition
     */
    function boolean_sql_where($match) {
        return $this->boolean_sql_where_jp_short($this->jpmarked, $match);
    }

    /**
     * Returns its argument unchanged.
     *
     * @param mixed $foo any value
     * @return mixed the same value
     */
    function copyvalue($foo) {
        return $foo;
    }

    /**
     * Rewrites a query into the shorthand form used to build the WHERE clause.
     *
     * In the result atoms are separated by single spaces, an atom starting
     * with "," is OR-ed and an atom starting with "-" is excluded.
     *
     * @param string $string query string
     * @return string shorthand query, e.g. "foo bar ,baz -qux"
     */
    function boolean_mark_atoms_jp($string) {
        $result = $this->_normalize_operators($string);

        /* strip excessive whitespace (replacements are applied in order) */
        $result = str_replace(
            array(', ', ' ,', '- ', '+'),
            array(',',  ',',  '-',  ''),
            $result
        );

        // Put a space in front of every comma so that explode(' ') yields
        // OR-atoms that start with ",".
        return str_replace(',', ' ,', $result);
    }

    /**
     * Turns a shorthand query into a LIKE-based SQL condition.
     *
     * The first atom opens the condition. Every following atom is appended
     * as " OR (...)" when it starts with ",", as " AND (NOT ...)" when it
     * starts with "-", and as " AND (...)" otherwise.
     *
     * NOTE(review): keywords are escaped with addslashes() only. It is not
     * charset-aware and does not escape the LIKE wildcards % and _.
     *
     * @param string $string shorthand query from boolean_mark_atoms_jp()
     * @param string $match comma-separated column names of the table aliased "i"
     * @return string parenthesised SQL condition
     */
    function boolean_sql_where_jp_short($string, $match) {
        $columns = explode(',', $match);
        $atoms   = explode(' ', $string);

        $like = $this->_jp_like_group($columns, $atoms[0], '(', ' or ');

        $total = count($atoms);
        for ($n = 1; $n < $total; $n++) {
            $atom   = $atoms[$n];
            $marker = substr($atom, 0, 1);

            if ($marker == ',') {
                $like .= ' OR ' . $this->_jp_like_group($columns, substr($atom, 1), ' (', ' or ');
            } elseif ($marker != '-') {
                $like .= ' AND ' . $this->_jp_like_group($columns, $atom, ' (', ' or ');
            } else {
                // an excluded keyword must be absent from every column
                $like .= ' AND ' . $this->_jp_like_group($columns, substr($atom, 1), ' NOT(', ' and ');
            }
        }

        return '(' . $like . ')';
    }

    /**
     * Shared first step of both atom parsers: trims the query, collapses
     * runs of whitespace and converts the word operators to shorthand.
     *
     * @param string $string query string
     * @return string query with " not " => " -", " and " => " ", " or " => ","
     */
    function _normalize_operators($string) {
        $result = trim($string);
        $result = preg_replace("/([[:space:]]{2,})/", ' ', $result);

        /* convert normal boolean operators to shortened syntax */
        $result = preg_replace('/ not /i', ' -', $result);
        $result = preg_replace('/ and /i', ' ', $result);
        $result = preg_replace('/ or /i', ',', $result);

        return $result;
    }

    /**
     * Builds one parenthesised group with a LIKE test per column.
     *
     * @param array  $columns column names of the table aliased "i"
     * @param string $keyword keyword to look for (escaped here)
     * @param string $open    text placed before each column test
     * @param string $glue    text joining the column tests
     * @return string SQL group, e.g. "( (i.a LIKE '%x%')  or  (i.b LIKE '%x%') )"
     */
    function _jp_like_group($columns, $keyword, $open, $glue) {
        $escaped = addslashes($keyword);
        $terms   = array();
        foreach ($columns as $column) {
            $terms[] = $open . "i.$column LIKE '%" . $escaped . "%') ";
        }
        return '(' . implode($glue, $terms) . ')';
    }

}
?>