Skip to content
Snippets Groups Projects
Commit 4efb9a42 authored by Andreas Gohr's avatar Andreas Gohr
Browse files

fixed stupid bug in search query parser

darcs-hash:20060618134515-7ad00-3097e310ccdaf793b5da3bd49a54723fea7ec260.gz
parent 377f9e97
No related branches found
No related tags found
No related merge requests found
<?php
// use no mbstring help here
if(!defined('UTF8_NOMBSTRING')) define('UTF8_NOMBSTRING',1);
require_once DOKU_INC.'inc/utf8.php';
class utf8_stripspecials extends UnitTestCase {
function test1(){
// we test multiple cases here - format: string, repl, additional, test
$tests = array();
$tests[] = array('asciistring','','','asciistring');
$tests[] = array('asciistring','','\._\-:','asciistring');
$tests[] = array('ascii.string','','\._\-:','asciistring');
$tests[] = array('ascii.string',' ','\._\-:','ascii string');
$tests[] = array('2.1.14',' ','\._\-:','2 1 14');
$tests[] = array('ascii.string','','\._\-:\*','asciistring');
$tests[] = array('ascii.string',' ','\._\-:\*','ascii string');
$tests[] = array('2.1.14',' ','\._\-:\*','2 1 14');
foreach($tests as $test){
$this->assertEqual(utf8_stripspecials($test[0],$test[1],$test[2]),$test[3]);
}
}
}
//Setup VIM: ex: et ts=4 enc=utf-8 :
......@@ -357,14 +357,14 @@ function idx_parseIndexLine(&$page_idx,$line){
*/
function idx_tokenizer($string,&$stopwords,$wc=false){
$words = array();
if(!$wc) $wc = '\*';
$wc = ($wc) ? '' : $wc = '\*';
if(preg_match('/[^0-9A-Za-z]/u', $string)){
// handle asian chars as single words (may fail on older PHP version)
$asia = @preg_replace('/('.IDX_ASIAN.')/u','\1 ',$string);
if(!is_null($asia)) $string = $asia; //recover from regexp failure
$arr = explode(' ', utf8_stripspecials($string,' ','._\-:'.$wc));
$arr = explode(' ', utf8_stripspecials($string,' ','\._\-:'.$wc));
foreach ($arr as $w) {
if (!is_numeric($w) && strlen($w) < 3) continue;
$w = utf8_strtolower($w);
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment