| 1 | <?php
 | 
  
    | 2 | 
 | 
  
    | 3 | // $Id: search_convert.php 881 2008-11-22 15:51:23Z thorn $
 | 
  
    | 4 | 
 | 
  
    | 5 | /*
 | 
  
    | 6 | 
 | 
  
    | 7 |  Website Baker Project <http://www.websitebaker.org/>
 | 
  
    | 8 |  Copyright (C) 2004-2008, Ryan Djurovich
 | 
  
    | 9 | 
 | 
  
    | 10 |  Website Baker is free software; you can redistribute it and/or modify
 | 
  
    | 11 |  it under the terms of the GNU General Public License as published by
 | 
  
    | 12 |  the Free Software Foundation; either version 2 of the License, or
 | 
  
    | 13 |  (at your option) any later version.
 | 
  
    | 14 | 
 | 
  
    | 15 |  Website Baker is distributed in the hope that it will be useful,
 | 
  
    | 16 |  but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
  
    | 17 |  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
  
    | 18 |  GNU General Public License for more details.
 | 
  
    | 19 | 
 | 
  
    | 20 |  You should have received a copy of the GNU General Public License
 | 
  
    | 21 |  along with Website Baker; if not, write to the Free Software
 | 
  
    | 22 |  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 | 
  
    | 23 | 
 | 
  
    | 24 | */
 | 
  
    | 25 | 
 | 
  
    | 26 | /*
 | 
  
    | 27 | Character Conversion file
 | 
  
    | 28 | for search-/highlighting-related character-translations
 | 
  
    | 29 | */
 | 
  
    | 30 | 
 | 
  
    | 31 | if(!defined('WB_URL')) {
 | 
  
    | 32 | 	header('Location: ../index.php');
 | 
  
    | 33 | 	exit(0);
 | 
  
    | 34 | }
 | 
  
    | 35 | if(!isset($search_lang)) $search_lang = LANGUAGE;
 | 
  
    | 36 | 
 | 
  
    | 37 | // umlaut to '(upper|lower)' for preg_match()
 | 
  
    | 38 | // this is UTF-8-encoded
 | 
  
    | 39 | // there is no need for a translation-table anymore since we use u-switch (utf-8) for preg-functions
 | 
  
    | 40 | // remember that we use the i-switch, too. [No need for (ae|Ae)]
 | 
  
    | 41 | 
 | 
  
    | 42 | $string_ul_umlaut = array();
 | 
  
    | 43 | $string_ul_regex = array();
 | 
  
    | 44 | 
 | 
  
    | 45 | // but add some national stuff
 | 
  
    | 46 | if($search_lang=='DE') { // add special handling for german umlauts (ä==ae, ...)
 | 
  
    | 47 | 	$string_ul_umlaut_add = array(
 | 
  
    | 48 | 		"\xc3\x9f", // german SZ-Ligatur
 | 
  
    | 49 | 		"\xc3\xa4", // german ae
 | 
  
    | 50 | 		"\xc3\xb6", // german oe
 | 
  
    | 51 | 		"\xc3\xbc", // german ue
 | 
  
    | 52 | 		"\xc3\x84", // german Ae
 | 
  
    | 53 | 		"\xc3\x96", // german Oe
 | 
  
    | 54 | 		"\xc3\x9c", // german Ue
 | 
  
    | 55 | 		// these are not that usual
 | 
  
    | 56 | 		"\xEF\xAC\x84", // german ffl-ligatur
 | 
  
    | 57 | 		"ffl",          // german ffl-ligatur
 | 
  
    | 58 | 		"\xEF\xAC\x83", // german ffi-ligatur
 | 
  
    | 59 | 		"ffi",          // german ffi-ligatur
 | 
  
    | 60 | 		"0xEF\xAC\x80", // german ff-Ligatur
 | 
  
    | 61 | 		"ff",           // german ff-Ligatur
 | 
  
    | 62 | 		"\xEF\xAC\x81", // german fi-ligatur
 | 
  
    | 63 | 		"fi",           // german fi-ligatur
 | 
  
    | 64 | 		"\xEF\xAC\x82", // german fl-ligatur
 | 
  
    | 65 | 		"fl",           // german fl-ligatur
 | 
  
    | 66 | 		"\xEF\xAC\x85", // german st-Ligatur (long s)
 | 
  
    | 67 | 		"st",           // german st-Ligatur
 | 
  
    | 68 | 		"\xEF\xAC\x86"  // german st-ligatur (round-s)
 | 
  
    | 69 | 	);
 | 
  
    | 70 | 	$string_ul_regex_add = array(
 | 
  
    | 71 | 		"(\xc3\x9f|ss)", // german SZ.Ligatur
 | 
  
    | 72 | 		"(\xc3\xa4|ae)", // german ae
 | 
  
    | 73 | 		"(\xc3\xb6|oe)", // german oe
 | 
  
    | 74 | 		"(\xc3\xbc|ue)", // german ue
 | 
  
    | 75 | 		"(\xc3\x84|Ae)", // german Ae
 | 
  
    | 76 | 		"(\xc3\x96|Oe)", // german Oe
 | 
  
    | 77 | 		"(\xc3\x9c|Ue)", // german Ue
 | 
  
    | 78 | 		// these are not that usual
 | 
  
    | 79 | 		"(\xEF\xAC\x84|ffl)", // german ffl-ligatur
 | 
  
    | 80 | 		"(\xEF\xAC\x84|ffl)", // german ffl-ligatur
 | 
  
    | 81 | 		"(\xEF\xAC\x83|ffi)", // german ffi-ligatur
 | 
  
    | 82 | 		"(\xEF\xAC\x83|ffi)", // german ffi-ligatur
 | 
  
    | 83 | 		"(\xEF\xAC\x80|ff)",  // german ff-Ligatur
 | 
  
    | 84 | 		"(\xEF\xAC\x80|ff)",  // german ff-Ligatur
 | 
  
    | 85 | 		"(\xEF\xAC\x81|fi)",  // german fi-Ligatur
 | 
  
    | 86 | 		"(\xEF\xAC\x81|fi)",  // german fi-Ligatur
 | 
  
    | 87 | 		"(\xEF\xAC\x82|fl)",  // german fl-ligatur
 | 
  
    | 88 | 		"(\xEF\xAC\x82|fl)",  // german fl-ligatur
 | 
  
    | 89 | 		"(\xEF\xAC\x85|st)",  // german st-Ligatur (long s)
 | 
  
    | 90 | 		"(\xEF\xAC\x85|st|\xEF\xAC\x86)",  // german st-Ligaturs
 | 
  
    | 91 | 		"(\xEF\xAC\x86|st)"  // german st-ligatur (round-s)
 | 
  
    | 92 | 	);
 | 
  
    | 93 | 	$string_ul_umlaut = array_merge($string_ul_umlaut_add, $string_ul_umlaut);
 | 
  
    | 94 | 	$string_ul_regex = array_merge($string_ul_regex_add, $string_ul_regex);
 | 
  
    | 95 | }
 | 
  
    | 96 | 
 | 
  
    | 97 | 
 | 
  
    | 98 | ?>
 |