* @package search
* @version $Id$
* @copyright (c) 2005 phpBB Group
* @license http://opensource.org/licenses/gpl-license.php GNU Public License

* @ignore
if (!defined('IN_PHPBB'))

* @ignore
include_once($phpbb_root_path . 'includes/search/search.' . $phpEx);

* fulltext_native
* phpBB's own db driven fulltext search, version 2
* @package search
class fulltext_native extends search_backend
	// NOTE(review): $stats is not referenced anywhere in the visible part of this class.
	var $stats = array();
	// 'min' / 'max' word length, filled by the constructor from $config.
	var $word_length = array();
	// Cleaned search query; written by split_keywords() and checked by keyword_search().
	var $search_query;
	// Words that split_keywords() found flagged as common in the wordlist or outside the length limits.
	var $common_words = array();

	// Word id lists built by split_keywords() and read by keyword_search().
	var $must_contain_ids = array();
	var $must_not_contain_ids = array();
	var $must_exclude_one_ids = array();

	* Initialises the fulltext_native search backend with min/max word length and makes sure the UTF-8 normalizer is loaded.
	* @param	boolean|string	&$error	is passed by reference and should either be set to false on success or an error message on failure.
	* @access	public
	// Constructor: stores the configured min/max word length and loads the
	// utf_normalizer class if it is not defined yet. $error is set to false.
	function fulltext_native(&$error)
		global $phpbb_root_path, $phpEx, $config;

		// limits come straight from the board configuration
		$this->word_length = array('min' => $config['fulltext_native_min_chars'], 'max' => $config['fulltext_native_max_chars']);

		* Load the UTF tools
		if (!class_exists('utf_normalizer'))
			include($phpbb_root_path . 'includes/utf/utf_normalizer.' . $phpEx);

		// nothing in this constructor reports a failure
		$error = false;

	* This function fills $this->search_query with the cleaned user search query.
	* If $terms is 'any' then the words will be extracted from the search query
	* and combined with | inside brackets. They will afterwards be treated like
	* a standard search query.
	* Then it analyses the query and fills the internal arrays $must_not_contain_ids,
	* $must_contain_ids and $must_exclude_one_ids which are later used by keyword_search().
	* @param	string	$keywords	contains the search query string as entered by the user
	* @param	string	$terms		is either 'all' (use search query as entered, default words to 'must be contained in post')
	* 	or 'any' (find all posts containing at least one of the given words)
	* @return	boolean				false if no valid keywords were found and otherwise true
	* @access	public
	// Cleans the search query, stores it in $this->search_query, looks the words up in the
	// wordlist and sorts the resulting ids into $this->must_contain_ids,
	// $this->must_not_contain_ids and $this->must_exclude_one_ids.
	//
	// $keywords is the query as entered; $terms is compared against the string any below.
	// Returns false when no must_contain entry was collected or the query is empty,
	// true otherwise. Nonexistent required words end in trigger_error().
	//
	// NOTE(review): this extract has no braces and several else / break / continue lines
	// appear to be missing; the nesting described below is read from the indentation only.
	function split_keywords($keywords, $terms)
		global $db, $user, $config;

		// characters that act as operators inside a query
		$tokens = '+-|()*';

		$keywords = trim($this->cleanup($keywords, $tokens));

		// allow word|word|word without brackets
		if ((strpos($keywords, ' ') === false) && (strpos($keywords, '|') !== false) && (strpos($keywords, '(') === false))
			$keywords = '(' . $keywords . ')';

		// Walk the query one byte at a time. $open_bracket holds the offset of the currently
		// open bracket (false when none is open), $space remembers a pending + or - prefix.
		$open_bracket = $space = false;
		for ($i = 0, $n = strlen($keywords); $i < $n; $i++)
			// inside a bracket group: separators and nested brackets are turned into |
			if ($open_bracket !== false)
				switch ($keywords[$i])
					case ')':
						// an empty group "()" is blanked out with | characters
						if ($open_bracket + 1 == $i)
							$keywords[$i - 1] = '|';
							$keywords[$i] = '|';
						$open_bracket = false;
					case '(':
						$keywords[$i] = '|';
					case '+':
					case '-':
					case ' ':
						$keywords[$i] = '|';
					case '*':
						// a * that has no word character on either side is dropped
						if ($i === 0 || ($keywords[$i - 1] !== '*' && strcspn($keywords[$i - 1], $tokens) === 0))
							if ($i === $n - 1 || ($keywords[$i + 1] !== '*' && strcspn($keywords[$i + 1], $tokens) === 0))
								$keywords = substr($keywords, 0, $i) . substr($keywords, $i + 1);
				// NOTE(review): presumably the else branch (no bracket open); the else line is not in this extract
				switch ($keywords[$i])
					case ')':
						$keywords[$i] = ' ';
					case '(':
						$open_bracket = $i;
						$space = false;
					case '|':
						$keywords[$i] = ' ';
					case '-':
					case '+':
						$space = $keywords[$i];
					case ' ':
						if ($space !== false)
							$keywords[$i] = $space;
						$space = false;

		// Close a group that was left open. The comparison has to be strict: the bracket
		// may sit at offset 0, which a plain truth test would treat as "no bracket open".
		if ($open_bracket !== false)
			$keywords .= ')';

		// collapse runs of spaces into one
		$match = array(
			'#  +#',
		$replace = array(
			' ',

		$keywords = preg_replace($match, $replace, $keywords);
		$num_keywords = sizeof(explode(' ', $keywords));

		// We limit the number of allowed keywords to minimize load on the database
		if ($config['max_num_search_keywords'] && $num_keywords > $config['max_num_search_keywords'])
			trigger_error($user->lang('MAX_NUM_SEARCH_KEYWORDS_REFINE', $config['max_num_search_keywords'], $num_keywords));

		// $keywords input format: each word separated by a space, words in a bracket are not separated

		// the user wants to search for any word, convert the search query
		if ($terms == 'any')
			$words = array();

			preg_match_all('#([^\\s+\\-|()]+)(?:$|[\\s+\\-|()])#u', $keywords, $words);
			if (sizeof($words[1]))
				$keywords = '(' . implode('|', $words[1]) . ')';

		// set the search_query which is shown to the user
		$this->search_query = $keywords;

		// words without wildcard; only these can be looked up by exact text
		$exact_words = array();
		preg_match_all('#([^\\s+\\-|*()]+)(?:$|[\\s+\\-|()])#u', $keywords, $exact_words);
		$exact_words = $exact_words[1];

		$common_ids = $words = array();

		if (sizeof($exact_words))
			$sql = 'SELECT word_id, word_text, word_common
				WHERE ' . $db->sql_in_set('word_text', $exact_words) . '
				ORDER BY word_count ASC';
			$result = $db->sql_query($sql);

			// store an array of words and ids, remove common words
			while ($row = $db->sql_fetchrow($result))
				if ($row['word_common'])
					$this->common_words[] = $row['word_text'];
					$common_ids[$row['word_text']] = (int) $row['word_id'];

				$words[$row['word_text']] = (int) $row['word_id'];

		// now analyse the search query, first split it using the spaces
		$query = explode(' ', $keywords);

		$this->must_contain_ids = array();
		$this->must_not_contain_ids = array();
		$this->must_exclude_one_ids = array();

		$mode = '';
		$ignore_no_id = true;

		foreach ($query as $word)
			if (empty($word))

			// words which should not be included
			if ($word[0] == '-')
				$word = substr($word, 1);

				// a group of which at least one may not be in the resulting posts
				if ($word[0] == '(')
					$word = array_unique(explode('|', substr($word, 1, -1)));
					$mode = 'must_exclude_one';
				// one word which should not be in the resulting posts
					$mode = 'must_not_contain';
				$ignore_no_id = true;
			// words which have to be included
				// no prefix is the same as a +prefix
				if ($word[0] == '+')
					$word = substr($word, 1);

				// a group of words of which at least one word should be in every resulting post
				if ($word[0] == '(')
					$word = array_unique(explode('|', substr($word, 1, -1)));
				$ignore_no_id = false;
				$mode = 'must_contain';

			if (empty($word))

			// if this is an array of words then retrieve an id for each
			if (is_array($word))
				$non_common_words = array();
				$id_words = array();
				foreach ($word as $i => $word_part)
					// wildcard parts are stored as a quoted, escaped LIKE pattern string
					if (strpos($word_part, '*') !== false)
						$id_words[] = '\'' . $db->sql_escape(str_replace('*', '%', $word_part)) . '\'';
						$non_common_words[] = $word_part;
					else if (isset($words[$word_part]))
						$id_words[] = $words[$word_part];
						$non_common_words[] = $word_part;
						$len = utf8_strlen($word_part);
						if ($len < $this->word_length['min'] || $len > $this->word_length['max'])
							$this->common_words[] = $word_part;
				if (sizeof($id_words))
					if (sizeof($id_words) > 1)
						$this->{$mode . '_ids'}[] = $id_words;
						$mode = ($mode == 'must_exclude_one') ? 'must_not_contain' : $mode;
						$this->{$mode . '_ids'}[] = $id_words[0];
				// throw an error if we shall not ignore nonexistent words
				else if (!$ignore_no_id && sizeof($non_common_words))
					trigger_error(sprintf($user->lang['WORDS_IN_NO_POST'], implode(', ', $non_common_words)));
			// else we only need one id
			else if (($wildcard = strpos($word, '*') !== false) || isset($words[$word]))
				if ($wildcard)
					$len = utf8_strlen(str_replace('*', '', $word));
					if ($len >= $this->word_length['min'] && $len <= $this->word_length['max'])
						$this->{$mode . '_ids'}[] = '\'' . $db->sql_escape(str_replace('*', '%', $word)) . '\'';
						$this->common_words[] = $word;
					$this->{$mode . '_ids'}[] = $words[$word];
			// throw an error if we shall not ignore nonexistent words
			else if (!$ignore_no_id)
				if (!isset($common_ids[$word]))
					$len = utf8_strlen($word);
					if ($len >= $this->word_length['min'] && $len <= $this->word_length['max'])
						trigger_error(sprintf($user->lang['WORD_IN_NO_POST'], $word));
						$this->common_words[] = $word;
				$len = utf8_strlen($word);
				if ($len < $this->word_length['min'] || $len > $this->word_length['max'])
					$this->common_words[] = $word;

		// we can't search for negatives only
		if (!sizeof($this->must_contain_ids))
			return false;

		if (!empty($this->search_query))
			return true;
		return false;

	* Performs a search on keywords depending on display specific params. You have to run split_keywords() first.
	* @param	string		$type				contains either posts or topics depending on what should be searched for
	* @param	string		$fields				contains either titleonly (topic titles should be searched), msgonly (only message bodies should be searched), firstpost (only subject and body of the first post should be searched) or all (all post bodies and subjects should be searched)
	* @param	string		$terms				is either 'all' (use query as entered, words without prefix should default to "have to be in field") or 'any' (ignore search query parts and just return all posts that contain any of the specified words)
	* @param	array		$sort_by_sql		contains SQL code for the ORDER BY part of a query
	* @param	string		$sort_key			is the key of $sort_by_sql for the selected sorting
	* @param	string		$sort_dir			is either a or d representing ASC and DESC
	* @param	string		$sort_days			specifies the maximum amount of days a post may be old
	* @param	array		$ex_fid_ary			specifies an array of forum ids which should not be searched
	* @param	array		$m_approve_fid_ary	specifies an array of forum ids in which the searcher is allowed to view unapproved posts
	* @param	int			$topic_id			is set to 0 or a topic id, if it is not 0 then only posts in this topic should be searched
	* @param	array		$author_ary			an array of author ids; if the author should be ignored during the search, the array is empty
	* @param	string		$author_name		specifies the author match, when ANONYMOUS is also a search-match
	* @param	array		&$id_ary			passed by reference, to be filled with ids for the page specified by $start and $per_page, should be ordered
	* @param	int			$start				indicates the first index of the page
	* @param	int			$per_page			number of ids each page is supposed to contain
	* @return	boolean|int						total number of results
	* @access	public
	// Runs the keyword search prepared by split_keywords() and fills $id_ary with the post
	// or topic ids of the requested page.
	//
	// The result is first looked up through obtain_ids(); on a miss the word id lists are
	// turned into one query over the wordmatch table (aliases m0, m1, ...) joined with the
	// posts table, one block of ids is fetched and handed to save_ids().
	//
	// Returns the total number of results, or false when the query is empty or nothing
	// was found.
	//
	// NOTE(review): this extract has no braces and several else / break / default lines and
	// counter increments appear to be missing; the comments describe only what is visible.
	function keyword_search($type, $fields, $terms, $sort_by_sql, $sort_key, $sort_dir, $sort_days, $ex_fid_ary, $m_approve_fid_ary, $topic_id, $author_ary, $author_name, &$id_ary, $start, $per_page)
		global $config, $db;

		// No keywords? No posts.
		if (empty($this->search_query))
			return false;

		$must_contain_ids = $this->must_contain_ids;
		$must_not_contain_ids = $this->must_not_contain_ids;
		$must_exclude_one_ids = $this->must_exclude_one_ids;


		// generate a search_key from all the options to identify the results
		$search_key = md5(implode('#', array(
			implode(',', $ex_fid_ary),
			implode(',', $m_approve_fid_ary),
			implode(',', $author_ary),

		// try reading the results from cache
		$total_results = 0;
		if ($this->obtain_ids($search_key, $total_results, $id_ary, $start, $per_page, $sort_dir) == SEARCH_RESULT_IN_CACHE)
			return $total_results;

		$id_ary = array();

		$sql_where = array();
		$group_by = false;
		// running numbers used for the m<N> (wordmatch) and w<N> (wordlist) table aliases
		$m_num = 0;
		$w_num = 0;

		$sql_array = array(
			'SELECT'	=> ($type == 'posts') ? 'p.post_id' : 'p.topic_id',
			'FROM'		=> array(
			'LEFT_JOIN' => array(array(
				'FROM'	=> array(POSTS_TABLE => 'p'),
				'ON'	=> 'm0.post_id = p.post_id',

		$title_match = '';
		$left_join_topics = false;
		$group_by = true;
		// Build some display specific sql strings
		switch ($fields)
			case 'titleonly':
				$title_match = 'title_match = 1';
				$group_by = false;
			// no break
			case 'firstpost':
				$left_join_topics = true;
				$sql_where[] = 'p.post_id = t.topic_first_post_id';

			case 'msgonly':
				$title_match = 'title_match = 0';
				$group_by = false;

		if ($type == 'topics')
			$left_join_topics = true;
			$group_by = true;

		* @todo Add a query optimizer (handle stuff like "+(4|3) +4")

		// Required words: an array entry is a group of alternatives, a string entry is a
		// quoted LIKE pattern (wildcard word), anything else is a plain word id.
		foreach ($this->must_contain_ids as $subquery)
			if (is_array($subquery))
				$group_by = true;

				$word_id_sql = array();
				$word_ids = array();
				foreach ($subquery as $id)
					if (is_string($id))
						$sql_array['LEFT_JOIN'][] = array(
							'FROM'	=> array(SEARCH_WORDLIST_TABLE => 'w' . $w_num),
							'ON'	=> "w$w_num.word_text LIKE $id"
						$word_ids[] = "w$w_num.word_id";

						$word_ids[] = $id;

				$sql_where[] = $db->sql_in_set("m$m_num.word_id", $word_ids);

			else if (is_string($subquery))
				$sql_array['FROM'][SEARCH_WORDLIST_TABLE][] = 'w' . $w_num;

				$sql_where[] = "w$w_num.word_text LIKE $subquery";
				$sql_where[] = "m$m_num.word_id = w$w_num.word_id";

				$group_by = true;
				$sql_where[] = "m$m_num.word_id = $subquery";

			$sql_array['FROM'][SEARCH_WORDMATCH_TABLE][] = 'm' . $m_num;

			if ($title_match)
				$sql_where[] = "m$m_num.$title_match";

			// every further wordmatch alias has to refer to the same post as m0
			if ($m_num != 0)
				$sql_where[] = "m$m_num.post_id = m0.post_id";

		// Excluded words: wildcard patterns are replaced by the word_id column of a joined
		// wordlist alias so that the whole list can be used in one IN (...) below.
		foreach ($this->must_not_contain_ids as $key => $subquery)
			if (is_string($subquery))
				$sql_array['LEFT_JOIN'][] = array(
					'FROM'	=> array(SEARCH_WORDLIST_TABLE => 'w' . $w_num),
					'ON'	=> "w$w_num.word_text LIKE $subquery"

				$this->must_not_contain_ids[$key] = "w$w_num.word_id";

				$group_by = true;

		// a post qualifies only if the left join on the excluded words finds no row
		if (sizeof($this->must_not_contain_ids))
			$sql_array['LEFT_JOIN'][] = array(
				'FROM'	=> array(SEARCH_WORDMATCH_TABLE => 'm' . $m_num),
				'ON'	=> $db->sql_in_set("m$m_num.word_id", $this->must_not_contain_ids) . (($title_match) ? " AND m$m_num.$title_match" : '') . " AND m$m_num.post_id = m0.post_id"

			$sql_where[] = "m$m_num.word_id IS NULL";

		// groups of which at least one word has to be absent: one left join per word,
		// combined with OR over the IS NULL checks
		foreach ($this->must_exclude_one_ids as $ids)
			$is_null_joins = array();
			foreach ($ids as $id)
				if (is_string($id))
					$sql_array['LEFT_JOIN'][] = array(
						'FROM'	=> array(SEARCH_WORDLIST_TABLE => 'w' . $w_num),
						'ON'	=> "w$w_num.word_text LIKE $id"
					$id = "w$w_num.word_id";

					$group_by = true;

				$sql_array['LEFT_JOIN'][] = array(
					'FROM'	=> array(SEARCH_WORDMATCH_TABLE => 'm' . $m_num),
					'ON'	=> "m$m_num.word_id = $id AND m$m_num.post_id = m0.post_id" . (($title_match) ? " AND m$m_num.$title_match" : '')
				$is_null_joins[] = "m$m_num.word_id IS NULL";

			$sql_where[] = '(' . implode(' OR ', $is_null_joins) . ')';

		if (!sizeof($m_approve_fid_ary))
			$sql_where[] = 'p.post_approved = 1';
		else if ($m_approve_fid_ary !== array(-1))
			$sql_where[] = '(p.post_approved = 1 OR ' . $db->sql_in_set('p.forum_id', $m_approve_fid_ary, true) . ')';

		// cast before concatenating into SQL, as author_search() does for the same parameter
		if ($topic_id)
			$sql_where[] = 'p.topic_id = ' . (int) $topic_id;

		if (sizeof($author_ary))
			if ($author_name)
				// first one matches post of registered users, second one guests and deleted users
				$sql_author = '(' . $db->sql_in_set('p.poster_id', array_diff($author_ary, array(ANONYMOUS)), false, true) . ' OR p.post_username ' . $author_name . ')';
				$sql_author = $db->sql_in_set('p.poster_id', $author_ary);
			$sql_where[] = $sql_author;

		if (sizeof($ex_fid_ary))
			$sql_where[] = $db->sql_in_set('p.forum_id', $ex_fid_ary, true);

		// $sort_days is a number of days, post_time is compared in seconds
		if ($sort_days)
			$sql_where[] = 'p.post_time >= ' . (time() - ($sort_days * 86400));

		$sql_array['WHERE'] = implode(' AND ', $sql_where);

		$is_mysql = false;
		// if the total result count is not cached yet, retrieve it from the db
		if (!$total_results)
			$sql = '';
			$sql_array_count = $sql_array;

			if ($left_join_topics)
				$sql_array_count['LEFT_JOIN'][] = array(
					'FROM'	=> array(TOPICS_TABLE => 't'),
					'ON'	=> 'p.topic_id = t.topic_id'

			switch ($db->sql_layer)
				case 'mysql4':
				case 'mysqli':

					// 3.x does not support SQL_CALC_FOUND_ROWS
					// $sql_array['SELECT'] = 'SQL_CALC_FOUND_ROWS ' . $sql_array['SELECT'];
					$is_mysql = true;


				case 'sqlite':
					$sql_array_count['SELECT'] = ($type == 'posts') ? 'DISTINCT p.post_id' : 'DISTINCT p.topic_id';
					$sql = 'SELECT COUNT(' . (($type == 'posts') ? 'post_id' : 'topic_id') . ') as total_results
							FROM (' . $db->sql_build_query('SELECT', $sql_array_count) . ')';

				// no break

					$sql_array_count['SELECT'] = ($type == 'posts') ? 'COUNT(DISTINCT p.post_id) AS total_results' : 'COUNT(DISTINCT p.topic_id) AS total_results';
					$sql = (!$sql) ? $db->sql_build_query('SELECT', $sql_array_count) : $sql;

					$result = $db->sql_query($sql);
					$total_results = (int) $db->sql_fetchfield('total_results');

					if (!$total_results)
						return false;

			unset($sql_array_count, $sql);

		// Build sql strings for sorting
		$sql_sort = $sort_by_sql[$sort_key] . (($sort_dir == 'a') ? ' ASC' : ' DESC');

		// the first character of the sort expression is the alias of the table it needs
		switch ($sql_sort[0])
			case 'u':
				$sql_array['FROM'][USERS_TABLE] = 'u';
				$sql_where[] = 'u.user_id = p.poster_id ';

			case 't':
				$left_join_topics = true;

			case 'f':
				$sql_array['FROM'][FORUMS_TABLE] = 'f';
				$sql_where[] = 'f.forum_id = p.forum_id';

		if ($left_join_topics)
			$sql_array['LEFT_JOIN'][] = array(
				'FROM'	=> array(TOPICS_TABLE => 't'),
				'ON'	=> 'p.topic_id = t.topic_id'

		$sql_array['WHERE'] = implode(' AND ', $sql_where);
		$sql_array['GROUP_BY'] = ($group_by) ? (($type == 'posts') ? 'p.post_id' : 'p.topic_id') . ', ' . $sort_by_sql[$sort_key] : '';
		$sql_array['ORDER_BY'] = $sql_sort;

		unset($sql_where, $sql_sort, $group_by);

		// fetch one block of ids beginning at $start
		$sql = $db->sql_build_query('SELECT', $sql_array);
		$result = $db->sql_query_limit($sql, $config['search_block_size'], $start);

		while ($row = $db->sql_fetchrow($result))
			$id_ary[] = (int) $row[(($type == 'posts') ? 'post_id' : 'topic_id')];

		if (!sizeof($id_ary))
			return false;

		// if we use mysql and the total result count is not cached yet, retrieve it from the db
		if (!$total_results && $is_mysql)
			// Count rows for the executed queries. Replace $select within $sql with SQL_CALC_FOUND_ROWS, and run it.
			$sql_array_copy = $sql_array;
			$sql_array_copy['SELECT'] = 'SQL_CALC_FOUND_ROWS p.post_id ';

			$sql = $db->sql_build_query('SELECT', $sql_array_copy);


			$sql = 'SELECT FOUND_ROWS() as total_results';
			$result = $db->sql_query($sql);
			$total_results = (int) $db->sql_fetchfield('total_results');

			if (!$total_results)
				return false;

		// store the ids, from start on then delete anything that isn't on the current page because we only need ids for one page
		$this->save_ids($search_key, $this->search_query, $author_ary, $total_results, $id_ary, $start, $sort_dir);
		$id_ary = array_slice($id_ary, 0, (int) $per_page);

		return $total_results;

	* Performs a search on an author's posts without caring about message contents. Depends on display specific params
	* @param	string		$type				contains either posts or topics depending on what should be searched for
	* @param	boolean		$firstpost_only		if true, only topic starting posts will be considered
	* @param	array		$sort_by_sql		contains SQL code for the ORDER BY part of a query
	* @param	string		$sort_key			is the key of $sort_by_sql for the selected sorting
	* @param	string		$sort_dir			is either a or d representing ASC and DESC
	* @param	string		$sort_days			specifies the maximum amount of days a post may be old
	* @param	array		$ex_fid_ary			specifies an array of forum ids which should not be searched
	* @param	array		$m_approve_fid_ary	specifies an array of forum ids in which the searcher is allowed to view unapproved posts
	* @param	int			$topic_id			is set to 0 or a topic id, if it is not 0 then only posts in this topic should be searched
	* @param	array		$author_ary			an array of author ids
	* @param	string		$author_name		specifies the author match, when ANONYMOUS is also a search-match
	* @param	array		&$id_ary			passed by reference, to be filled with ids for the page specified by $start and $per_page, should be ordered
	* @param	int			$start				indicates the first index of the page
	* @param	int			$per_page			number of ids each page is supposed to contain
	* @return	boolean|int						total number of results
	* @access	public
	// Collects the ids of posts (or topics) written by the given authors, without looking
	// at any keywords, and fills $id_ary with the ids of the requested page.
	// Returns 0 when $author_ary is empty, false when nothing was found and the total
	// number of results otherwise. Results go through obtain_ids() / save_ids().
	// NOTE(review): this extract has no braces and several else / break lines and parts of
	// the SQL strings appear to be missing; comments describe only what is visible.
	function author_search($type, $firstpost_only, $sort_by_sql, $sort_key, $sort_dir, $sort_days, $ex_fid_ary, $m_approve_fid_ary, $topic_id, $author_ary, $author_name, &$id_ary, $start, $per_page)
		global $config, $db;

		// No author? No posts.
		if (!sizeof($author_ary))
			return 0;

		// generate a search_key from all the options to identify the results
		$search_key = md5(implode('#', array(
			($firstpost_only) ? 'firstpost' : '',
			implode(',', $ex_fid_ary),
			implode(',', $m_approve_fid_ary),
			implode(',', $author_ary),

		// try reading the results from cache
		$total_results = 0;
		if ($this->obtain_ids($search_key, $total_results, $id_ary, $start, $per_page, $sort_dir) == SEARCH_RESULT_IN_CACHE)
			return $total_results;

		$id_ary = array();

		// Create some display specific sql strings
		if ($author_name)
			// first one matches post of registered users, second one guests and deleted users
			$sql_author = '(' . $db->sql_in_set('p.poster_id', array_diff($author_ary, array(ANONYMOUS)), false, true) . ' OR p.post_username ' . $author_name . ')';
			$sql_author = $db->sql_in_set('p.poster_id', $author_ary);
		// optional WHERE fragments; each one is empty when its filter is not requested
		$sql_fora		= (sizeof($ex_fid_ary)) ? ' AND ' . $db->sql_in_set('p.forum_id', $ex_fid_ary, true) : '';
		$sql_time		= ($sort_days) ? ' AND p.post_time >= ' . (time() - ($sort_days * 86400)) : '';
		$sql_topic_id	= ($topic_id) ? ' AND p.topic_id = ' . (int) $topic_id : '';
		$sql_firstpost = ($firstpost_only) ? ' AND p.post_id = t.topic_first_post_id' : '';

		// Build sql strings for sorting
		$sql_sort = $sort_by_sql[$sort_key] . (($sort_dir == 'a') ? ' ASC' : ' DESC');
		$sql_sort_table = $sql_sort_join = '';
		// the first character of the sort expression is the alias of the table it needs
		switch ($sql_sort[0])
			case 'u':
				$sql_sort_table	= USERS_TABLE . ' u, ';
				$sql_sort_join	= ' AND u.user_id = p.poster_id ';

			case 't':
				$sql_sort_table	= ($type == 'posts' && !$firstpost_only) ? TOPICS_TABLE . ' t, ' : '';
				$sql_sort_join	= ($type == 'posts' && !$firstpost_only) ? ' AND t.topic_id = p.topic_id ' : '';

			case 'f':
				$sql_sort_table	= FORUMS_TABLE . ' f, ';
				$sql_sort_join	= ' AND f.forum_id = p.forum_id ';

		// restrict to approved posts unless the forum id list says otherwise
		if (!sizeof($m_approve_fid_ary))
			$m_approve_fid_sql = ' AND p.post_approved = 1';
		else if ($m_approve_fid_ary == array(-1))
			$m_approve_fid_sql = '';
			$m_approve_fid_sql = ' AND (p.post_approved = 1 OR ' . $db->sql_in_set('p.forum_id', $m_approve_fid_ary, true) . ')';

		$select = ($type == 'posts') ? 'p.post_id' : 't.topic_id';
		$is_mysql = false;

		// If the cache was completely empty count the results
		if (!$total_results)
			switch ($db->sql_layer)
				case 'mysql4':
				case 'mysqli':
//					$select = 'SQL_CALC_FOUND_ROWS ' . $select;
					$is_mysql = true;

					if ($type == 'posts')
						$sql = 'SELECT COUNT(p.post_id) as total_results
							FROM ' . POSTS_TABLE . ' p' . (($firstpost_only) ? ', ' . TOPICS_TABLE . ' t ' : ' ') . "
							WHERE $sql_author
						if ($db->sql_layer == 'sqlite')
							$sql = 'SELECT COUNT(topic_id) as total_results
								FROM (SELECT DISTINCT t.topic_id';
							$sql = 'SELECT COUNT(DISTINCT t.topic_id) as total_results';

						$sql .= ' FROM ' . TOPICS_TABLE . ' t, ' . POSTS_TABLE . " p
							WHERE $sql_author
								AND t.topic_id = p.topic_id
								$sql_time" . (($db->sql_layer == 'sqlite') ? ')' : '');
					$result = $db->sql_query($sql);

					$total_results = (int) $db->sql_fetchfield('total_results');

					if (!$total_results)
						return false;

		// Build the query for really selecting the post_ids
		if ($type == 'posts')
			$sql = "SELECT $select
				FROM " . $sql_sort_table . POSTS_TABLE . ' p' . (($firstpost_only) ? ', ' . TOPICS_TABLE . ' t' : '') . "
				WHERE $sql_author
				ORDER BY $sql_sort";
			$field = 'post_id';
			$sql = "SELECT $select
				FROM " . $sql_sort_table . TOPICS_TABLE . ' t, ' . POSTS_TABLE . " p
				WHERE $sql_author
					AND t.topic_id = p.topic_id
				GROUP BY t.topic_id, " . $sort_by_sql[$sort_key] . '
				ORDER BY ' . $sql_sort;
			$field = 'topic_id';

		// Only read one block of posts from the db and then cache it
		$result = $db->sql_query_limit($sql, $config['search_block_size'], $start);

		while ($row = $db->sql_fetchrow($result))
			$id_ary[] = (int) $row[$field];

		if (!$total_results && $is_mysql)
			// Count rows for the executed queries. Replace $select within $sql with SQL_CALC_FOUND_ROWS, and run it.
			$sql = str_replace('SELECT ' . $select, 'SELECT DISTINCT SQL_CALC_FOUND_ROWS p.post_id', $sql);


			$sql = 'SELECT FOUND_ROWS() as total_results';
			$result = $db->sql_query($sql);
			$total_results = (int) $db->sql_fetchfield('total_results');

			if (!$total_results)
				return false;

		if (sizeof($id_ary))
			$this->save_ids($search_key, '', $author_ary, $total_results, $id_ary, $start, $sort_dir);
			$id_ary = array_slice($id_ary, 0, $per_page);

			return $total_results;
		return false;

	* Split a text into words of a given length
	* The text is converted to UTF-8, cleaned up, and split. Then, words that
	* conform to the defined length range are returned in an array.
	* NOTE: duplicates are NOT removed from the return array
	* @param	string	$text	Text to split, encoded in UTF-8
	* @return	array			Array of UTF-8 words
	* @access	private
	// Splits $text into an array of words for the indexer. Tags, [code] blocks and bbcode
	// markers are stripped first, the rest goes through cleanup() and is tokenised on
	// spaces with strtok(). Duplicates stay in the returned array.
	// NOTE(review): this extract has no braces and the continue statements after the
	// skip conditions appear to be missing.
	function split_message($text)
		global $phpbb_root_path, $phpEx, $user;

		$match = $words = array();

		* Taken from the original code
		// Do not index code
		$match[] = '#\[code(?:=.*?)?(\:?[0-9a-z]{5,})\].*?\[\/code(\:?[0-9a-z]{5,})\]#is';
		// BBcode
		$match[] = '#\[\/?[a-z0-9\*\+\-]+(?:=.*?)?(?::[a-z])?(\:?[0-9a-z]{5,})\]#';

		$min = $this->word_length['min'];
		$max = $this->word_length['max'];

		// byte-length lower bound used for the cheap strlen() pre-check below
		$isset_min = $min - 1;

		* Clean up the string, remove HTML tags, remove BBCodes
		$word = strtok($this->cleanup(preg_replace($match, ' ', strip_tags($text)), -1), ' ');

		// strtok() returns false at the end of the input, which ends the loop
		while (strlen($word))
			if (strlen($word) > 255 || strlen($word) <= $isset_min)
				* Words longer than 255 bytes are ignored. This will have to be
				* changed whenever we change the length of search_wordlist.word_text
				* Words shorter than $isset_min bytes are ignored, too
				$word = strtok(' ');

			// length in characters, as opposed to the byte lengths checked above
			$len = utf8_strlen($word);

			* Test whether the word is too short to be indexed.
			* Note that this limit does NOT apply to CJK and Hangul
			if ($len < $min)
				* Note: this could be optimized. If the codepoint is lower than Hangul's range
				* we know that it will also be lower than CJK ranges
				if ((strncmp($word, UTF8_HANGUL_FIRST, 3) < 0 || strncmp($word, UTF8_HANGUL_LAST, 3) > 0)
				 && (strncmp($word, UTF8_CJK_FIRST, 3) < 0 || strncmp($word, UTF8_CJK_LAST, 3) > 0)
				 && (strncmp($word, UTF8_CJK_B_FIRST, 4) < 0 || strncmp($word, UTF8_CJK_B_LAST, 4) > 0))
					$word = strtok(' ');

			$words[] = $word;
			$word = strtok(' ');

		return $words;

	* Updates wordlist and wordmatch tables when a message is posted or changed
	* @param	string	$mode		Contains the post mode: edit, post, reply, quote
	* @param	int		$post_id	The id of the post which is modified/created
	* @param	string	&$message	New or updated post content
	* @param	string	&$subject	New or updated post subject
	* @param	int		$poster_id	Post author's user id
	* @param	int		$forum_id	The id of the forum in which the post is located
	* @access	public
	// Updates the word index for one post: splits message and subject into words, works
	// out which words were added or removed (for edits, relative to the words currently
	// linked to the post), inserts unknown words into the wordlist, adjusts the wordmatch
	// links and word counts, and finally calls destroy_cache() for the affected words and
	// the poster.
	// NOTE(review): this extract has no braces and several else lines, the early return
	// and the heads of most SQL statements appear to be missing; $forum_id is not used in
	// the visible code.
	function index($mode, $post_id, &$message, &$subject, $poster_id, $forum_id)
		global $config, $db, $user;

		if (!$config['fulltext_native_load_upd'])
			* The search indexer is disabled, return

		// Split old and new post/subject to obtain array of 'words'
		$split_text = $this->split_message($message);
		$split_title = $this->split_message($subject);

		// word_text => word_id of the words currently linked to the post, per location
		$cur_words = array('post' => array(), 'title' => array());

		$words = array();
		if ($mode == 'edit')
			$words['add']['post'] = array();
			$words['add']['title'] = array();
			$words['del']['post'] = array();
			$words['del']['title'] = array();

			$sql = 'SELECT w.word_id, w.word_text, m.title_match
				WHERE m.post_id = $post_id
					AND w.word_id = m.word_id";
			$result = $db->sql_query($sql);

			while ($row = $db->sql_fetchrow($result))
				$which = ($row['title_match']) ? 'title' : 'post';
				$cur_words[$which][$row['word_text']] = $row['word_id'];

			$words['add']['post'] = array_diff($split_text, array_keys($cur_words['post']));
			$words['add']['title'] = array_diff($split_title, array_keys($cur_words['title']));
			$words['del']['post'] = array_diff(array_keys($cur_words['post']), $split_text);
			$words['del']['title'] = array_diff(array_keys($cur_words['title']), $split_title);
			$words['add']['post'] = $split_text;
			$words['add']['title'] = $split_title;
			$words['del']['post'] = array();
			$words['del']['title'] = array();

		// Get unique words from the above arrays
		$unique_add_words = array_unique(array_merge($words['add']['post'], $words['add']['title']));

		// We now have unique arrays of all words to be added and removed and
		// individual arrays of added and removed words for text and title. What
		// we need to do now is add the new words (if they don't already exist)
		// and then add (or remove) matches between the words and this post
		if (sizeof($unique_add_words))
			$sql = 'SELECT word_id, word_text
				WHERE ' . $db->sql_in_set('word_text', $unique_add_words);
			$result = $db->sql_query($sql);

			$word_ids = array();
			while ($row = $db->sql_fetchrow($result))
				$word_ids[$row['word_text']] = $row['word_id'];
			$new_words = array_diff($unique_add_words, array_keys($word_ids));

			if (sizeof($new_words))
				$sql_ary = array();

				foreach ($new_words as $word)
					$sql_ary[] = array('word_text' => (string) $word, 'word_count' => 0);
				$db->sql_multi_insert(SEARCH_WORDLIST_TABLE, $sql_ary);
			unset($new_words, $sql_ary);

		// now update the search match table, remove links to removed words and add links to new words
		foreach ($words['del'] as $word_in => $word_ary)
			$title_match = ($word_in == 'title') ? 1 : 0;

			if (sizeof($word_ary))
				$sql_in = array();
				foreach ($word_ary as $word)
					$sql_in[] = $cur_words[$word_in][$word];

					WHERE ' . $db->sql_in_set('word_id', $sql_in) . '
						AND post_id = ' . intval($post_id) . "
						AND title_match = $title_match";

					SET word_count = word_count - 1
					WHERE ' . $db->sql_in_set('word_id', $sql_in) . '
						AND word_count > 0';


		foreach ($words['add'] as $word_in => $word_ary)
			$title_match = ($word_in == 'title') ? 1 : 0;

			if (sizeof($word_ary))
				$sql = 'INSERT INTO ' . SEARCH_WORDMATCH_TABLE . ' (post_id, word_id, title_match)
					SELECT ' . (int) $post_id . ', word_id, ' . (int) $title_match . '
					WHERE ' . $db->sql_in_set('word_text', $word_ary);

					SET word_count = word_count + 1
					WHERE ' . $db->sql_in_set('word_text', $word_ary);


		// destroy cached search results containing any of the words removed or added
		$this->destroy_cache(array_unique(array_merge($words['add']['post'], $words['add']['title'], $words['del']['post'], $words['del']['title'])), array($poster_id));


	* Removes entries from the wordmatch table for the specified post_ids
	// Removes the index entries of the given posts: looks up the words linked to them,
	// lowers the word counts of those words and finally calls destroy_cache() with the
	// affected word texts and the author ids.
	// $post_ids and $author_ids are arrays of ids; $forum_ids is not used in the visible code.
	// NOTE(review): this extract has no braces and the heads of the UPDATE / DELETE
	// statements, the else line and the query calls appear to be missing.
	function index_remove($post_ids, $author_ids, $forum_ids)
		global $db;

		// Defined up front so that destroy_cache() below always receives an array, even when
		// $post_ids is empty and the branch that collects the word texts is skipped.
		$word_texts = array();

		if (sizeof($post_ids))
			$sql = 'SELECT w.word_id, w.word_text, m.title_match
				WHERE ' . $db->sql_in_set('m.post_id', $post_ids) . '
					AND w.word_id = m.word_id';
			$result = $db->sql_query($sql);

			// word ids are kept apart by where the word occurred (title or message)
			$message_word_ids = $title_word_ids = $word_texts = array();
			while ($row = $db->sql_fetchrow($result))
				if ($row['title_match'])
					$title_word_ids[] = $row['word_id'];
					$message_word_ids[] = $row['word_id'];
				$word_texts[] = $row['word_text'];

			if (sizeof($title_word_ids))
					SET word_count = word_count - 1
					WHERE ' . $db->sql_in_set('word_id', $title_word_ids) . '
						AND word_count > 0';

			if (sizeof($message_word_ids))
					SET word_count = word_count - 1
					WHERE ' . $db->sql_in_set('word_id', $message_word_ids) . '
						AND word_count > 0';


				WHERE ' . $db->sql_in_set('post_id', $post_ids);

		$this->destroy_cache(array_unique($word_texts), array_unique($author_ids));

	* Tidy up indexes: Tag 'common words' and remove
	* words no longer referenced in the match table
	function tidy()
		global $db, $config;

		// Periodic maintenance of the native search index: flags words that occur
		// in too many posts as "common" and records the time of the run in the
		// 'search_last_gc' config value.

		// Is the fulltext indexer disabled? If yes then we need not
		// carry on ... it's okay ... I know when I'm not wanted boo hoo
		if (!$config['fulltext_native_load_upd'])
			set_config('search_last_gc', time(), true);

		// Texts of all words whose cached search results have to be invalidated
		$destroy_cache_words = array();

		// Remove common words
		// Only done on boards with at least 100 posts and a non-zero threshold setting
		if ($config['num_posts'] >= 100 && $config['fulltext_native_common_thres'])
			// The threshold is configured as a percentage, convert it to a fraction
			$common_threshold = ((double) $config['fulltext_native_common_thres']) / 100.0;
			// First, get the IDs of common words
			// A word qualifies when its count exceeds floor(num_posts * fraction)
			// or when it has already been flagged as common
			$sql = 'SELECT word_id, word_text
				WHERE word_count > ' . floor($config['num_posts'] * $common_threshold) . '
					OR word_common = 1';
			$result = $db->sql_query($sql);

			$sql_in = array();
			while ($row = $db->sql_fetchrow($result))
				$sql_in[] = $row['word_id'];
				$destroy_cache_words[] = $row['word_text'];

			if (sizeof($sql_in))
				// Flag the words
					SET word_common = 1
					WHERE ' . $db->sql_in_set('word_id', $sql_in);

				// by setting search_last_gc to the new time here we make sure that if a user reloads because the
				// following query takes too long, he won't run into it again
				set_config('search_last_gc', time(), true);

				// Delete the matches
					WHERE ' . $db->sql_in_set('word_id', $sql_in);

		if (sizeof($destroy_cache_words))
			// destroy cached search results containing any of the words that are now common or were removed

		// Record the completion time of this run
		set_config('search_last_gc', time(), true);

	* Deletes all words from the index
	function delete_index($acp_module, $u_action)
		global $db;

		// Empties the word list, word match and search results tables.
		// $acp_module and $u_action are not referenced in the visible body.
		// The statement used depends on the database layer; only the branch for
		// sqlite and firebird (plain DELETE FROM on each table) is visible here.
		// NOTE(review): the handling of all other layers is not shown in this view - confirm.
		switch ($db->sql_layer)
			case 'sqlite':
			case 'firebird':
				$db->sql_query('DELETE FROM ' . SEARCH_WORDLIST_TABLE);
				$db->sql_query('DELETE FROM ' . SEARCH_WORDMATCH_TABLE);
				$db->sql_query('DELETE FROM ' . SEARCH_RESULTS_TABLE);


	* Returns true if the index holds data, i.e. both the word list and the word match tables report entries
	function index_created()
		// Reports whether the index contains data.
		// The guard below fires while $this->stats is still empty.
		// NOTE(review): the statement it guards is not visible here; presumably it loads the stats - confirm.
		if (!sizeof($this->stats))

		// true only when both the word count and the match count are non-zero
		return ($this->stats['total_words'] && $this->stats['total_matches']) ? true : false;

	* Returns an associative array containing information about the indexes
	function index_stats()
		global $user;

		// Returns the two index statistics keyed by their localised labels
		// ($user->lang['TOTAL_WORDS'] and $user->lang['TOTAL_MATCHES']).
		// The guard below fires while $this->stats is still empty.
		// NOTE(review): the statement it guards is not visible here; presumably it loads the stats - confirm.
		if (!sizeof($this->stats))

		return array(
			$user->lang['TOTAL_WORDS']		=> $this->stats['total_words'],
			$user->lang['TOTAL_MATCHES']	=> $this->stats['total_matches']);

	function get_stats()
		global $db;

		// Fills $this->stats with the row counts of the word list and word match
		// tables. The values come from get_estimated_row_count(), so they may be
		// estimates rather than exact counts. Nothing is returned.
		$this->stats['total_words']		= $db->get_estimated_row_count(SEARCH_WORDLIST_TABLE);
		$this->stats['total_matches']	= $db->get_estimated_row_count(SEARCH_WORDMATCH_TABLE);

	* Clean up a text to remove non-alphanumeric characters
	* This method receives a UTF-8 string, normalizes and validates it, replaces all
	* non-alphanumeric characters with spaces then returns the result.
	* Any number of "allowed chars" can be passed as a UTF-8 string in NFC.
	* @param	string	$text			Text to split, in UTF-8 (not normalized or sanitized)
	* @param	string	$allowed_chars	String of special chars to allow
	* @param	string	$encoding		Text encoding
	* @return	string					Cleaned up text, only alphanumeric chars are left
	* @todo normalizer::cleanup being able to be used?
	function cleanup($text, $allowed_chars = null, $encoding = 'utf-8')
		global $phpbb_root_path, $phpEx;
		// $conv caches per-character replacements and $conv_loaded remembers which
		// conversion blocks were already looked up; both are static and therefore
		// shared between calls
		static $conv = array(), $conv_loaded = array();
		$words = $allow = array();

		// Convert the text to UTF-8
		$encoding = strtolower($encoding);
		if ($encoding != 'utf-8')
			$text = utf8_recode($text, $encoding);

		// Maps the high nibble of a lead byte to the byte length of its UTF-8 sequence
		$utf_len_mask = array(
			"\xC0"	=>	2,
			"\xD0"	=>	2,
			"\xE0"	=>	3,
			"\xF0"	=>	4

		* Replace HTML entities and NCRs
		$text = htmlspecialchars_decode(utf8_decode_ncr($text), ENT_QUOTES);

		* Load the UTF-8 normalizer
		* If we use it more widely, an instance of that class should be held in a
		* a global variable instead

		* The first thing we do is:
		* - convert ASCII-7 letters to lowercase
		* - remove the ASCII-7 non-alpha characters
		* - remove the bytes that should not appear in a valid UTF-8 string: 0xC0,
		*   0xC1 and 0xF5-0xFF
		* @todo in theory, the third one is already taken care of during normalization and those chars should have been replaced by Unicode replacement chars
		// $sb_match and $sb_replace are parallel single-byte tables for strtr():
		// the byte at position i of $sb_match is replaced by the byte at position i of $sb_replace
		$sb_match	= "ISTCPAMELRDOJBNHFGVWUQKYXZ\r\n\t!\"#$%&'()*+,-./:;<=>?@[\\]^_`{|}~\x00\x01\x02\x03\x04\x05\x06\x07\x08\x0B\x0C\x0E\x0F\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1A\x1B\x1C\x1D\x1E\x1F\xC0\xC1\xF5\xF6\xF7\xF8\xF9\xFA\xFB\xFC\xFD\xFE\xFF";
		$sb_replace	= 'istcpamelrdojbnhfgvwuqkyxz                                                                              ';

		* This is the list of legal ASCII chars, it is automatically extended
		* with ASCII chars from $allowed_chars
		$legal_ascii = ' eaisntroludcpmghbfvq10xy2j9kw354867z';

		* Prepare an array containing the extra chars to allow
		// isset($allowed_chars[0]) is only true for a non-empty string
		if (isset($allowed_chars[0]))
			$pos = 0;
			$len = strlen($allowed_chars);
				$c = $allowed_chars[$pos];

				if ($c < "\x80")
					* ASCII char
					$sb_pos = strpos($sb_match, $c);
					// strpos() yields an integer offset on a hit and false otherwise
					if (is_int($sb_pos))
						* Remove the char from $sb_match and its corresponding
						* replacement in $sb_replace
						$sb_match = substr($sb_match, 0, $sb_pos) . substr($sb_match, $sb_pos + 1);
						$sb_replace = substr($sb_replace, 0, $sb_pos) . substr($sb_replace, $sb_pos + 1);
						$legal_ascii .= $c;

					* UTF-8 char
					// Sequence length is derived from the lead byte; the whole sequence becomes a key of $allow
					$utf_len = $utf_len_mask[$c & "\xF0"];
					$allow[substr($allowed_chars, $pos, $utf_len)] = 1;
					$pos += $utf_len;
			while ($pos < $len);

		// Apply the single-byte translation table to the whole text
		$text = strtr($text, $sb_match, $sb_replace);
		$ret = '';

		$pos = 0;
		$len = strlen($text);

			* Do all consecutive ASCII chars at once
			if ($spn = strspn($text, $legal_ascii, $pos))
				$ret .= substr($text, $pos, $spn);
				$pos += $spn;

			// End of the text reached, the cleaned string is complete
			if ($pos >= $len)
				return $ret;

			* Capture the UTF char
			$utf_len = $utf_len_mask[$text[$pos] & "\xF0"];
			$utf_char = substr($text, $pos, $utf_len);
			$pos += $utf_len;

			if (($utf_char >= UTF8_HANGUL_FIRST && $utf_char <= UTF8_HANGUL_LAST)
			 || ($utf_char >= UTF8_CJK_FIRST && $utf_char <= UTF8_CJK_LAST)
			 || ($utf_char >= UTF8_CJK_B_FIRST && $utf_char <= UTF8_CJK_B_LAST))
				* All characters within these ranges are valid
				* We separate them with a space in order to index each character
				* individually
				$ret .= ' ' . $utf_char . ' ';

			if (isset($allow[$utf_char]))
				* The char is explicitly allowed
				$ret .= $utf_char;

			if (isset($conv[$utf_char]))
				* The char is mapped to something, maybe to itself actually
				$ret .= $conv[$utf_char];

			* The char isn't mapped, but did we load its conversion table?
			* The search indexer table is split into blocks. The block number of
			* each char is equal to its codepoint right-shifted for 11 bits. It
			* means that out of the 11, 16 or 21 meaningful bits of a 2-, 3- or
			* 4- byte sequence we only keep the leftmost 0, 5 or 10 bits. Thus,
			* all UTF chars encoded in 2 bytes are in the same first block.
			// isset($utf_char[2]) / isset($utf_char[3]) test for a third / fourth byte in the sequence
			if (isset($utf_char[2]))
				if (isset($utf_char[3]))
					* 1111 0nnn 10nn nnnn 10nx xxxx 10xx xxxx
					* 0000 0111 0011 1111 0010 0000
					$idx = ((ord($utf_char[0]) & 0x07) << 7) | ((ord($utf_char[1]) & 0x3F) << 1) | ((ord($utf_char[2]) & 0x20) >> 5);
					* 1110 nnnn 10nx xxxx 10xx xxxx
					* 0000 0111 0010 0000
					// NOTE(review): the 0x07 mask keeps three of the four payload bits of the lead byte,
					// so this yields a 4-bit index rather than the 5 bits described above - confirm that
					// this matches the numbering of the search_indexer_* data files
					$idx = ((ord($utf_char[0]) & 0x07) << 1) | ((ord($utf_char[1]) & 0x20) >> 5);
				* 110x xxxx 10xx xxxx
				* 0000 0000 0000 0000
				$idx = 0;

			* Check if the required conv table has been loaded already
			if (!isset($conv_loaded[$idx]))
				// Mark the block as handled first so a missing file is not probed again
				$conv_loaded[$idx] = 1;
				$file = $phpbb_root_path . 'includes/utf/data/search_indexer_' . $idx . '.' . $phpEx;

				if (file_exists($file))
					// Array union: entries already present in $conv are kept
					$conv += include($file);

			if (isset($conv[$utf_char]))
				$ret .= $conv[$utf_char];
				* We add an entry to the conversion table so that we
				* don't have to convert to codepoint and perform the checks
				* that are above this block
				$conv[$utf_char] = ' ';
				$ret .= ' ';
		while (1);

		return $ret;

	* Returns a list of options for the ACP to display
	function acp()
		global $user, $config;

		// Builds the HTML fragment with the backend's four settings (update
		// toggle, minimum/maximum word length, common word threshold), pre-filled
		// from $config and labelled via $user->lang, and returns it together with
		// the validation type of each config key.

		* if we need any options, copied from fulltext_native for now, will have to be adjusted or removed

		// The numeric values are cast to int/double before being written into the markup
		$tpl = '
			<dt><label for="fulltext_native_load_upd">' . $user->lang['YES_SEARCH_UPDATE'] . ':</label><br /><span>' . $user->lang['YES_SEARCH_UPDATE_EXPLAIN'] . '</span></dt>
			<dd><label><input type="radio" id="fulltext_native_load_upd" name="config[fulltext_native_load_upd]" value="1"' . (($config['fulltext_native_load_upd']) ? ' checked="checked"' : '') . ' class="radio" /> ' . $user->lang['YES'] . '</label><label><input type="radio" name="config[fulltext_native_load_upd]" value="0"' . ((!$config['fulltext_native_load_upd']) ? ' checked="checked"' : '') . ' class="radio" /> ' . $user->lang['NO'] . '</label></dd>
			<dt><label for="fulltext_native_min_chars">' . $user->lang['MIN_SEARCH_CHARS'] . ':</label><br /><span>' . $user->lang['MIN_SEARCH_CHARS_EXPLAIN'] . '</span></dt>
			<dd><input id="fulltext_native_min_chars" type="text" size="3" maxlength="3" name="config[fulltext_native_min_chars]" value="' . (int) $config['fulltext_native_min_chars'] . '" /></dd>
			<dt><label for="fulltext_native_max_chars">' . $user->lang['MAX_SEARCH_CHARS'] . ':</label><br /><span>' . $user->lang['MAX_SEARCH_CHARS_EXPLAIN'] . '</span></dt>
			<dd><input id="fulltext_native_max_chars" type="text" size="3" maxlength="3" name="config[fulltext_native_max_chars]" value="' . (int) $config['fulltext_native_max_chars'] . '" /></dd>
			<dt><label for="fulltext_native_common_thres">' . $user->lang['COMMON_WORD_THRESHOLD'] . ':</label><br /><span>' . $user->lang['COMMON_WORD_THRESHOLD_EXPLAIN'] . '</span></dt>
			<dd><input id="fulltext_native_common_thres" type="text" size="3" maxlength="3" name="config[fulltext_native_common_thres]" value="' . (double) $config['fulltext_native_common_thres'] . '" /> %</dd>

		// These are fields required in the config table
		// 'tpl' carries the markup built above, 'config' maps each key to its type/range spec
		return array(
			'tpl'		=> $tpl,
			'config'	=> array('fulltext_native_load_upd' => 'bool', 'fulltext_native_min_chars' => 'integer:0:255', 'fulltext_native_max_chars' => 'integer:0:255', 'fulltext_native_common_thres' => 'double:0:100')


