mirror of
				https://github.com/phpbb/phpbb.git
				synced 2025-10-25 13:46:50 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			346 lines
		
	
	
		
			8.6 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			346 lines
		
	
	
		
			8.6 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | |
| /***************************************************************************
 | |
|  *                             admin_search.php
 | |
|  *                            -------------------
 | |
|  *   begin                : Saturday, Feb 13, 2001
 | |
|  *   copyright            : (C) 2001 The phpBB Group
 | |
|  *   email                : support@phpbb.com
 | |
|  *
 | |
|  *   $Id$
 | |
|  *
 | |
|  ***************************************************************************/
 | |
| 
 | |
| /***************************************************************************
 | |
|  *
 | |
|  *   This program is free software; you can redistribute it and/or modify
 | |
|  *   it under the terms of the GNU General Public License as published by
 | |
|  *   the Free Software Foundation; either version 2 of the License, or
 | |
|  *   (at your option) any later version.
 | |
|  *
 | |
|  ***************************************************************************/
 | |
| 
 | |
| if (!empty($setmodules))
 | |
| {
 | |
| 	if (!$auth->acl_get('a_search'))
 | |
| 	{
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	$module['DB']['Search_indexing'] = basename(__FILE__) . $SID;
 | |
| 
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| define('IN_PHPBB', 1);
 | |
| // Include files
 | |
| $phpbb_root_path = '../';
 | |
| require($phpbb_root_path . 'extension.inc');
 | |
| require('pagestart.' . $phpEx);
 | |
| include($phpbb_root_path . 'includes/functions_posting.'.$phpEx);
 | |
| 
 | |
| // Check permissions
 | |
| if (!$auth->acl_get('a_search'))
 | |
| {
 | |
| 	trigger_error($user->lang['NO_ADMIN']);
 | |
| }
 | |
| 
 | |
| // Start indexing
 | |
| if (isset($_POST['start']) || isset($_GET['batchstart']))
 | |
| {
 | |
| 	$batchsize = 200; // Process this many posts per batch
 | |
| 	$batchstart = (!isset($_GET['batchstart'])) ? $row['min_post_id'] : $_GET['batchstart'];
 | |
| 	$batchcount = (!isset($_GET['batchcount'])) ? 1 : $_GET['batchcount'];
 | |
| 	$loopcount = 0;
 | |
| 	$batchend = $batchstart + $batchsize;
 | |
| 
 | |
| 	// Search re-indexing is tough on the server ... so we'll check the load
 | |
| 	// each loop and if we're on a 1min load of 3 or more we'll re-load the page
 | |
| 	// and try again. No idea how well this will work in practice so we'll see ...
 | |
| 	if (file_exists('/proc/loadavg'))
 | |
| 	{
 | |
| 		if ($load = @file('/proc/loadavg'))
 | |
| 		{
 | |
| 			list($load) = explode(' ', $load[0]);
 | |
| 
 | |
| 			if ($load > 3)
 | |
| 			{
 | |
| 				header("Location: admin_search.$phpEx$SID&batchstart=$batchstart&batchcount=$batch_count");
 | |
| 				exit;
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	// Try and load stopword and synonym files
 | |
| 	$stopword_array = array();
 | |
| 	$synonym_array = array();
 | |
| 
 | |
| 	$dir = opendir($phpbb_root_path . 'language/');
 | |
| 	while ($file = readdir($dir))
 | |
| 	{
 | |
| 		if (preg_match('#^lang_#', $file) && !is_file($phpbb_root_path . 'language/' . $file) && !is_link($phpbb_root_path . 'language/' . $file))
 | |
| 		{
 | |
| 			unset($tmp_array);
 | |
| 			$tmp_array = @file($phpbb_root_path . 'language/' . $file . '/search_stopwords.txt');
 | |
| 			if (is_array($tmp_array))
 | |
| 			{
 | |
| 				$stopword_array = array_unique(array_merge($stopword_array, $tmp_array));
 | |
| 			}
 | |
| 
 | |
| 			unset($tmp_array);
 | |
| 			$tmp_array = @file($phpbb_root_path . 'language/' . $file . '/search_synonyms.txt');
 | |
| 			if (is_array($tmp_array))
 | |
| 			{
 | |
| 				$synonym_array = array_unique(array_merge($synonym_array, $tmp_array));
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	closedir($dir);
 | |
| 
 | |
| 	if (!isset($_GET['batchstart']))
 | |
| 	{
 | |
| 		//
 | |
| 		// Take board offline
 | |
| 		//
 | |
| 		$sql = "UPDATE " . CONFIG_TABLE . "
 | |
| 			SET config_value = '1'
 | |
| 			WHERE config_name = 'board_disable'";
 | |
| 		$db->sql_query($sql);
 | |
| 
 | |
| 		//
 | |
| 		// Empty existing tables
 | |
| 		//
 | |
| 		$db->sql_query("TRUNCATE " . SEARCH_TABLE);
 | |
| 		$db->sql_query("TRUNCATE " . SEARCH_WORD_TABLE);
 | |
| 		$db->sql_query("TRUNCATE " . SEARCH_MATCH_TABLE);
 | |
| 	}
 | |
| 
 | |
| 	//
 | |
| 	// Fetch a batch of posts_text entries
 | |
| 	//
 | |
| 	$sql = "SELECT COUNT(*) AS total, MAX(post_id) AS max_post_id, MIN(post_id) AS min_post_id
 | |
| 		FROM " . POSTS_TEXT_TABLE;
 | |
| 	$result = $db->sql_query($sql);
 | |
| 
 | |
| 	$row = $db->sql_fetchrow($result);
 | |
| 	$totalposts = $row['total'];
 | |
| 	$max_post_id = $row['max_post_id'];
 | |
| 
 | |
| 	$db->sql_freeresult($result);
 | |
| 
 | |
| 	$sql = "SELECT *
 | |
| 		FROM " . POSTS_TEXT_TABLE . "
 | |
| 		WHERE post_id
 | |
| 			BETWEEN $batchstart
 | |
| 				AND $batchend";
 | |
| 	$result = $db->sql_query($sql);
 | |
| 
 | |
| 	if ($row = $db->sql_fetchrow($result))
 | |
| 	{
 | |
| 		do
 | |
| 		{
 | |
| 			$post_id = $row['post_id'];
 | |
| 
 | |
| 			$search_raw_words = array();
 | |
| 			$search_raw_words['text'] = split_words(clean_words('post', $row['post_text'], $stopword_array, $synonym_array));
 | |
| 			$search_raw_words['title'] = split_words(clean_words('post', $row['post_subject'], $stopword_array, $synonym_array));
 | |
| 
 | |
| 			$word = array();
 | |
| 			$word_insert_sql = array();
 | |
| 			foreach ($search_raw_words as $word_in => $search_matches)
 | |
| 			{
 | |
| 				$word_insert_sql[$word_in] = '';
 | |
| 				if (!empty($search_matches))
 | |
| 				{
 | |
| 					for ($i = 0; $i < count($search_matches); $i++)
 | |
| 					{
 | |
| 						$search_matches[$i] = trim($search_matches[$i]);
 | |
| 
 | |
| 						if ($search_matches[$i] != '')
 | |
| 						{
 | |
| 							$word[] = $search_matches[$i];
 | |
| 							$word_insert_sql[$word_in] .= ($word_insert_sql[$word_in] != '') ? ", '" . $search_matches[$i] . "'" : "'" . $search_matches[$i] . "'";
 | |
| 						}
 | |
| 					}
 | |
| 				}
 | |
| 			}
 | |
| 
 | |
| 			if (count($word))
 | |
| 			{
 | |
| 				$word_text_sql = '';
 | |
| 				$word = array_unique($word);
 | |
| 
 | |
| 				for($i = 0; $i < count($word); $i++)
 | |
| 				{
 | |
| 					$word_text_sql .= (($word_text_sql != '') ? ', ' : '') . "'" . $word[$i] . "'";
 | |
| 				}
 | |
| 
 | |
| 				$check_words = array();
 | |
| 				switch(SQL_LAYER)
 | |
| 				{
 | |
| 					case 'postgresql':
 | |
| 					case 'msaccess':
 | |
| 					case 'mssql-odbc':
 | |
| 					case 'oracle':
 | |
| 					case 'db2':
 | |
| 						$sql = "SELECT word_id, word_text
 | |
| 							FROM " . SEARCH_WORD_TABLE . "
 | |
| 							WHERE word_text IN ($word_text_sql)";
 | |
| 						$result = $db->sql_query($sql);
 | |
| 
 | |
| 						while ($row = $db->sql_fetchrow($result))
 | |
| 						{
 | |
| 							$check_words[$row['word_text']] = $row['word_id'];
 | |
| 						}
 | |
| 						break;
 | |
| 				}
 | |
| 
 | |
| 				$value_sql = '';
 | |
| 				$match_word = array();
 | |
| 				for ($i = 0; $i < count($word); $i++)
 | |
| 				{
 | |
| 					$new_match = true;
 | |
| 					if (isset($check_words[$word[$i]]))
 | |
| 					{
 | |
| 						$new_match = false;
 | |
| 					}
 | |
| 
 | |
| 					if ($new_match)
 | |
| 					{
 | |
| 						switch(SQL_LAYER)
 | |
| 						{
 | |
| 							case 'mysql':
 | |
| 							case 'mysql4':
 | |
| 								$value_sql .= (($value_sql != '') ? ', ' : '') . '(\'' . $word[$i] . '\')';
 | |
| 								break;
 | |
| 							case 'mssql':
 | |
| 								$value_sql .= (($value_sql != '') ? ' UNION ALL ' : '') . "SELECT '" . $word[$i] . "'";
 | |
| 								break;
 | |
| 							default:
 | |
| 								$sql = "INSERT INTO " . SEARCH_WORD_TABLE . " (word_text)
 | |
| 									VALUES ('" . $word[$i] . "')";
 | |
| 								$db->sql_query($sql);
 | |
| 								break;
 | |
| 						}
 | |
| 					}
 | |
| 				}
 | |
| 
 | |
| 				if ($value_sql != '')
 | |
| 				{
 | |
| 					switch (SQL_LAYER)
 | |
| 					{
 | |
| 						case 'mysql':
 | |
| 						case 'mysql4':
 | |
| 							$sql = "INSERT IGNORE INTO " . SEARCH_WORD_TABLE . " (word_text)
 | |
| 								VALUES $value_sql";
 | |
| 							break;
 | |
| 						case 'mssql':
 | |
| 							$sql = "INSERT INTO " . SEARCH_WORD_TABLE . " (word_text)
 | |
| 								$value_sql";
 | |
| 							break;
 | |
| 					}
 | |
| 
 | |
| 					$db->sql_query($sql);
 | |
| 				}
 | |
| 			}
 | |
| 
 | |
| 			foreach ($word_insert_sql as $word_in => $match_sql)
 | |
| 			{
 | |
| 				$title_match = ($word_in == 'title') ? 1 : 0;
 | |
| 
 | |
| 				if ($match_sql != '')
 | |
| 				{
 | |
| 					$sql = "INSERT INTO " . SEARCH_MATCH_TABLE . " (post_id, word_id, title_match)
 | |
| 						SELECT $post_id, word_id, $title_match
 | |
| 							FROM " . SEARCH_WORD_TABLE . "
 | |
| 							WHERE word_text IN ($match_sql)";
 | |
| 					$db->sql_query($sql);
 | |
| 				}
 | |
| 			}
 | |
| 
 | |
| 		}
 | |
| 		while ($row = $db->sql_fetchrow($result));
 | |
| 	}
 | |
| 
 | |
| 	$db->sql_freeresult($result);
 | |
| 
 | |
| 	// Remove common words after the first 2 batches and after every 4th batch after that.
 | |
| 	if ($batchcount % 4 == 3)
 | |
| 	{
 | |
| //		remove_common('global', $config['common_search']);
 | |
| 	}
 | |
| 
 | |
| 	$batchcount++;
 | |
| 
 | |
| 	if (($batchstart + $batchsize) < $max_post_id)
 | |
| 	{
 | |
| 		header("Location: admin_search.$phpEx$SID&batchstart=" . ($batchstart + $batchsize) . "&batchcount=$batch_count");
 | |
| 		exit;
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		$sql = "UPDATE " . CONFIG_TABLE . "
 | |
| 			SET config_value = '0'
 | |
| 			WHERE config_name = 'board_disable'";
 | |
| 		$db->sql_query($sql);
 | |
| 
 | |
| 		page_header($user->lang['Search_indexing']);
 | |
| 
 | |
| ?>
 | |
| 
 | |
| <h1><?php echo $user->lang['Search_indexing']; ?></h1>
 | |
| 
 | |
| <p><?php echo $user->lang['Search_indexing_complete']; ?></p>
 | |
| 
 | |
| <?php
 | |
| 
 | |
| 		page_footer();
 | |
| 
 | |
| 	}
 | |
| 
 | |
| 	exit;
 | |
| 
 | |
| }
 | |
| else if (isset($_POST['cancel']))
 | |
| {
 | |
| 	$sql = "UPDATE " . CONFIG_TABLE . "
 | |
| 		SET config_value = '0'
 | |
| 		WHERE config_name = 'board_disable'";
 | |
| 	$db->sql_query($sql);
 | |
| 
 | |
| 	page_header($user->lang['Search_indexing']);
 | |
| 
 | |
| ?>
 | |
| 
 | |
| <h1><?php echo $user->lang['Search_indexing']; ?></h1>
 | |
| 
 | |
| <p><?php echo $user->lang['Search_indexing_cancel']; ?></p>
 | |
| 
 | |
| <?php
 | |
| 
 | |
| 	page_footer();
 | |
| 
 | |
| }
 | |
| else
 | |
| {
 | |
| 	page_header($user->lang['Search_indexing']);
 | |
| 
 | |
| ?>
 | |
| 
 | |
| <h1><?php echo $user->lang['Search_indexing']; ?></h1>
 | |
| 
 | |
| <p><?php echo $user->lang['Search_indexing_explain']; ?></p>
 | |
| 
 | |
| <form method="post" action="<?php echo "admin_search.$phpEx$SID"; ?>"><table cellspacing="1" cellpadding="4" border="0" align="center" bgcolor="#98AAB1">
 | |
| 	<tr>
 | |
| 		<td class="cat" height="28" align="center"> <input type="submit" name="start" value="<?php echo $user->lang['Start']; ?>" class="mainoption" />   <input type="submit" name="cancel" value="<?php echo $user->lang['Cancel']; ?>" class="mainoption" /> </td>
 | |
| 	</tr>
 | |
| </table></form>
 | |
| 
 | |
| <?php
 | |
| 
 | |
| 	page_footer();
 | |
| 
 | |
| }
 | |
| 
 | |
| ?>
 |