- added a UNIQUE index on the wordmatch table

- some modifications of search indexing which might improve the speed and hopefully fixes [Bug #8352]
- added logging to search indexing [Bug #8384]


git-svn-id: file:///svn/phpbb/trunk@7119 89ea8834-ac86-4346-8a33-228a782c2dd0
This commit is contained in:
Nils Adermann 2007-03-04 16:05:17 +00:00
parent 567b01302b
commit ac21b7d47b
13 changed files with 57 additions and 28 deletions

View file

@ -1474,6 +1474,7 @@ function get_schema_struct()
'title_match' => array('BOOL', 0), 'title_match' => array('BOOL', 0),
), ),
'KEYS' => array( 'KEYS' => array(
'unique_match' => array('UNIQUE', array('word_id', 'post_id', 'title_match')),
'word_id' => array('INDEX', 'word_id'), 'word_id' => array('INDEX', 'word_id'),
'post_id' => array('INDEX', 'post_id'), 'post_id' => array('INDEX', 'post_id'),
), ),

View file

@ -8,16 +8,6 @@
* *
*/ */
/**
* @ignore
*/
if (!defined('IN_PHPBB'))
{
exit;
}
// make sure, a start time is saved
still_on_time();
/** /**
* @package acp * @package acp
*/ */
@ -27,7 +17,7 @@ class acp_search
var $state; var $state;
var $search; var $search;
var $max_post_id; var $max_post_id;
var $batch_size = 1000; var $batch_size = 100;
function main($id, $mode) function main($id, $mode)
{ {
@ -260,6 +250,7 @@ class acp_search
{ {
trigger_error($error . adm_back_link($this->u_action), E_USER_WARNING); trigger_error($error . adm_back_link($this->u_action), E_USER_WARNING);
} }
$name = ucfirst(strtolower(str_replace('_', ' ', $this->state[0])));
$action = &$this->state[1]; $action = &$this->state[1];
@ -284,12 +275,15 @@ class acp_search
} }
else else
{ {
$starttime = explode(' ', microtime());
$starttime = $starttime[1] + $starttime[0];
$row_count = 0;
while (still_on_time() && $post_counter <= $this->max_post_id) while (still_on_time() && $post_counter <= $this->max_post_id)
{ {
$sql = 'SELECT post_id, poster_id, forum_id $sql = 'SELECT post_id, poster_id, forum_id
FROM ' . POSTS_TABLE . ' FROM ' . POSTS_TABLE . '
WHERE post_id >= ' . (int) ($post_counter + 1) . ' WHERE post_id >= ' . (int) ($post_counter + 1) . '
AND post_id < ' . (int) ($post_counter + $this->batch_size); AND post_id <= ' . (int) ($post_counter + $this->batch_size);
$result = $db->sql_query($sql); $result = $db->sql_query($sql);
$ids = $posters = $forum_ids = array(); $ids = $posters = $forum_ids = array();
@ -300,6 +294,7 @@ class acp_search
$forum_ids[] = $row['forum_id']; $forum_ids[] = $row['forum_id'];
} }
$db->sql_freeresult($result); $db->sql_freeresult($result);
$row_count += sizeof($ids);
if (sizeof($ids)) if (sizeof($ids))
{ {
@ -307,15 +302,17 @@ class acp_search
} }
$post_counter += $this->batch_size; $post_counter += $this->batch_size;
}
// save the current state // save the current state
$this->save_state(); $this->save_state();
}
if ($post_counter <= $this->max_post_id) if ($post_counter <= $this->max_post_id)
{ {
$mtime = explode(' ', microtime());
$totaltime = $mtime[0] + $mtime[1] - $starttime;
$rows_per_second = $row_count / $totaltime;
meta_refresh(1, $this->u_action . '&amp;action=delete&amp;skip_rows=' . $post_counter); meta_refresh(1, $this->u_action . '&amp;action=delete&amp;skip_rows=' . $post_counter);
trigger_error(sprintf($user->lang['SEARCH_INDEX_DELETE_REDIRECT'], $post_counter)); trigger_error(sprintf($user->lang['SEARCH_INDEX_DELETE_REDIRECT'], $post_counter, $row_count, $rows_per_second));
} }
} }
@ -324,6 +321,7 @@ class acp_search
$this->state = array(''); $this->state = array('');
$this->save_state(); $this->save_state();
add_log('admin', 'LOG_SEARCH_INDEX_REMOVED', $name);
trigger_error($user->lang['SEARCH_INDEX_REMOVED'] . adm_back_link($this->u_action) . $this->close_popup_js()); trigger_error($user->lang['SEARCH_INDEX_REMOVED'] . adm_back_link($this->u_action) . $this->close_popup_js());
break; break;
@ -350,12 +348,15 @@ class acp_search
} }
$db->sql_freeresult($result); $db->sql_freeresult($result);
$starttime = explode(' ', microtime());
$starttime = $starttime[1] + $starttime[0];
$row_count = 0;
while (still_on_time() && $post_counter <= $this->max_post_id) while (still_on_time() && $post_counter <= $this->max_post_id)
{ {
$sql = 'SELECT post_id, post_subject, post_text, poster_id, forum_id $sql = 'SELECT post_id, post_subject, post_text, poster_id, forum_id
FROM ' . POSTS_TABLE . ' FROM ' . POSTS_TABLE . '
WHERE post_id >= ' . (int) ($post_counter + 1) . ' WHERE post_id >= ' . (int) ($post_counter + 1) . '
AND post_id < ' . (int) ($post_counter + $this->batch_size); AND post_id <= ' . (int) ($post_counter + $this->batch_size);
$result = $db->sql_query($sql); $result = $db->sql_query($sql);
while ($row = $db->sql_fetchrow($result)) while ($row = $db->sql_fetchrow($result))
@ -366,19 +367,29 @@ class acp_search
{ {
$this->search->index('post', $row['post_id'], $row['post_text'], $row['post_subject'], $row['poster_id'], $row['forum_id']); $this->search->index('post', $row['post_id'], $row['post_text'], $row['post_subject'], $row['poster_id'], $row['forum_id']);
} }
$row_count++;
} }
$db->sql_freeresult($result); $db->sql_freeresult($result);
$post_counter += $this->batch_size; $post_counter += $this->batch_size;
}
// save the current state // save the current state
$this->save_state(); $this->save_state();
}
// pretend the number of posts was as big as the number of ids we indexed so far
// just an estimation as it includes deleted posts
$num_posts = $config['num_posts'];
$config['num_posts'] = min($config['num_posts'], $post_counter);
$this->search->tidy();
$config['num_posts'] = $num_posts;
if ($post_counter <= $this->max_post_id) if ($post_counter <= $this->max_post_id)
{ {
$mtime = explode(' ', microtime());
$totaltime = $mtime[0] + $mtime[1] - $starttime;
$rows_per_second = $row_count / $totaltime;
meta_refresh(1, $this->u_action . '&amp;action=create&amp;skip_rows=' . $post_counter); meta_refresh(1, $this->u_action . '&amp;action=create&amp;skip_rows=' . $post_counter);
trigger_error(sprintf($user->lang['SEARCH_INDEX_CREATE_REDIRECT'], $post_counter)); trigger_error(sprintf($user->lang['SEARCH_INDEX_CREATE_REDIRECT'], $post_counter, $row_count, $rows_per_second));
} }
} }
@ -387,6 +398,7 @@ class acp_search
$this->state = array(''); $this->state = array('');
$this->save_state(); $this->save_state();
add_log('admin', 'LOG_SEARCH_INDEX_CREATED', $name);
trigger_error($user->lang['SEARCH_INDEX_CREATED'] . adm_back_link($this->u_action) . $this->close_popup_js()); trigger_error($user->lang['SEARCH_INDEX_CREATED'] . adm_back_link($this->u_action) . $this->close_popup_js());
break; break;
} }

View file

@ -180,7 +180,7 @@ function unique_id($extra = 'c')
* @return bool Either true if the maximum execution time is nearly reached, or false * @return bool Either true if the maximum execution time is nearly reached, or false
* if some time is still left. * if some time is still left.
*/ */
function still_on_time() function still_on_time($extra_time = 15)
{ {
static $max_execution_time, $start_time; static $max_execution_time, $start_time;
@ -194,10 +194,10 @@ function still_on_time()
// If zero, then set to something higher to not let the user catch the ten seconds barrier. // If zero, then set to something higher to not let the user catch the ten seconds barrier.
if ($max_execution_time === 0) if ($max_execution_time === 0)
{ {
$max_execution_time = 65; $max_execution_time = 50 + $extra_time;
} }
$max_execution_time = min(max(10, ($max_execution_time - 15)), 50); $max_execution_time = min(max(10, ($max_execution_time - $extra_time)), 50);
// For debugging purposes // For debugging purposes
// $max_execution_time = 10; // $max_execution_time = 10;

View file

@ -1110,7 +1110,6 @@ class fulltext_native extends search_backend
$word_ids[$row['word_text']] = $row['word_id']; $word_ids[$row['word_text']] = $row['word_id'];
} }
$db->sql_freeresult($result); $db->sql_freeresult($result);
$new_words = array_diff($unique_add_words, array_keys($word_ids)); $new_words = array_diff($unique_add_words, array_keys($word_ids));
if (sizeof($new_words)) if (sizeof($new_words))
@ -1121,8 +1120,9 @@ class fulltext_native extends search_backend
{ {
$sql_ary[] = array('word_text' => $word); $sql_ary[] = array('word_text' => $word);
} }
$db->return_on_error = true;
$db->sql_multi_insert(SEARCH_WORDLIST_TABLE, $sql_ary); $db->sql_multi_insert(SEARCH_WORDLIST_TABLE, $sql_ary);
$db->return_on_error = false;
} }
unset($new_words, $sql_ary); unset($new_words, $sql_ary);
} }
@ -1149,6 +1149,7 @@ class fulltext_native extends search_backend
} }
} }
$db->return_on_error = true;
foreach ($words['add'] as $word_in => $word_ary) foreach ($words['add'] as $word_in => $word_ary)
{ {
$title_match = ($word_in == 'title') ? 1 : 0; $title_match = ($word_in == 'title') ? 1 : 0;
@ -1162,6 +1163,7 @@ class fulltext_native extends search_backend
$db->sql_query($sql); $db->sql_query($sql);
} }
} }
$db->return_on_error = false;
// destroy cached search results containing any of the words removed or added // destroy cached search results containing any of the words removed or added
$this->destroy_cache(array_unique(array_merge($words['add']['post'], $words['add']['title'], $words['del']['post'], $words['del']['title'])), array($poster_id)); $this->destroy_cache(array_unique(array_merge($words['add']['post'], $words['add']['title'], $words['del']['post'], $words['del']['title'])), array($poster_id));

View file

@ -369,6 +369,9 @@ $database_update_info = array(
), ),
// Add the following unique indexes // Add the following unique indexes
'add_unique_index' => array( 'add_unique_index' => array(
SEARCH_WORDMATCH_TABLE => array(
'unique_match' => array('word_id', 'post_id', 'title_match'),
),
USERS_TABLE => array( USERS_TABLE => array(
'username_clean' => array('username_clean'), 'username_clean' => array('username_clean'),
), ),

View file

@ -949,6 +949,7 @@ CREATE TABLE phpbb_search_wordmatch (
title_match INTEGER DEFAULT 0 NOT NULL title_match INTEGER DEFAULT 0 NOT NULL
);; );;
CREATE UNIQUE INDEX phpbb_search_wordmatch_unique_match ON phpbb_search_wordmatch(word_id, post_id, title_match);;
CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch(word_id);; CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch(word_id);;
CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch(post_id);; CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch(post_id);;

View file

@ -1123,6 +1123,9 @@ CREATE TABLE [phpbb_search_wordmatch] (
) ON [PRIMARY] ) ON [PRIMARY]
GO GO
CREATE UNIQUE INDEX [unique_match] ON [phpbb_search_wordmatch]([word_id], [post_id], [title_match]) ON [PRIMARY]
GO
CREATE INDEX [word_id] ON [phpbb_search_wordmatch]([word_id]) ON [PRIMARY] CREATE INDEX [word_id] ON [phpbb_search_wordmatch]([word_id]) ON [PRIMARY]
GO GO

View file

@ -648,6 +648,7 @@ CREATE TABLE phpbb_search_wordmatch (
post_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL, post_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL,
word_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL, word_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL,
title_match tinyint(1) UNSIGNED DEFAULT '0' NOT NULL, title_match tinyint(1) UNSIGNED DEFAULT '0' NOT NULL,
UNIQUE unique_match (word_id, post_id, title_match),
KEY word_id (word_id), KEY word_id (word_id),
KEY post_id (post_id) KEY post_id (post_id)
); );

View file

@ -648,6 +648,7 @@ CREATE TABLE phpbb_search_wordmatch (
post_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL, post_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL,
word_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL, word_id mediumint(8) UNSIGNED DEFAULT '0' NOT NULL,
title_match tinyint(1) UNSIGNED DEFAULT '0' NOT NULL, title_match tinyint(1) UNSIGNED DEFAULT '0' NOT NULL,
UNIQUE unique_match (word_id, post_id, title_match),
KEY word_id (word_id), KEY word_id (word_id),
KEY post_id (post_id) KEY post_id (post_id)
) CHARACTER SET `utf8` COLLATE `utf8_bin`; ) CHARACTER SET `utf8` COLLATE `utf8_bin`;

View file

@ -1260,7 +1260,8 @@ END;
CREATE TABLE phpbb_search_wordmatch ( CREATE TABLE phpbb_search_wordmatch (
post_id number(8) DEFAULT '0' NOT NULL, post_id number(8) DEFAULT '0' NOT NULL,
word_id number(8) DEFAULT '0' NOT NULL, word_id number(8) DEFAULT '0' NOT NULL,
title_match number(1) DEFAULT '0' NOT NULL title_match number(1) DEFAULT '0' NOT NULL,
CONSTRAINT u_phpbb_unique_match UNIQUE (word_id, post_id, title_match)
) )
/ /

View file

@ -862,6 +862,7 @@ CREATE TABLE phpbb_search_wordmatch (
title_match INT2 DEFAULT '0' NOT NULL CHECK (title_match >= 0) title_match INT2 DEFAULT '0' NOT NULL CHECK (title_match >= 0)
); );
CREATE UNIQUE INDEX phpbb_search_wordmatch_unique_match ON phpbb_search_wordmatch (word_id, post_id, title_match);
CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch (word_id); CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch (word_id);
CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch (post_id); CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch (post_id);

View file

@ -628,6 +628,7 @@ CREATE TABLE phpbb_search_wordmatch (
title_match INTEGER UNSIGNED NOT NULL DEFAULT '0' title_match INTEGER UNSIGNED NOT NULL DEFAULT '0'
); );
CREATE UNIQUE INDEX phpbb_search_wordmatch_unique_match ON phpbb_search_wordmatch (word_id, post_id, title_match);
CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch (word_id); CREATE INDEX phpbb_search_wordmatch_word_id ON phpbb_search_wordmatch (word_id);
CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch (post_id); CREATE INDEX phpbb_search_wordmatch_post_id ON phpbb_search_wordmatch (post_id);

View file

@ -587,6 +587,8 @@ $lang = array_merge($lang, array(
'LOG_RESYNC_POST_MARKING' => '<strong>Dotted topics resynchronised</strong>', 'LOG_RESYNC_POST_MARKING' => '<strong>Dotted topics resynchronised</strong>',
'LOG_RESYNC_STATS' => '<strong>Post, topic and user statistics resynchronised</strong>', 'LOG_RESYNC_STATS' => '<strong>Post, topic and user statistics resynchronised</strong>',
'LOG_SEARCH_INDEX_CREATED' => '<strong>Created search index for</strong><br />» %s',
'LOG_SEARCH_INDEX_REMOVED' => '<strong>Removed search index for</strong><br />» %s',
'LOG_STYLE_ADD' => '<strong>Added new style</strong><br />» %s', 'LOG_STYLE_ADD' => '<strong>Added new style</strong><br />» %s',
'LOG_STYLE_DELETE' => '<strong>Deleted style</strong><br />» %s', 'LOG_STYLE_DELETE' => '<strong>Deleted style</strong><br />» %s',
'LOG_STYLE_EDIT_DETAILS' => '<strong>Edited style</strong><br />» %s', 'LOG_STYLE_EDIT_DETAILS' => '<strong>Edited style</strong><br />» %s',