1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
|
<?php
/**
* Rebuild search index table from scratch. This may take several
* hours, depending on the database size and server configuration.
*
* Postgres is trigger-based and should never need rebuilding.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
* http://www.gnu.org/copyleft/gpl.html
*
* @ingroup Maintenance
* @todo document
*/
require_once( dirname(__FILE__) . '/Maintenance.php' );
class RebuildTextIndex extends Maintenance {
const RTI_CHUNK_SIZE = 500;
private $db;
public function __construct() {
parent::__construct();
$this->mDescription = "Rebuild search index table from scratch";
}
public function getDbType() {
return Maintenance::DB_ADMIN;
}
public function execute() {
global $wgTitle, $wgDBtype;
// Shouldn't be needed for Postgres
if ( $wgDBtype == 'postgres' ) {
$this->error( "This script is not needed when using Postgres.\n", true );
}
$this->db = wfGetDB( DB_MASTER );
$wgTitle = Title::newFromText( "Rebuild text index script" );
if ( $wgDBtype == 'mysql' ) {
$this->dropMysqlTextIndex();
$this->populateSearchIndex();
$this->createMysqlTextIndex();
} else {
$this->clearSearchIndex();
$this->populateSearchIndex();
}
$this->output( "Done.\n" );
}
/**
* Populates the search index with content from all pages
*/
protected function populateSearchIndex() {
$res = $this->db->select( 'page', 'MAX(page_id) AS count' );
$s = $this->db->fetchObject($res);
$count = $s->count;
$this->output( "Rebuilding index fields for {$count} pages...\n" );
$n = 0;
while ( $n < $count ) {
$this->output( $n . "\n" );
$end = $n + self::RTI_CHUNK_SIZE - 1;
$res = $this->db->select( array( 'page', 'revision', 'text' ),
array( 'page_id', 'page_namespace', 'page_title', 'old_flags', 'old_text' ),
array( "page_id BETWEEN $n AND $end", 'page_latest = rev_id', 'rev_text_id = old_id' ),
__METHOD__
);
foreach( $res as $s ) {
$revtext = Revision::getRevisionText( $s );
$u = new SearchUpdate( $s->page_id, $s->page_title, $revtext );
$u->doUpdate();
}
$this->db->freeResult( $res );
$n += self::RTI_CHUNK_SIZE;
}
}
/**
* (MySQL only) Drops fulltext index before populating the table.
*/
private function dropMysqlTextIndex() {
$searchindex = $this->db->tableName( 'searchindex' );
if ( $this->db->indexExists( 'searchindex', 'si_title' ) ) {
$this->output( "Dropping index...\n" );
$sql = "ALTER TABLE $searchindex DROP INDEX si_title, DROP INDEX si_text";
$this->db->query($sql, __METHOD__ );
}
}
/**
* (MySQL only) Adds back fulltext index after populating the table.
*/
private function createMysqlTextIndex() {
$searchindex = $this->db->tableName( 'searchindex' );
$this->output( "\nRebuild the index...\n" );
$sql = "ALTER TABLE $searchindex ADD FULLTEXT si_title (si_title), " .
"ADD FULLTEXT si_text (si_text)";
$this->db->query( $sql, __METHOD__ );
}
/**
* Deletes everything from search index.
*/
private function clearSearchIndex() {
$this->output( 'Clearing searchindex table...' );
$this->db->delete( 'searchindex', '*', __METHOD__ );
$this->output( "Done\n" );
}
}
$maintClass = "RebuildTextIndex";
require_once( DO_MAINTENANCE );
|