#!/usr/bin/env php <?php /* * StatusNet - the distributed open-source microblogging tool * Copyright (C) 2009, StatusNet, Inc. * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License as published by * the Free Software Foundation, either version 3 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU Affero General Public License for more details. * * You should have received a copy of the GNU Affero General Public License * along with this program. If not, see <http://www.gnu.org/licenses/>. */ # Abort if called from a web server define('INSTALLDIR', realpath(dirname(__FILE__) . '/..')); $helptext = <<<ENDOFHELP fixup_utf8.php <maxdate> <maxid> <minid> Fixup records in a database that stored the data incorrectly (pre-0.7.4 for StatusNet). ENDOFHELP; require_once INSTALLDIR.'/scripts/commandline.inc'; require_once 'DB.php'; class UTF8FixerUpper { var $dbl = null; var $dbu = null; var $args = array(); function __construct($args) { $this->args = $args; if (!empty($args['max_date'])) { $this->max_date = strftime('%Y-%m-%d %H:%M:%S', strtotime($args['max_date'])); } else { $this->max_date = strftime('%Y-%m-%d %H:%M:%S', time()); } $this->dbl = $this->doConnect('latin1'); if (empty($this->dbl)) { return; } $this->dbu = $this->doConnect('utf8'); if (empty($this->dbu)) { return; } } function doConnect($charset) { $db = DB::connect(common_config('db', 'database'), array('persistent' => false)); if (PEAR::isError($db)) { echo "ERROR: " . $db->getMessage() . "\n"; return NULL; } $conn = $db->connection; $succ = mysqli_set_charset($conn, $charset); if (!$succ) { echo "ERROR: couldn't set charset\n"; $db->disconnect(); return NULL; } $result = $db->autoCommit(true); if (PEAR::isError($result)) { echo "ERROR: " . $result->getMessage() . "\n"; $db->disconnect(); return NULL; } return $db; } function fixup() { $this->fixupNotices($this->args['max_notice'], $this->args['min_notice']); $this->fixupProfiles(); $this->fixupGroups(); $this->fixupMessages(); } function fixupNotices($max_id, $min_id) { // Do a separate DB connection $sth = $this->dbu->prepare("UPDATE notice SET content = UNHEX(?), rendered = UNHEX(?) WHERE id = ?"); if (PEAR::isError($sth)) { echo "ERROR: " . $sth->getMessage() . "\n"; return; } $sql = 'SELECT id, content, rendered FROM notice ' . 'WHERE LENGTH(content) != CHAR_LENGTH(content) '. 'AND modified < "'.$this->max_date.'" '; if (!empty($max_id)) { $sql .= ' AND id <= ' . $max_id; } if (!empty($min_id)) { $sql .= ' AND id >= ' . $min_id; } $sql .= ' ORDER BY id DESC'; $rn = $this->dbl->query($sql); if (PEAR::isError($rn)) { echo "ERROR: " . $rn->getMessage() . "\n"; return; } echo "Number of rows: " . $rn->numRows() . "\n"; $notice = array(); while (DB_OK == $rn->fetchInto($notice)) { $id = ($notice[0])+0; $content = bin2hex($notice[1]); $rendered = bin2hex($notice[2]); echo "$id..."; $result = $this->dbu->execute($sth, array($content, $rendered, $id)); if (PEAR::isError($result)) { echo "ERROR: " . $result->getMessage() . "\n"; continue; } $cnt = $this->dbu->affectedRows(); if ($cnt != 1) { echo "ERROR: 0 rows affected\n"; continue; } $notice = Notice::staticGet('id', $id); $notice->decache(); $notice->free(); echo "OK\n"; } } function fixupProfiles() { // Do a separate DB connection $sth = $this->dbu->prepare("UPDATE profile SET ". "fullname = UNHEX(?),". "location = UNHEX(?), ". "bio = UNHEX(?) ". "WHERE id = ?"); if (PEAR::isError($sth)) { echo "ERROR: " . $sth->getMessage() . "\n"; return; } $sql = 'SELECT id, fullname, location, bio FROM profile ' . 'WHERE (LENGTH(fullname) != CHAR_LENGTH(fullname) '. 'OR LENGTH(location) != CHAR_LENGTH(location) '. 'OR LENGTH(bio) != CHAR_LENGTH(bio)) '. 'AND modified < "'.$this->max_date.'" '. ' ORDER BY modified DESC'; $rn = $this->dbl->query($sql); if (PEAR::isError($rn)) { echo "ERROR: " . $rn->getMessage() . "\n"; return; } echo "Number of rows: " . $rn->numRows() . "\n"; $profile = array(); while (DB_OK == $rn->fetchInto($profile)) { $id = ($profile[0])+0; $fullname = bin2hex($profile[1]); $location = bin2hex($profile[2]); $bio = bin2hex($profile[3]); echo "$id..."; $result = $this->dbu->execute($sth, array($fullname, $location, $bio, $id)); if (PEAR::isError($result)) { echo "ERROR: " . $result->getMessage() . "\n"; continue; } $cnt = $this->dbu->affectedRows(); if ($cnt != 1) { echo "ERROR: 0 rows affected\n"; continue; } $profile = Profile::staticGet('id', $id); $profile->decache(); $profile->free(); echo "OK\n"; } } function fixupGroups() { // Do a separate DB connection $sth = $this->dbu->prepare("UPDATE user_group SET ". "fullname = UNHEX(?),". "location = UNHEX(?), ". "description = UNHEX(?) ". "WHERE id = ?"); if (PEAR::isError($sth)) { echo "ERROR: " . $sth->getMessage() . "\n"; return; } $sql = 'SELECT id, fullname, location, description FROM user_group ' . 'WHERE LENGTH(fullname) != CHAR_LENGTH(fullname) '. 'OR LENGTH(location) != CHAR_LENGTH(location) '. 'OR LENGTH(description) != CHAR_LENGTH(description) '; 'AND modified < "'.$this->max_date.'" '. 'ORDER BY modified DESC'; $rn = $this->dbl->query($sql); if (PEAR::isError($rn)) { echo "ERROR: " . $rn->getMessage() . "\n"; return; } echo "Number of rows: " . $rn->numRows() . "\n"; $user_group = array(); while (DB_OK == $rn->fetchInto($user_group)) { $id = ($user_group[0])+0; $fullname = bin2hex($user_group[1]); $location = bin2hex($user_group[2]); $description = bin2hex($user_group[3]); echo "$id..."; $result = $this->dbu->execute($sth, array($fullname, $location, $description, $id)); if (PEAR::isError($result)) { echo "ERROR: " . $result->getMessage() . "\n"; continue; } $cnt = $this->dbu->affectedRows(); if ($cnt != 1) { echo "ERROR: 0 rows affected\n"; continue; } $user_group = User_group::staticGet('id', $id); $user_group->decache(); $user_group->free(); echo "OK\n"; } } function fixupMessages() { // Do a separate DB connection $sth = $this->dbu->prepare("UPDATE message SET content = UNHEX(?), rendered = UNHEX(?) WHERE id = ?"); if (PEAR::isError($sth)) { echo "ERROR: " . $sth->getMessage() . "\n"; return; } $sql = 'SELECT id, content, rendered FROM message ' . 'WHERE LENGTH(content) != CHAR_LENGTH(content) '. 'AND modified < "'.$this->max_date.'" '. 'ORDER BY id DESC'; $rn = $this->dbl->query($sql); if (PEAR::isError($rn)) { echo "ERROR: " . $rn->getMessage() . "\n"; return; } echo "Number of rows: " . $rn->numRows() . "\n"; $message = array(); while (DB_OK == $rn->fetchInto($message)) { $id = ($message[0])+0; $content = bin2hex($message[1]); $rendered = bin2hex($message[2]); echo "$id..."; $result = $this->dbu->execute($sth, array($content, $rendered, $id)); if (PEAR::isError($result)) { echo "ERROR: " . $result->getMessage() . "\n"; continue; } $cnt = $this->dbu->affectedRows(); if ($cnt != 1) { echo "ERROR: 0 rows affected\n"; continue; } $message = Message::staticGet('id', $id); $message->decache(); $message->free(); echo "OK\n"; } } } $max_date = (count($args) > 0) ? $args[0] : null; $max_id = (count($args) > 1) ? $args[1] : null; $min_id = (count($args) > 2) ? $args[2] : null; $fixer = new UTF8FixerUpper(array('max_date' => $max_date, 'max_notice' => $max_id, 'min_notice' => $min_id)); $fixer->fixup();