fixup_deletions.php 4.49 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166
#!/usr/bin/env php
<?php
/*
 * StatusNet - a distributed open-source microblogging tool
 * Copyright (C) 2010 StatusNet, Inc.
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

define('INSTALLDIR', realpath(dirname(__FILE__) . '/..'));

$longoptions = array('dry-run', 'start=', 'end=');

$helptext = <<<END_OF_USERROLE_HELP
fixup_deletions.php [options]
Finds notices posted by deleted users and cleans them up.
Stray incompletely deleted items cause various fun problems!

     --dry-run  look but don't touch
     --start=N  start looking at profile_id N instead of 1
     --end=N    end looking at profile_id N instead of the max

END_OF_USERROLE_HELP;

require_once INSTALLDIR.'/scripts/commandline.inc';

/**
 * Find the highest profile_id currently listed in the notice table;
 * this field is indexed and should return very quickly.
 *
 * We check notice.profile_id rather than profile.id because we're
 * looking for notices left behind after deletion; if the most recent
 * accounts were deleted, we wouldn't have them from profile.
 *
 * @return int
 * @access private
 */
function get_max_profile_id()
{
    $query = 'SELECT MAX(profile_id) AS id FROM notice';

    $profile = new Profile();
    $profile->query($query);

    if ($profile->fetch()) {
        return intval($profile->id);
    } else {
        die("Something went awry; could not look up max used profile_id.");
    }
}

/**
 * Check for profiles in the given id range that are missing, presumed deleted.
 *
 * @param int $start beginning profile.id, inclusive
 * @param int $end final profile.id, inclusive
 * @return array of integer profile.ids
 * @access private
 */
function get_missing_profiles($start, $end)
{
    $query = sprintf("SELECT id FROM profile WHERE id BETWEEN %d AND %d",
                     $start, $end);

    $profile = new Profile();
    $profile->query($query);

    $all = range($start, $end);
    $known = array();
    while ($row = $profile->fetch()) {
        $known[] = intval($profile->id);
    }
    unset($profile);

    $missing = array_diff($all, $known);
    return $missing;
}

/**
 * Look for stray notices from this profile and, if present, kill them.
 *
 * @param int $profile_id
 * @param bool $dry if true, we won't delete anything
 */
function cleanup_missing_profile($profile_id, $dry)
{
    $notice = new Notice();
    $notice->profile_id = $profile_id;
    $notice->find();
    if ($notice->N == 0) {
        return;
    }

    $s = ($notice->N == 1) ? '' : 's';
    print "Deleted profile $profile_id has $notice->N stray notice$s:\n";

    while ($notice->fetch()) {
        print "  notice $notice->id";
        if ($dry) {
            print " (skipped; dry run)\n";
        } else {
            $victim = clone($notice);
            try {
                $victim->delete();
                print " (deleted)\n";
            } catch (Exception $e) {
                print " FAILED: ";
                print $e->getMessage();
                print "\n";
            }
        }
    }
}

$dry = have_option('dry-run');

$max_profile_id = get_max_profile_id();
$chunk = 1000;

if (have_option('start')) {
    $begin = intval(get_option_value('start'));
} else {
    $begin = 1;
}
if (have_option('end')) {
    $final = min($max_profile_id, intval(get_option_value('end')));
} else {
    $final = $max_profile_id;
}

if ($begin < 1) {
    die("Silly human, you can't begin before profile number 1!\n");
}
if ($final < $begin) {
    die("Silly human, you can't end at $final if it's before $begin!\n");
}

// Identify missing profiles...
for ($start = $begin; $start <= $final; $start += $chunk) {
    $end = min($start + $chunk - 1, $final);

    print "Checking for missing profiles between id $start and $end";
    if ($dry) {
        print " (dry run)";
    }
    print "...\n";
    $missing = get_missing_profiles($start, $end);

    foreach ($missing as $profile_id) {
        cleanup_missing_profile($profile_id, $dry);
    }
}

echo "done.\n";