#!/usr/bin/env php
<?php
// This file is part of GNU social - https://www.gnu.org/software/social
//
// GNU social is free software: you can redistribute it and/or modify
// it under the terms of the GNU Affero General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// GNU social is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Affero General Public License for more details.
//
// You should have received a copy of the GNU Affero General Public License
// along with GNU social. If not, see <http://www.gnu.org/licenses/>.

/**
 * Script that removes duplicated profiles inter and intra
 * federation protocols.
 *
 * @package GNUsocial
 * @copyright 2020 Free Software Foundation, Inc http://www.fsf.org
 * @license https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later
 */

// Installation root: three directory levels above the directory holding
// this script. PUBLICDIR is the `public` directory directly beneath it.
define('INSTALLDIR', dirname(__DIR__, 3));
define('PUBLICDIR', INSTALLDIR . DIRECTORY_SEPARATOR . 'public');

// This script declares no command line options of its own.
// NOTE(review): these variables and $helptext are presumably read by
// commandline.inc when it parses the arguments - confirm there.
$longoptions = [];
$shortoptions = '';

$helptext = <<<END_OF_HELP
fix_duplicates.php [options]
remove duplicated profiles inter and intra federation protocols

END_OF_HELP;

// Must come after the definitions above, which it depends on.
require_once INSTALLDIR . '/scripts/commandline.inc';
|
|
|
|
|
|
|
|
/**
 * Remote profiles are inspected from the most to the least
 * preferred according to the protocols they belong to and their age.
 * Invariants:
 * - `seen_local` array: the most recent profile inside a given protocol is kept
 * - global `seen` array: the most relevant profile is kept (if there are duplicates, the profile of the first protocol of the list is the one maintained)
 * These two variables make it easy to satisfy a policy of maintaining
 * only the profiles that are either the most relevant or the newest
 * ones intra-protocol wise.
 */
|
2020-08-04 05:10:11 +01:00
|
|
|
|
2020-08-04 05:02:06 +01:00
|
|
|
/**
 * Runs the de-duplication over every configured federation protocol.
 *
 * The protocol list is read from the `TheFreeNetworkModule` / `protocols`
 * configuration entry and walked in its configured order. A single `$seen`
 * map is shared by reference across all calls to fix_duplicates(), so each
 * protocol can tell which URIs were already claimed by an earlier one.
 *
 * @return void
 */
function run(): void
{
    $protocols = common_config('TheFreeNetworkModule', 'protocols');

    // NOTE(review): common_config() presumably yields a non-array value when
    // the entry is missing - confirm. Iterating such a value would only raise
    // a warning, so report it and stop instead.
    if (!is_iterable($protocols)) {
        printfnq("No federation protocols are configured, nothing to do\n");
        return;
    }

    // URI => profile id of the records kept so far, across protocols.
    $seen = [];

    // Only the profile class names are needed; the protocol keys are unused.
    foreach ($protocols as $profile_class) {
        fix_duplicates($profile_class, $seen);
    }
}
|
|
|
|
|
|
|
|
/**
 * Removes the duplicated remote profiles of a single federation protocol.
 *
 * Every row of $profile_class that has a profile id is visited once and its
 * URI is checked against two maps:
 *  - $seen, holding URI => profile id for the records kept by the protocols
 *    processed before this one. On a hit this protocol's copy is removed:
 *    the whole Profile when the ids differ, otherwise only the protocol row.
 *  - a local map of the URIs met during this call. On a hit the previously
 *    met record is removed and the current row takes its place.
 * Failures while deleting are reported and skipped, so a single broken
 * record does not stop the run.
 *
 * @param string $profile_class Name of the protocol profile class; it is
 *                              instantiated and queried for `profile_id`
 *                              and `uri`.
 * @param array  $seen          URI => profile id map shared between calls;
 *                              the URIs first met in this call are added to
 *                              it before returning.
 *
 * @return void
 */
function fix_duplicates(string $profile_class, array &$seen): void
{
    $protocol_profile = new $profile_class();
    // NOTE(review): the argument-less selectAdd() presumably clears the
    // default column list so only the two columns below are fetched - confirm.
    $protocol_profile->selectAdd();
    $protocol_profile->selectAdd('profile_id');
    $protocol_profile->selectAdd('uri');
    $protocol_profile->whereAdd('profile_id IS NOT NULL'); // ignore groups

    if (!$protocol_profile->find()) {
        // This protocol wasn't used apparently
        return;
    }

    $seen_local = [];

    while ($protocol_profile->fetch()) {
        $id = $protocol_profile->profile_id;
        $uri = $protocol_profile->uri;

        // Have we seen this profile before?
        if (array_key_exists($uri, $seen)) {
            try {
                // Was it on a previous protocol? Keep the highest preference protocol's one
                if ($seen[$uri] !== $id) {
                    printfnq("Deleting Profile with id = {$id}\n");
                    $profile = Profile::getByID($id);
                    $profile->delete();
                } else {
                    printfnq("Deleting {$profile_class} with id = {$id}\n");
                    $protocol_profile->delete();
                }
            } catch (Exception $e) {
                // Let it go
                printfnq('FWIW: ' . $e->getMessage() . "\n");
            }
        } elseif (array_key_exists($uri, $seen_local)) {
            $previous_id = $seen_local[$uri];

            try {
                // Was it in this protocol? Delete the older record.
                if ($previous_id !== $id) {
                    printfnq("Deleting Profile with id = {$previous_id}\n");
                    $profile = Profile::getByID($previous_id);
                    $profile->delete();
                } else {
                    printfnq("Deleting {$profile_class} with id = {$previous_id}\n");
                    $profile = $profile_class::getKV('profile_id', $previous_id);
                    // NOTE(review): getKV() presumably returns a non-object
                    // when nothing matches - confirm. Calling delete() on
                    // that raises an Error, which the Exception catch below
                    // would not intercept, aborting the whole run.
                    if (is_object($profile)) {
                        $profile->delete();
                    } else {
                        printfnq("FWIW: no {$profile_class} found for profile id = {$previous_id}\n");
                    }
                }
            } catch (Exception $e) {
                // Let it go
                printfnq('FWIW: ' . $e->getMessage() . "\n");
            }

            // Update the profile id for this URI.
            $seen_local[$uri] = $id;
        } else {
            // It's the first time we see this profile _inside_ this protocol!
            $seen_local[$uri] = $id;
        }
    }

    $protocol_profile->free();
    unset($protocol_profile);

    // Merge the findings inside this protocol with the global seen to be used
    // on the next protocol of the list. A URI only enters $seen_local when it
    // is absent from $seen, so the key sets are disjoint and the array union
    // is a plain merge; unlike array_merge() it never renumbers keys that
    // PHP stores as integers.
    $seen += $seen_local;
}
|
|
|
|
|
|
|
|
// Start the de-duplication pass now that the functions above are defined.
run();
|