| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  | #!/usr/bin/env php
 | 
					
						
							|  |  |  | <?php | 
					
						
							|  |  |  | // This file is part of GNU social - https://www.gnu.org/software/social
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // GNU social is free software: you can redistribute it and/or modify
 | 
					
						
							|  |  |  | // it under the terms of the GNU Affero General Public License as published by
 | 
					
						
							|  |  |  | // the Free Software Foundation, either version 3 of the License, or
 | 
					
						
							|  |  |  | // (at your option) any later version.
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // GNU social is distributed in the hope that it will be useful,
 | 
					
						
							|  |  |  | // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
					
						
							|  |  |  | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
					
						
							|  |  |  | // GNU Affero General Public License for more details.
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // You should have received a copy of the GNU Affero General Public License
 | 
					
						
							|  |  |  | // along with GNU social.  If not, see <http://www.gnu.org/licenses/>.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							|  |  |  |  * Script that removes duplicated profiles inter and intra | 
					
						
							|  |  |  |  * federation protocols. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * @package   GNUsocial | 
					
						
							|  |  |  |  * @copyright 2020 Free Software Foundation, Inc http://www.fsf.org | 
					
						
							|  |  |  |  * @license   https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | define('INSTALLDIR', dirname(__DIR__, 3)); | 
					
						
							|  |  |  | define('PUBLICDIR', INSTALLDIR . DIRECTORY_SEPARATOR . 'public'); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | $longoptions = []; | 
					
						
							|  |  |  | $shortoptions = ''; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | $helptext = <<<END_OF_HELP | 
					
						
							|  |  |  | fix_duplicates.php [options] | 
					
						
							|  |  |  | remove duplicated profiles inter and intra federation protocols | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | END_OF_HELP; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | require_once INSTALLDIR . '/scripts/commandline.inc'; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							|  |  |  |  * Remote profiles are inspected from the most to the least | 
					
						
							| 
									
										
										
										
											2020-08-04 12:38:51 +01:00
										 |  |  |  * preferred according to the protocols they belong and age. | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  |  * Invariants: | 
					
						
							| 
									
										
										
										
											2020-08-04 12:38:51 +01:00
										 |  |  |  *  - `seen_local` array:  The most recent profile inside of a certain protocol are kept | 
					
						
							|  |  |  |  *  - global `seen` array:  The most relevant profile (if there were duplicates, the first protocol of the list is the one to have its profile maintained) are kept | 
					
						
							|  |  |  |  * These two variables make it easy to satisfy a policy of maintaining | 
					
						
							|  |  |  |  * only the profiles that are either the most relevant or the newest | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |  * ones intra-protocol wise. | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  | function run(): void | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  |     $protocols = common_config('TheFreeNetworkModule', 'protocols'); | 
					
						
							|  |  |  |     $seen = []; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     foreach ($protocols as $protocol => $profile_class) { | 
					
						
							|  |  |  |         fix_duplicates($profile_class, $seen); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | function fix_duplicates(string $profile_class, array &$seen): void | 
					
						
							|  |  |  | { | 
					
						
							| 
									
										
										
										
											2020-08-04 12:38:51 +01:00
										 |  |  |     $protocol_profile = new $profile_class(); | 
					
						
							|  |  |  |     $protocol_profile->selectAdd(); | 
					
						
							|  |  |  |     $protocol_profile->selectAdd('profile_id'); | 
					
						
							|  |  |  |     $protocol_profile->selectAdd('uri'); | 
					
						
							|  |  |  |     $protocol_profile->whereAdd('profile_id IS NOT NULL'); // ignore groups
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (!$protocol_profile->find()) { | 
					
						
							|  |  |  |         // This protocol wasn't used apparently
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |         return; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     $seen_local = []; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-04 12:38:51 +01:00
										 |  |  |     while ($protocol_profile->fetch()) { | 
					
						
							|  |  |  |         $id  = $protocol_profile->profile_id; | 
					
						
							|  |  |  |         $uri = $protocol_profile->uri; | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  |         // Have we seen this profile before?
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |         if (array_key_exists($uri, $seen)) { | 
					
						
							| 
									
										
										
										
											2020-08-04 13:03:33 +01:00
										 |  |  |             try { | 
					
						
							|  |  |  |                 // Was it on a previous protocol? Keep the highest preference protocol's one
 | 
					
						
							|  |  |  |                 if ($seen[$uri] !== $id) { | 
					
						
							|  |  |  |                     printfnq("Deleting Profile with id = {$id}\n"); | 
					
						
							|  |  |  |                     $profile = Profile::getByID($id); | 
					
						
							|  |  |  |                     $profile->delete(); | 
					
						
							|  |  |  |                 } else { | 
					
						
							|  |  |  |                     printfnq("Deleting {$profile_class} with id = {$id}\n"); | 
					
						
							|  |  |  |                     $protocol_profile->delete(); | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } catch (Exception $e) { | 
					
						
							|  |  |  |                 // Let it go
 | 
					
						
							|  |  |  |                 printfnq('FWIW: ' . $e->getMessage() . "\n"); | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |             } | 
					
						
							|  |  |  |         } elseif (array_key_exists($uri, $seen_local)) { | 
					
						
							| 
									
										
										
										
											2020-08-04 13:03:33 +01:00
										 |  |  |             try { | 
					
						
							|  |  |  |                 // Was it in this protocol? Delete the older record.
 | 
					
						
							|  |  |  |                 if ($seen_local[$uri] !== $id) { | 
					
						
							|  |  |  |                     printfnq("Deleting Profile with id = {$seen_local[$uri]}\n"); | 
					
						
							|  |  |  |                     $profile = Profile::getByID($seen_local[$uri]); | 
					
						
							|  |  |  |                     $profile->delete(); | 
					
						
							|  |  |  |                 } else { | 
					
						
							|  |  |  |                     printfnq("Deleting {$profile_class} with id = {$seen_local[$uri]}\n"); | 
					
						
							|  |  |  |                     $profile = $profile_class::getKV('profile_id', $seen_local[$uri]); | 
					
						
							|  |  |  |                     $profile->delete(); | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } catch (Exception $e) { | 
					
						
							|  |  |  |                 // Let it go
 | 
					
						
							|  |  |  |                 printfnq('FWIW: ' . $e->getMessage() . "\n"); | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |             } | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  |             // Update the profile id for this URI.
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |             $seen_local[$uri] = $id; | 
					
						
							|  |  |  |         } else { | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  |             // It's the first time we see this profile _inside_ this protocol!
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |             $seen_local[$uri] = $id; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2020-08-04 13:03:33 +01:00
										 |  |  |     $protocol_profile->free(); | 
					
						
							|  |  |  |     unset($protocol_profile); | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:10:11 +01:00
										 |  |  |     // Merge the findings inside this protocol with the global seen to be used on the next protocol of the list.
 | 
					
						
							| 
									
										
										
										
											2020-08-04 05:02:06 +01:00
										 |  |  |     $seen = array_merge($seen, $seen_local); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
// Script entry point: start the clean-up over the configured protocols.
run();