| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  | <?php | 
					
						
							| 
									
										
										
										
											2021-04-19 18:51:05 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | // {{{ License
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  | // This file is part of GNU social - https://www.gnu.org/software/social
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // GNU social is free software: you can redistribute it and/or modify
 | 
					
						
							|  |  |  | // it under the terms of the GNU Affero General Public License as published by
 | 
					
						
							|  |  |  | // the Free Software Foundation, either version 3 of the License, or
 | 
					
						
							|  |  |  | // (at your option) any later version.
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // GNU social is distributed in the hope that it will be useful,
 | 
					
						
							|  |  |  | // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
					
						
							|  |  |  | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
					
						
							|  |  |  | // GNU Affero General Public License for more details.
 | 
					
						
							|  |  |  | //
 | 
					
						
							|  |  |  | // You should have received a copy of the GNU Affero General Public License
 | 
					
						
							|  |  |  | // along with GNU social.  If not, see <http://www.gnu.org/licenses/>.
 | 
					
						
							| 
									
										
										
										
											2021-04-19 18:51:05 +00:00
										 |  |  | // }}}
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | /** | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |  * OEmbed and OpenGraph implementation for GNU social | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |  * | 
					
						
							|  |  |  |  * @package   GNUsocial | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2021-02-19 10:34:21 +00:00
										 |  |  |  * @author    Mikael Nordfeldth | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |  * @author    Stephen Paul Weber | 
					
						
							|  |  |  |  * @author    hannes | 
					
						
							|  |  |  |  * @author    Mikael Nordfeldth | 
					
						
							| 
									
										
										
										
											2021-02-19 10:34:21 +00:00
										 |  |  |  * @author    Miguel Dantas | 
					
						
							| 
									
										
										
										
											2021-04-19 18:51:05 +00:00
										 |  |  |  * @author    Diogo Peralta Cordeiro <mail@diogo.site> | 
					
						
							|  |  |  |  * @author    Hugo Sales <hugo@hsal.es> | 
					
						
							|  |  |  |  * | 
					
						
							| 
									
										
										
										
											2021-02-19 10:34:21 +00:00
										 |  |  |  * @copyright 2014-2021 Free Software Foundation, Inc http://www.fsf.org | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |  * @license   https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later | 
					
						
							|  |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  | namespace Plugin\Embed; | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
use App\Core\Cache;
use App\Core\DB\DB;
use App\Core\Event;
use App\Core\GSFile;
use App\Core\HTTPClient;
use App\Core\Log;
use App\Core\Modules\Plugin;
use App\Core\Router\RouteLoader;
use App\Core\Router\Router;
use App\Core\Security;
use App\Entity\Attachment;
use App\Entity\AttachmentThumbnail;
use App\Util\Common;
use App\Util\Exception\DuplicateFoundException;
use App\Util\Exception\NotFoundException;
use App\Util\Exception\ServerException;
use App\Util\Formatting;
use App\Util\TemporaryFile;
use Embed\Embed as LibEmbed;
use Exception;
use Symfony\Component\HttpFoundation\Request;
					
						
							| 
									
										
										
										
											2019-07-07 13:26:10 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  | /** | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |  * Base class for the Embed plugin that does most of the heavy lifting to get | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |  * and display representations for remote content. | 
					
						
							|  |  |  |  * | 
					
						
							| 
									
										
										
										
											2021-02-19 10:34:21 +00:00
										 |  |  |  * @copyright 2014-2021 Free Software Foundation, Inc http://www.fsf.org | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |  * @license   https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later | 
					
						
							|  |  |  |  */ | 
					
						
							| 
									
										
										
										
											2021-04-19 18:51:05 +00:00
										 |  |  | class Embed extends Plugin | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     /** | 
					
						
							|  |  |  |      *  Settings which can be set in social.local.yaml | 
					
						
							|  |  |  |      *  WARNING, these are _regexps_ (slashes added later). Always escape your dots and end ('$') your strings | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public $domain_allowlist = [ | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |         // hostname => service provider
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         '.*' => '', // Default to allowing any host
 | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |     ]; | 
					
						
							| 
									
										
										
										
											2019-07-06 16:52:30 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * This code executes when GNU social creates the page routing, and we hook | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |      * on this event to add our action handler for Embed. | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      * | 
					
						
							|  |  |  |      * @param $m URLMapper the router that was initialized. | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * | 
					
						
							| 
									
										
										
										
											2019-07-12 03:13:40 +01:00
										 |  |  |      * @throws Exception | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * | 
					
						
							|  |  |  |      * @return void true if successful, the exception object if it isn't. | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     public function onAddRoute(RouteLoader $m) | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $m->connect('oembed', 'main/oembed', Controller\Embed::class); | 
					
						
							|  |  |  |         $m->connect('embed', 'main/embed', Controller\Embed::class); | 
					
						
							|  |  |  |         return Event::next; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Insert oembed and opengraph tags in all HTML head elements | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function onShowHeadElements(Request $request, array $result) | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $matches = []; | 
					
						
							|  |  |  |         preg_match(',/?([^/]+)/?.*,', $request->getPathInfo(), $matches); | 
					
						
							|  |  |  |         switch ($matches[1]) { | 
					
						
							|  |  |  |         case 'attachment': | 
					
						
							|  |  |  |             $url = "{$matches[1]}/{$matches[2]}"; | 
					
						
							|  |  |  |             break; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-14 23:35:11 +01:00
										 |  |  |         if (isset($url)) { | 
					
						
							|  |  |  |             foreach (['xml', 'json'] as $format) { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 $result[] = [ | 
					
						
							|  |  |  |                     'link' => [ | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |                         'rel'   => 'alternate', | 
					
						
							|  |  |  |                         'type'  => "application/{$format}+oembed", | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                         'href'  => Router::url('embed', ['format' => $format, 'url' => $url]), | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |                         'title' => 'oEmbed', | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                     ], ]; | 
					
						
							| 
									
										
										
										
											2019-07-14 23:35:11 +01:00
										 |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         return Event::next; | 
					
						
							| 
									
										
										
										
											2016-03-17 00:31:45 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * Save embedding information for an Attachment, if applicable. | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |      * | 
					
						
							|  |  |  |      * Normally this event is called through File::saveNew() | 
					
						
							|  |  |  |      * | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * @param Attachment $attachment The newly inserted Attachment object. | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |      * | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * @return bool success | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     public function onAttachmentStoreNew(Attachment $attachment) | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         try { | 
					
						
							|  |  |  |             DB::findOneBy('attachment_embed', ['attachment_id' => $attachment->getId()]); | 
					
						
							|  |  |  |         } catch (NotFoundException) { | 
					
						
							|  |  |  |         } catch (DuplicateFoundException) { | 
					
						
							|  |  |  |             Log::warning("Strangely, an attachment_embed object exists for new file {$attachment->getID()}"); | 
					
						
							|  |  |  |             return Event::next; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         if (!is_null($attachment->getRemoteUrl()) || (!is_null($mimetype = $attachment->getMimetype()) && (('text/html' === substr($mimetype, 0, 9) || 'application/xhtml+xml' === substr($mimetype, 0, 21))))) { | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |             try { | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |                 $embed_data                  = $this->getEmbed($attachment->getRemoteUrl(), $attachment); | 
					
						
							|  |  |  |                 $embed_data['attachment_id'] = $attachment->getId(); | 
					
						
							|  |  |  |                 DB::persist(Entity\AttachmentEmbed::create($embed_data)); | 
					
						
							|  |  |  |                 DB::flush(); | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |             } catch (Exception $e) { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 Log::warning($e); | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |                 return Event::next; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         return Event::next; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Replace enclosure representation of an attachment with the data from embed | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * @param mixed $enclosure | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function onFileEnclosureMetadata(Attachment $attachment, &$enclosure) | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     { | 
					
						
							|  |  |  |         // Never treat generic HTML links as an enclosure type!
 | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |         // But if we have embed info, we'll consider it golden.
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         try { | 
					
						
							|  |  |  |             $embed = DB::findOneBy('attachment_embed', ['attachment_id' => $attachment->getId()]); | 
					
						
							|  |  |  |         } catch (NotFoundException) { | 
					
						
							|  |  |  |             return Event::next; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-07-14 23:35:11 +01:00
										 |  |  |         foreach (['mimetype', 'url', 'title', 'modified', 'width', 'height'] as $key) { | 
					
						
							| 
									
										
										
										
											2019-07-06 04:31:02 +01:00
										 |  |  |             if (isset($embed->{$key}) && !empty($embed->{$key})) { | 
					
						
							|  |  |  |                 $enclosure->{$key} = $embed->{$key}; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return true; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2016-03-17 00:31:45 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |     /** Placeholder */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     public function onShowAttachment(Attachment $attachment, array &$res) | 
					
						
							| 
									
										
										
										
											2016-03-17 00:31:45 +01:00
										 |  |  |     { | 
					
						
							|  |  |  |         try { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |             $embed = Cache::get('attachment-embed-' . $attachment->getId(), | 
					
						
							|  |  |  |                                 fn () => DB::findOneBy('attachment_embed', ['attachment_id' => $attachment->getId()])); | 
					
						
							|  |  |  |         } catch (DuplicateFoundException $e) { | 
					
						
							|  |  |  |             Log::waring($e); | 
					
						
							|  |  |  |             return Event::next; | 
					
						
							|  |  |  |         } catch (NotFoundException) { | 
					
						
							|  |  |  |             return Event::next; | 
					
						
							| 
									
										
										
										
											2016-03-17 00:31:45 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         if (is_null($embed) && empty($embed->getAuthorName()) && empty($embed->getProvider())) { | 
					
						
							|  |  |  |             return Event::next; | 
					
						
							| 
									
										
										
										
											2016-03-22 14:02:36 +01:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $thumbnail  = AttachmentThumbnail::getOrCreate(attachment: $attachment, width: $width, height: $height, crop: $smart_crop); | 
					
						
							|  |  |  |         $attributes = $thumbnail->getHTMLAttributes(['class' => 'u-photo embed']); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $res[] = Formatting::twigRender(<<<END | 
					
						
							|  |  |  | <article class="h-entry embed"> | 
					
						
							|  |  |  |     <header> | 
					
						
							|  |  |  |         <img class="u-photo embed" width="{{attributes['width']}}" height="{{attributes['height']}}" src="{{attributes['src']}}" /> | 
					
						
							|  |  |  |         <h5 class="p-name embed"> | 
					
						
							|  |  |  |              <a class="u-url" href="{{attachment.getUrl()}}">{{embed.getTitle() | escape}}</a> | 
					
						
							|  |  |  |         </h5> | 
					
						
							|  |  |  |         <div class="p-author embed"> | 
					
						
							|  |  |  |              {% if embed.getAuthorName() is not null %} | 
					
						
							|  |  |  |                   <div class="fn vcard author"> | 
					
						
							|  |  |  |                       {% if embed.getAuthorUrl() is null %} | 
					
						
							|  |  |  |                            <p>{{embed.getAuthorName()}}</p> | 
					
						
							|  |  |  |                       {% else %} | 
					
						
							|  |  |  |                            <a href="{{embed.getAuthorUrl()}}" class="url">{{embed.getAuthorName()}}</a> | 
					
						
							|  |  |  |                       {% endif %} | 
					
						
							|  |  |  |                   </div> | 
					
						
							|  |  |  |              {% endif %} | 
					
						
							|  |  |  |              {% if embed.getProvider() is not null %} | 
					
						
							|  |  |  |                   <div class="fn vcard"> | 
					
						
							|  |  |  |                       {% if embed.getProviderUrl() is null %} | 
					
						
							|  |  |  |                           <p>{{embed.getProvider()}}</p> | 
					
						
							|  |  |  |                       {% else %} | 
					
						
							|  |  |  |                           <a href="{{embed.getProviderUrl()}}" class="url">{{embed.getProvider()}}</a> | 
					
						
							|  |  |  |                       {% endif %} | 
					
						
							|  |  |  |                   </div> | 
					
						
							|  |  |  |              {% endif %} | 
					
						
							|  |  |  |         </div> | 
					
						
							|  |  |  |     </header> | 
					
						
							|  |  |  |     <div class="p-summary embed"> | 
					
						
							|  |  |  |         {{ embed.getHtml() | escape }} | 
					
						
							|  |  |  |     </div> | 
					
						
							|  |  |  | </article> | 
					
						
							|  |  |  | END, ['embed' => $embed, 'thumbnail' => $thumbnail, 'attributes' => $attributes]); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return Event::stop; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * @throws ServerException if check is made but fails | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * @return bool false on no check made, provider name on success | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     protected function checkAllowlist(string $url) | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         if ($this->check_allowlist ?? false) { | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |             return false;   // indicates "no check made"
 | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $host = parse_url($url, PHP_URL_HOST); | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         foreach ($this->domain_allowlist as $regex => $provider) { | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |             if (preg_match("/{$regex}/", $host)) { | 
					
						
							| 
									
										
										
										
											2015-01-25 11:18:57 +01:00
										 |  |  |                 return $provider;    // we trust this source, return provider name
 | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         throw new ServerException(_m('Domain not in remote thumbnail source allowlist: {host}', ['host' => $host])); | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Check the file size of a remote file using a HEAD request and checking | 
					
						
							|  |  |  |      * the content-length variable returned.  This isn't 100% foolproof but is | 
					
						
							|  |  |  |      * reliable enough for our purposes. | 
					
						
							|  |  |  |      * | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * @param string $url | 
					
						
							|  |  |  |      * @param array  $headers - if we already made a request | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * | 
					
						
							|  |  |  |      * @return bool|string the file size if it succeeds, false otherwise. | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     private function getRemoteFileSize(string $url, ?array $headers = null): ?int | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |         try { | 
					
						
							| 
									
										
										
										
											2019-07-14 23:35:11 +01:00
										 |  |  |             if ($headers === null) { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 if (!Common::isValidHttpUrl($url)) { | 
					
						
							|  |  |  |                     Log::error('Invalid URL in Embed::getRemoteFileSize()'); | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |                     return false; | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 $head    = HTTPClient::head($url); | 
					
						
							|  |  |  |                 $headers = $head->getHeaders(); | 
					
						
							| 
									
										
										
										
											2019-07-14 23:56:31 +01:00
										 |  |  |                 $headers = array_change_key_case($headers, CASE_LOWER); | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |             } | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |             return $headers['content-length'][0] ?? false; | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         } catch (Exception $e) { | 
					
						
							|  |  |  |             Loog::error($e); | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |             return false; | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * A private helper function that uses a HEAD request to check the mime type | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      * of a remote URL to see it it's an image. | 
					
						
							|  |  |  |      * | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * @param mixed      $url | 
					
						
							|  |  |  |      * @param null|mixed $headers | 
					
						
							|  |  |  |      * | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      * @return bool true if the remote URL is an image, or false otherwise. | 
					
						
							|  |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     private function isRemoteImage(string $url, ?array $headers = null): ?int | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         try { | 
					
						
							|  |  |  |             if ($headers === null) { | 
					
						
							|  |  |  |                 if (!Common::isValidHttpUrl($url)) { | 
					
						
							|  |  |  |                     Log::error('Invalid URL in Embed::getRemoteFileSize()'); | 
					
						
							|  |  |  |                     return false; | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |                 $head    = HTTPClient::head($url); | 
					
						
							|  |  |  |                 $headers = $head->getHeaders(); | 
					
						
							|  |  |  |                 $headers = array_change_key_case($headers, CASE_LOWER); | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |             } | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |             return !empty($headers['content-type']) && GSFile::mimetypeMajor($headers['content-type'][0]) === 'image'; | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         } catch (Exception $e) { | 
					
						
							|  |  |  |             Loog::error($e); | 
					
						
							|  |  |  |             return false; | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * Validate that $imgData is a valid image, place it in it's folder and resize | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      * | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |      * @param $imgData - The image data to validate | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |      * @param null|string $url     - The url where the image came from, to fetch metadata | 
					
						
							|  |  |  |      * @param null|array  $headers - The headers possible previous request to $url | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |     protected function validateAndWriteImage($imgData, string $url, array $headers): array | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $file = new TemporaryFile(); | 
					
						
							|  |  |  |         $file->write($imgData); | 
					
						
							| 
									
										
										
										
											2016-02-25 22:31:45 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         $mimetype = $headers['content-type'][0]; | 
					
						
							|  |  |  |         Event::handle('AttachmentValidation', [&$file, &$mimetype]); | 
					
						
							| 
									
										
										
										
											2019-07-23 11:07:47 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         Event::handle('HashFile', [$file->getPathname(), &$hash]); | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $filename = Common::config('attachments', 'dir') . "embed/{$hash}"; | 
					
						
							|  |  |  |         $file->commit($filename); | 
					
						
							|  |  |  |         unset($file); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         if (array_key_exists('content-disposition', $headers) && preg_match('/^.+; filename="(.+?)"$/', $headers['content-disposition'][0], $matches) === 1) { | 
					
						
							|  |  |  |             $original_name = $matches[1]; | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $info   = getimagesize($filename); | 
					
						
							|  |  |  |         $width  = $info[0]; | 
					
						
							|  |  |  |         $height = $info[1]; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return [$filename, $width, $height, $original_name ?? null, $mimetype]; | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |      * Create and store a thumbnail representation of a remote image | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |     protected function storeRemoteThumbnail(Attachment $attachment): array | bool | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         if ($attachment->haveFilename() && file_exists($attachment->getPath())) { | 
					
						
							|  |  |  |             throw new AlreadyFulfilledException(_m('A thumbnail seems to already exist for remote file with id=={id}', ['id' => $attachment->getId()])); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $url = $attachment->getRemoteUrl(); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if (substr($url, 0, 7) == 'file://') { | 
					
						
							|  |  |  |             $filename = substr($url, 7); | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |             $info     = getimagesize($filename); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |             $filename = basename($filename); | 
					
						
							| 
									
										
										
										
											2021-04-14 15:27:37 +00:00
										 |  |  |             $width    = $info[0]; | 
					
						
							|  |  |  |             $height   = $info[1]; | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |         } else { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |             $this->checkAllowlist($url); | 
					
						
							|  |  |  |             $head    = HTTPClient::head($url); | 
					
						
							|  |  |  |             $headers = $head->getHeaders(); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |             $headers = array_change_key_case($headers, CASE_LOWER); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             try { | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |                 $is_image = $this->isRemoteImage($url, $headers); | 
					
						
							|  |  |  |                 if ($is_image == true) { | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |                     $file_size = $this->getRemoteFileSize($url, $headers); | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                     $max_size  = Common::config('attachments', 'file_quota'); | 
					
						
							|  |  |  |                     if (($file_size != false) && ($file_size > $max_size)) { | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |                         throw new \Exception("Wanted to store remote thumbnail of size {$file_size} but the upload limit is {$max_size} so we aborted."); | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |                     } | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 } else { | 
					
						
							|  |  |  |                     return false; | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |                 } | 
					
						
							|  |  |  |             } catch (Exception $err) { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 Log::debug('Could not determine size of remote image, aborted local storage.'); | 
					
						
							| 
									
										
										
										
											2021-02-16 18:30:21 +00:00
										 |  |  |                 throw $err; | 
					
						
							| 
									
										
										
										
											2019-08-19 01:40:31 +01:00
										 |  |  |             } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             // First we download the file to memory and test whether it's actually an image file
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |             Log::debug('Downloading remote thumbnail for file id==' . $attachment->getId() . " with thumbnail URL: {$url}"); | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |             try { | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |                 $imgData = HTTPClient::get($url)->getContent(); | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 if (isset($imgData)) { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                     [$filename, $width, $height, $original_name, $mimetype] = $this->validateAndWriteImage($imgData, $url, $headers); | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 } else { | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                     throw new UnsupportedMediaException(_m('HTTPClient returned an empty result')); | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 } | 
					
						
							| 
									
										
										
										
											2019-11-01 14:19:42 +03:00
										 |  |  |             } catch (UnsupportedMediaException $e) { | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 // Couldn't find anything that looks like an image, nothing to do
 | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |                 Log::debug($e); | 
					
						
							| 
									
										
										
										
											2019-09-02 16:31:32 +01:00
										 |  |  |                 return false; | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2018-07-18 05:31:24 +01:00
										 |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         DB::persist(AttachmentThumbnail::create(['attachment_id' => $attachment->getId(), 'width' => $width, 'height' => $height])); | 
					
						
							| 
									
										
										
										
											2021-04-25 21:23:46 +00:00
										 |  |  |         $attachment->setFilename($filename); | 
					
						
							|  |  |  |         DB::flush(); | 
					
						
							| 
									
										
										
										
											2015-01-25 02:34:40 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-04-27 20:56:50 +00:00
										 |  |  |         return [$filename, $width, $height, $original_name, $mimetype]; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Perform an oEmbed or OpenGraph lookup for the given $url. | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * Some known hosts are allowlisted with API endpoints where we | 
					
						
							|  |  |  |      * know they exist but autodiscovery data isn't available. | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * Throws exceptions on failure. | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * @param string $url | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * @throws EmbedHelper_BadHtmlException | 
					
						
							|  |  |  |      * @throws HTTP_Request2_Exception | 
					
						
							|  |  |  |      * | 
					
						
							|  |  |  |      * @return object | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function getEmbed(string $url, Attachment $attachment): array | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         Log::info('Checking for remote URL metadata for ' . $url); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         try { | 
					
						
							|  |  |  |             Log::info("Trying to find Embed data for {$url} with 'oscarotero/Embed'"); | 
					
						
							|  |  |  |             $embed                     = new LibEmbed(); | 
					
						
							|  |  |  |             $info                      = $embed->get($url); | 
					
						
							|  |  |  |             $metadata['title']         = $info->title; | 
					
						
							|  |  |  |             $metadata['html']          = Security::sanitize($info->description); | 
					
						
							|  |  |  |             $metadata['url']           = $info->url; | 
					
						
							|  |  |  |             $metadata['author_name']   = $info->authorName; | 
					
						
							|  |  |  |             $metadata['author_url']    = $info->authorUrl; | 
					
						
							|  |  |  |             $metadata['provider_name'] = $info->providerName; | 
					
						
							|  |  |  |             $metadata['provider_url']  = $info->providerUrl; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             if (!is_null($info->image)) { | 
					
						
							|  |  |  |                 if (substr($info->image, 0, 4) === 'data') { | 
					
						
							|  |  |  |                     // Inline image
 | 
					
						
							|  |  |  |                     $imgData                                                = base64_decode(substr($info->image, stripos($info->image, 'base64,') + 7)); | 
					
						
							|  |  |  |                     [$filename, $width, $height, $original_name, $mimetype] = $this->validateAndWriteImage($imgData); | 
					
						
							|  |  |  |                 } else { | 
					
						
							|  |  |  |                     $attachment->setRemoteUrl((string) $info->image); | 
					
						
							|  |  |  |                     [$filename, $width, $height, $original_name, $mimetype] = $this->storeRemoteThumbnail($attachment); | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |                 $metadata['width']    = $height; | 
					
						
							|  |  |  |                 $metadata['height']   = $width; | 
					
						
							|  |  |  |                 $metadata['mimetype'] = $mimetype; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } catch (Exception $e) { | 
					
						
							|  |  |  |             Log::info("Failed to find Embed data for {$url} with 'oscarotero/Embed', got exception: " . get_class($e)); | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $metadata = self::normalize($metadata); | 
					
						
							|  |  |  |         $attachment->setTitle($metadata['title']); | 
					
						
							|  |  |  |         return $metadata; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Normalize fetched info. | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public static function normalize(array $data): array | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         if (isset($metadata['url'])) { | 
					
						
							|  |  |  |             // sometimes sites serve the path, not the full URL, for images
 | 
					
						
							|  |  |  |             // let's "be liberal in what you accept from others"!
 | 
					
						
							|  |  |  |             // add protocol and host if the thumbnail_url starts with /
 | 
					
						
							|  |  |  |             if ($metadata['url'][0] == '/') { | 
					
						
							|  |  |  |                 $thumbnail_url_parsed = parse_url($metadata['url']); | 
					
						
							|  |  |  |                 $metadata['url']      = "{$thumbnail_url_parsed['scheme']}://{$thumbnail_url_parsed['host']}{$metadata['url']}"; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             // Some wordpress opengraph implementations sometimes return a white blank image
 | 
					
						
							|  |  |  |             // no need for us to save that!
 | 
					
						
							|  |  |  |             if ($metadata['url'] == 'https://s0.wp.com/i/blank.jpg') { | 
					
						
							|  |  |  |                 $metadata['url'] = null; | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             if (!isset($data['width'])) { | 
					
						
							|  |  |  |                 $data['width']  = Common::config('thumbnail', 'width'); | 
					
						
							|  |  |  |                 $data['height'] = Common::config('thumbnail', 'height'); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return $data; | 
					
						
							| 
									
										
										
										
											2014-05-06 23:00:30 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | } |