. // }}}

namespace Component\Tag;

use App\Core\Cache;
use App\Core\DB\DB;
use App\Core\Event;
use App\Core\Modules\Component;
use App\Core\Router\Router;
use App\Entity\Language;
use App\Entity\Note;
use App\Entity\NoteTag;
use App\Util\Formatting;
use App\Util\HTML;
use Doctrine\Common\Collections\ExpressionBuilder;
use Doctrine\ORM\Query\Expr;
use Doctrine\ORM\QueryBuilder;

/**
 * Component responsible for extracting tags from posted notes, as well as normalizing them
 *
 * @author    Hugo Sales
 * @copyright 2021 Free Software Foundation, Inc http://www.fsf.org
 * @license   https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later
 */
class Tag extends Component
{
    /** Maximum number of characters kept for a tag, not counting the leading '#' */
    public const MAX_TAG_LENGTH = 64;

    /** Matches a '#'-prefixed tag at the start of the text or after whitespace; group 2 is the tag including '#' */
    public const TAG_REGEX = '/(^|\\s)(#[\\pL\\pN_\\-\\.]{1,64})/u'; // Brion Vibber 2011-02-23 v2:classes/Notice.php:367 function saveTags

    /** Route requirement for a single canonical tag as it appears in URLs */
    public const TAG_SLUG_REGEX = '[A-Za-z0-9]{1,64}';

    /**
     * Register the routes for browsing notes and actors by one or several tags
     *
     * @param mixed $r route loader; only its `connect()` method is used here
     */
    public function onAddRoute($r): bool
    {
        // Several tags are given as a comma separated list of at least two slugs
        $multiple_slugs = '(' . self::TAG_SLUG_REGEX . ',)+' . self::TAG_SLUG_REGEX;

        $r->connect('single_note_tag', '/note-tag/{tag<' . self::TAG_SLUG_REGEX . '>}', [Controller\Tag::class, 'single_note_tag']);
        $r->connect('multiple_note_tags', '/note-tags/{tags<' . $multiple_slugs . '>}', [Controller\Tag::class, 'multi_note_tags']);
        $r->connect('single_actor_tag', '/actor-tag/{tag<' . self::TAG_SLUG_REGEX . '>}', [Controller\Tag::class, 'single_actor_tag']);
        $r->connect('multiple_actor_tags', '/actor-tags/{tags<' . $multiple_slugs . '>}', [Controller\Tag::class, 'multi_actor_tags']);

        return Event::next;
    }

    /**
     * Process note by extracting any tags present
     *
     * Every tag matched by TAG_REGEX is persisted as a NoteTag (raw and canonical form)
     * and the note is pushed onto the `tag-{canonical}` cache list. The database is
     * flushed once, and only if at least one tag was found.
     */
    public function onProcessNoteContent(Note $note, string $content): bool
    {
        $matched_tags = [];
        preg_match_all(self::TAG_REGEX, $content, $matched_tags, \PREG_SET_ORDER);
        if (empty($matched_tags)) {
            return Event::next;
        }

        // The note's locale does not change between tags, so resolve it only once
        $locale = Language::getFromId($note->getLanguageId())->getLocale();

        foreach ($matched_tags as $match) {
            // Drop the '#' before truncating, otherwise a 64 character tag loses its last character
            $tag           = self::tagName($match[2]);
            $canonical_tag = self::canonicalTag($tag, $locale);
            DB::persist(NoteTag::create(['tag' => $tag, 'canonical' => $canonical_tag, 'note_id' => $note->getId()]));
            Cache::pushList("tag-{$canonical_tag}", $note);
        }
        DB::flush();

        return Event::next;
    }

    /**
     * Replace every tag in $text with a link to the page listing notes with that tag
     *
     * @param string      $text     plain text note content, modified in place
     * @param null|string $language passed on to the canonicalisation and added to the link as `lang` when not null
     */
    public function onRenderPlainTextNoteContent(string &$text, ?string $language = null): bool
    {
        $rendered = preg_replace_callback(
            self::TAG_REGEX,
            fn ($m) => $m[1] . self::tagLink($m[2], $language),
            $text,
        );
        // preg_replace_callback returns null on a PCRE error (e.g. malformed UTF-8 with
        // the /u modifier); keep the original text rather than wiping it
        if (!\is_null($rendered)) {
            $text = $rendered;
        }

        return Event::next;
    }

    /**
     * Build the HTML anchor for a tag
     *
     * @param string      $tag      the tag as matched by TAG_REGEX, i.e. including the leading '#'
     * @param null|string $language language used for canonicalisation; added to the URL as `lang` when not null
     */
    private static function tagLink(string $tag, ?string $language): string
    {
        // Truncate the name without its '#', mirroring what onProcessNoteContent stores,
        // so the canonical form in the link is the same as the one persisted
        $tag       = '#' . self::tagName($tag);
        $canonical = self::canonicalTag($tag, $language);

        $route_params = ['tag' => $canonical];
        if (!\is_null($language)) {
            $route_params['lang'] = $language;
        }
        $url = Router::url('single_note_tag', $route_params);

        return HTML::html(['a' => ['attrs' => ['href' => $url, 'title' => $tag, 'rel' => 'tag'], $tag]], options: ['indent' => false]);
    }

    /**
     * Remove '#' from a tag and cut the remaining name to MAX_TAG_LENGTH characters
     */
    private static function tagName(string $tag): string
    {
        return self::ensureLength(str_replace('#', '', $tag));
    }

    /**
     * Cut $tag to at most MAX_TAG_LENGTH characters (multibyte aware)
     */
    public static function ensureLength(string $tag): string
    {
        return mb_substr($tag, 0, self::MAX_TAG_LENGTH);
    }

    /**
     * Convert a tag to its canonical representation, by splitting it
     * into words, stemming it in the given language (if enabled) and
     * sluggifying it (turning it into an ASCII representation)
     *
     * @param string      $tag      the tag, with or without '#'
     * @param null|string $language when null, no stemming is attempted
     */
    public static function canonicalTag(string $tag, ?string $language): string
    {
        $result = '';
        foreach (Formatting::splitWords(str_replace('#', '', $tag)) as $word) {
            $stemmed = null;
            // A stem is only available when a StemWord handler answered with Event::stop
            $was_stemmed = !\is_null($language)
                && Event::handle('StemWord', [$language, $word, &$stemmed]) === Event::stop;
            // Fall back to the plain word if the handler stopped without providing a stem
            $result .= Formatting::slugify($was_stemmed && !\is_null($stemmed) ? $stemmed : $word);
        }
        return self::ensureLength($result);
    }

    /**
     * Populate $note_expr and/or $actor_expr with an expression matching $term against tags
     *
     * $term /^(note|tag|people|actor)/ means we want to match only either a note or an actor
     *
     * Returns Event::stop when the term was restricted to notes or to actors,
     * Event::next when both expressions were populated.
     */
    public function onSearchCreateExpression(ExpressionBuilder $eb, string $term, &$note_expr, &$actor_expr): bool
    {
        $search_term = str_contains($term, ':#') ? explode(':', $term)[1] : $term;
        // Note tags are stored without the leading '#' (see onProcessNoteContent), so
        // comparing against '#foo' could never match
        // NOTE(review): assumes actor tags are stored without '#' as well — confirm
        $search_term = ltrim($search_term, '#');

        $temp_note_expr  = $eb->eq('note_tag.tag', $search_term);
        $temp_actor_expr = $eb->eq('actor_tag.tag', $search_term);

        if (Formatting::startsWith($term, ['note', 'tag'])) {
            $note_expr = $temp_note_expr;
            return Event::stop;
        }
        if (Formatting::startsWith($term, ['people', 'actor'])) {
            $actor_expr = $temp_actor_expr;
            return Event::stop;
        }

        $note_expr  = $temp_note_expr;
        $actor_expr = $temp_actor_expr;
        return Event::next;
    }

    /**
     * Join the tag tables used by the expressions from onSearchCreateExpression
     * (aliases `note_tag` and `actor_tag`) onto the note and actor search queries
     */
    public function onSearchQueryAddJoins(QueryBuilder &$note_qb, QueryBuilder &$actor_qb): bool
    {
        $note_qb->join(NoteTag::class, 'note_tag', Expr\Join::WITH, 'note_tag.note_id = note.id');
        $actor_qb->join('App\Entity\ActorTag', 'actor_tag', Expr\Join::WITH, 'actor_tag.tagger = actor.id');
        return Event::next;
    }
}