friendica-github/src/Model/Tag.php

844 lines
24 KiB
PHP
Raw Normal View History

2020-04-15 16:37:09 +00:00
<?php
/**
 * @copyright Copyright (C) 2010-2023, the Friendica project
 *
 * @license GNU AGPL version 3 or any later version
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as
 * published by the Free Software Foundation, either version 3 of the
 * License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <https://www.gnu.org/licenses/>.
 *
 */
namespace Friendica\Model;
use Friendica\Content\Text\BBCode;
use Friendica\Core\Cache\Enum\Duration;
2020-04-15 16:37:09 +00:00
use Friendica\Core\Logger;
use Friendica\Core\Protocol;
2020-11-19 19:34:48 +00:00
use Friendica\Database\Database;
2020-04-15 16:37:09 +00:00
use Friendica\Database\DBA;
2020-04-26 15:24:58 +00:00
use Friendica\DI;
use Friendica\Protocol\ActivityPub;
use Friendica\Util\DateTimeFormat;
2023-11-09 06:43:03 +00:00
use Friendica\Util\HTTPSignature;
use Friendica\Util\Strings;
/**
 * Class Tag
 *
 * This Model class handles tag table interactions.
 * This table stores relevant tags related to posts, like hashtags and mentions.
 */
class Tag
{
// Tag types. UNKNOWN is what getTypeForHash() returns for an unrecognised prefix character.
const UNKNOWN = 0;
const HASHTAG = 1;
const MENTION = 2;

/**
 * An implicit mention is a mention in a comment body that is redundant with the threading information.
 */
const IMPLICIT_MENTION = 8;

/**
 * An exclusive mention transmits the post only to the target account without transmitting it to the followers, usually a group.
 */
const EXCLUSIVE_MENTION = 9;

// Receiver-style tag types; store() only accepts these together with a URL.
// NOTE(review): the names look like ActivityPub addressing fields - confirm against the callers.
const TO = 10;
const CC = 11;
const BTO = 12;
const BCC = 13;
const AUDIENCE = 14;
const ATTRIBUTED = 15;

// NOTE(review): not referenced inside this class; presumably interaction permissions - confirm against the callers.
const CAN_ANNOUNCE = 20;
const CAN_LIKE = 21;
const CAN_REPLY = 22;

// Target types of a tag URL, as detected by getTargetType()
const ACCOUNT = 1;
const GENERAL_COLLECTION = 2;
const FOLLOWER_COLLECTION = 3;
const PUBLIC_COLLECTION = 4;

/**
 * Prefix character of every tag type that has a textual representation
 */
const TAG_CHARACTER = [
	self::HASHTAG => '#',
	self::MENTION => '@',
	self::EXCLUSIVE_MENTION => '!',
	self::IMPLICIT_MENTION => '%',
];
/**
 * Store tag/mention elements
 *
 * Hashtag names are trimmed of leading and trailing non-word characters and are
 * split at the hashtag character, so that "a#b" is stored as the tags "a" and "b".
 * Mention and receiver types need a URL; it is resolved to a contact id via
 * Contact::getIdForURL(). When no contact id is found, the tag is linked through
 * an entry of the "tag" table instead.
 *
 * @param integer      $uriId  URI id of the post the tag belongs to
 * @param integer      $type   Tag type
 * @param string       $name   Tag name
 * @param string       $url    Contact URL (optional)
 * @param integer|null $target Target type (default: null)
 * @return void
 */
public static function store(int $uriId, int $type, string $name, string $url = '', ?int $target = null)
{
	if ($type == self::HASHTAG) {
		// Trim Unicode non-word characters
		$name = preg_replace('/(^\W+)|(\W+$)/us', '', $name);

		$tags = explode(self::TAG_CHARACTER[self::HASHTAG], $name);
		if (count($tags) > 1) {
			// Store every part on its own. The target is passed on so that split
			// hashtags are handled exactly like a single hashtag would be.
			foreach ($tags as $tag) {
				self::store($uriId, $type, $tag, $url, $target);
			}
			return;
		}
	}

	if (empty($name)) {
		return;
	}

	$cid = 0;
	$tagid = 0;

	if (in_array($type, [self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION, self::TO, self::CC, self::BTO, self::BCC, self::AUDIENCE, self::ATTRIBUTED])) {
		if (empty($url)) {
			// No mention without a contact url
			return;
		}

		// A missing colon after the scheme is only reported, processing continues
		if ((substr($url, 0, 7) == 'https//') || (substr($url, 0, 6) == 'http//')) {
			Logger::notice('Wrong scheme in url', ['url' => $url]);
		}

		$cid = Contact::getIdForURL($url, 0, false);
		Logger::debug('Got id for contact', ['cid' => $cid, 'url' => $url]);

		if (empty($cid)) {
			// No contact: refresh name and type of an already stored tag with this URL
			$tag = DBA::selectFirst('tag', ['name', 'type'], ['url' => $url]);
			if (!empty($tag)) {
				if ($tag['name'] != substr($name, 0, 96)) {
					DBA::update('tag', ['name' => substr($name, 0, 96)], ['url' => $url, 'type' => $tag['type']]);
				}
				if (!empty($target) && ($tag['type'] != $target)) {
					DBA::update('tag', ['type' => $target], ['url' => $url]);
				}
			}
		}
	}

	if (empty($cid)) {
		if (!in_array($type, [self::TO, self::CC, self::BTO, self::BCC, self::AUDIENCE, self::ATTRIBUTED])) {
			// Hashtags and tags whose URL equals their name are stored without URL
			if (($type != self::HASHTAG) && !empty($url) && ($url != $name)) {
				$url = strtolower($url);
			} else {
				$url = '';
			}
		}

		$tagid = self::getID($name, $url, $target);
		if (empty($tagid)) {
			return;
		}
	}

	$fields = ['uri-id' => $uriId, 'type' => $type, 'tid' => $tagid, 'cid' => $cid];

	if (in_array($type, [self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION])) {
		// The same target must not be stored under more than one of the mention types
		$condition = $fields;
		$condition['type'] = [self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION];
		if (DBA::exists('post-tag', $condition)) {
			Logger::info('Tag already exists', $fields);
			return;
		}
	}

	DBA::insert('post-tag', $fields, Database::INSERT_IGNORE);

	Logger::debug('Stored tag/mention', ['uri-id' => $uriId, 'tag-id' => $tagid, 'contact-id' => $cid, 'name' => $name, 'type' => $type]);
}
/**
 * Fetch the target type for the given url
 *
 * A type that is already stored in the "tag" table is returned right away, unless
 * it is a general collection, which is checked again. A newly detected type is
 * written back to an existing tag entry.
 *
 * @param string $url
 * @param bool   $fetch Fetch information via network operations
 * @return null|int One of the target type constants or null when nothing was detected
 */
public static function getTargetType(string $url, bool $fetch = true)
{
	if (empty($url)) {
		return null;
	}

	$detected = null;

	$stored = DBA::selectFirst('tag', ['url', 'type'], ['url' => $url]);
	if (!empty($stored['type'])) {
		$detected = $stored['type'];
		if ($detected != self::GENERAL_COLLECTION) {
			Logger::debug('Found existing type', ['type' => $stored['type'], 'url' => $url]);
			return $detected;
		}
	}

	if ($url == ActivityPub::PUBLIC_COLLECTION) {
		$detected = self::PUBLIC_COLLECTION;
		Logger::debug('Public collection', ['url' => $url]);
	} elseif (DBA::exists('apcontact', ['followers' => $url])) {
		$detected = self::FOLLOWER_COLLECTION;
		Logger::debug('Found collection via existing apcontact', ['url' => $url]);
	} elseif (Contact::getIdForURL($url, 0, $fetch ? null : false)) {
		$detected = self::ACCOUNT;
		Logger::debug('URL is an account', ['url' => $url]);
	} elseif ($fetch && ($detected != self::GENERAL_COLLECTION)) {
		// Last resort: fetch the URL and look at the type of the returned object
		$content = HTTPSignature::fetch($url);
		if (!empty($content['type']) && ($content['type'] == 'OrderedCollection')) {
			$detected = self::GENERAL_COLLECTION;
			Logger::debug('URL is an ordered collection', ['url' => $url]);
		}
	}

	$typeChanged = !empty($detected) && !empty($stored['url']) && ($stored['type'] != $detected);
	if ($typeChanged) {
		DBA::update('tag', ['type' => $detected], ['url' => $url]);
	}

	if (empty($detected)) {
		Logger::debug('No type could be detected', ['url' => $url]);
	}

	return $detected;
}
/**
 * Get a tag id for a given tag name and URL
 *
 * The tag is created when it doesn't exist yet. An existing tag without a type
 * gets the provided type assigned.
 *
 * @param string   $name Name of tag, only the first 96 bytes are used
 * @param string   $url
 * @param int|null $type Type of tag
 * @return int Tag id, 0 when the tag could neither be found nor created
 */
public static function getID(string $name, string $url = '', ?int $type = null): int
{
	$fields = ['name' => substr($name, 0, 96), 'url' => $url];

	$tag = DBA::selectFirst('tag', ['id', 'type'], $fields);
	if (DBA::isResult($tag)) {
		if (empty($tag['type']) && !empty($type)) {
			DBA::update('tag', ['type' => $type], $fields);
		}
		return $tag['id'];
	}

	$insert = $fields;
	if (!empty($type)) {
		$insert['type'] = $type;
	}

	DBA::insert('tag', $insert, Database::INSERT_IGNORE);
	$tid = DBA::lastInsertId();
	if (!empty($tid)) {
		return $tid;
	}

	// The insert is silently ignored when the same tag had been created in the
	// meantime (e.g. by a parallel process). In that case the row exists and can
	// be read instead of reporting an error.
	$tag = DBA::selectFirst('tag', ['id'], $fields);
	if (DBA::isResult($tag)) {
		return $tag['id'];
	}

	// Also log type
	$insert['type'] = $type;
	Logger::error('No tag id created', $insert);
	return 0;
}
/**
 * Store a tag/mention that is identified by its prefix character
 *
 * Nothing is stored when the prefix character doesn't belong to a known tag type.
 *
 * @param integer $uriId
 * @param string  $hash Prefix character of the tag
 * @param string  $name
 * @param string  $url
 * @return void
 */
public static function storeByHash(int $uriId, string $hash, string $name, string $url = '')
{
	$type = self::getTypeForHash($hash);
	if ($type != self::UNKNOWN) {
		self::store($uriId, $type, $name, $url);
	}
}
/**
 * Get tags and mentions from the body
 *
 * Looks for a tag character that is directly followed by a [url=...]...[/url] element.
 *
 * @param string      $body Body of the post
 * @param string|null $tags Accepted tag characters, defaults to hashtag, mention and exclusive mention
 *
 * @return array Tag list, every entry consists of the whole match [0], the tag character [1], the URL [2] and the name [3]
 */
public static function getFromBody(string $body, ?string $tags = null): array
{
	if (is_null($tags)) {
		$tags = self::TAG_CHARACTER[self::HASHTAG] . self::TAG_CHARACTER[self::MENTION] . self::TAG_CHARACTER[self::EXCLUSIVE_MENTION];
	}

	if ($tags === '') {
		// No accepted character means no possible match; an empty character class would corrupt the pattern
		return [];
	}

	// The characters end up inside a character class, so they have to be quoted to be taken literally
	$pattern = '/([' . preg_quote($tags, '/') . '])\[url\=([^\[\]]*)\]([^\[\]]*)\[\/url\]/ism';

	if (!preg_match_all($pattern, $body, $result, PREG_SET_ORDER)) {
		return [];
	}

	return $result;
}
/**
 * Store tags and mentions from the body
 *
 * Wraps the values into a minimal item array and hands it over to storeFromArray().
 *
 * @param integer     $uriId URI-Id
 * @param string      $body  Body of the post
 * @param string|null $tags  Accepted tags
 * @return void
 */
public static function storeFromBody(int $uriId, string $body, ?string $tags = null)
{
	$item = ['uri-id' => $uriId, 'body' => $body, 'quote-uri-id' => null];
	self::storeFromArray($item, $tags);
}
/**
 * Store tags and mentions from the item array
 *
 * Besides the tags of the item body, the already stored hashtags of a shared
 * post are stored for the item as well.
 *
 * @param array       $item Item array, the fields "uri-id" and "body" are read here
 * @param string|null $tags Accepted tags, defaults to hashtag, mention and exclusive mention
 * @return void
 */
public static function storeFromArray(array $item, ?string $tags = null)
{
	Logger::info('Check for tags', ['uri-id' => $item['uri-id'], 'hash' => $tags]);

	if (is_null($tags)) {
		$tags = self::TAG_CHARACTER[self::HASHTAG] . self::TAG_CHARACTER[self::MENTION] . self::TAG_CHARACTER[self::EXCLUSIVE_MENTION];
	}

	foreach (self::getFromBody($item['body'], $tags) as $tag) {
		// $tag: [1] = tag character, [2] = URL, [3] = name
		self::storeByHash($item['uri-id'], $tag[1], $tag[3], $tag[2]);
	}

	$shared = DI::contentItem()->getSharedPost($item, ['uri-id']);

	// Search for hashtags in the shared body (but only if hashtags are wanted)
	if (!empty($shared) && (strpos($tags, self::TAG_CHARACTER[self::HASHTAG]) !== false)) {
		foreach (self::getByURIId($shared['post']['uri-id'], [self::HASHTAG]) as $tag) {
			self::store($item['uri-id'], $tag['type'], $tag['name'], $tag['url']);
		}
	}
}
/**
 * Store raw tags (not encapsulated in links) from the body
 * This function is needed in the intermediate phase.
 * Later we can call Item::setHashtags in advance to have all tags converted.
 *
 * Only entries that start with the hashtag character are stored.
 *
 * @param integer $uriId URI-Id
 * @param string  $body  Body of the post
 * @return void
 */
public static function storeRawTagsFromBody(int $uriId, string $body)
{
	Logger::info('Check for tags', ['uri-id' => $uriId]);

	$rawTags = BBCode::getTags($body);
	if (empty($rawTags)) {
		return;
	}

	Logger::info('Found tags', ['uri-id' => $uriId, 'result' => $rawTags]);

	$hashCharacter = self::TAG_CHARACTER[self::HASHTAG];
	foreach ($rawTags as $rawTag) {
		$prefix = substr($rawTag, 0, 1);
		if ($prefix == $hashCharacter) {
			self::storeByHash($uriId, $prefix, substr($rawTag, 1));
		}
	}
}
/**
 * Checks for stored hashtags and mentions for the given post
 *
 * @param integer $uriId
 * @return bool true when at least one hashtag or (exclusive, implicit) mention is stored for the post
 */
public static function existsForPost(int $uriId): bool
{
	$condition = [
		'uri-id' => $uriId,
		'type'   => [self::HASHTAG, self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION],
	];

	return DBA::exists('post-tag', $condition);
}
/**
 * Remove tag/mention
 *
 * The entry is searched by post, type and URL. The name is only part of the
 * search for hashtags.
 *
 * @param integer $uriId
 * @param integer $type Type
 * @param string  $name Name
 * @param string  $url  URL
 * @return void
 */
public static function remove(int $uriId, int $type, string $name, string $url = '')
{
	$lookup = ['uri-id' => $uriId, 'type' => $type, 'url' => $url];
	if ($type == self::HASHTAG) {
		$lookup['name'] = $name;
	}

	$entry = DBA::selectFirst('tag-view', ['tid', 'cid'], $lookup);
	if (DBA::isResult($entry)) {
		Logger::debug('Removing tag/mention', ['uri-id' => $uriId, 'tid' => $entry['tid'], 'name' => $name, 'url' => $url]);
		DBA::delete('post-tag', ['uri-id' => $uriId, 'type' => $type, 'tid' => $entry['tid'], 'cid' => $entry['cid']]);
	}
}
/**
 * Remove a tag/mention that is identified by its prefix character
 *
 * Nothing is removed when the prefix character doesn't belong to a known tag type.
 *
 * @param integer $uriId
 * @param string  $hash Prefix character of the tag
 * @param string  $name
 * @param string  $url
 * @return void
 */
public static function removeByHash(int $uriId, string $hash, string $name, string $url = '')
{
	$type = self::getTypeForHash($hash);
	if ($type != self::UNKNOWN) {
		self::remove($uriId, $type, $name, $url);
	}
}
/**
 * Get the type for the given hash
 *
 * @param string $hash Prefix character of a tag
 * @return integer Tag type, self::UNKNOWN when the character isn't assigned to a type
 */
private static function getTypeForHash(string $hash): int
{
	// TAG_CHARACTER maps type => character, so the type is the key of the matching character
	$type = array_search($hash, self::TAG_CHARACTER, true);

	return ($type === false) ? self::UNKNOWN : $type;
}
/**
 * Create implicit mentions for a given post
 *
 * The author of the direct parent is always stored as implicit mention. Unless
 * the config value "system.disable_implicit_mentions" is set, all mentions of
 * the parent post are stored as implicit mentions as well.
 *
 * @param integer $uriId       URI id of the post that receives the mentions
 * @param integer $parentUriId URI id of the parent post
 * @return void
 */
public static function createImplicitMentions(int $uriId, int $parentUriId)
{
	// Always mention the direct parent author
	$parent = Post::selectFirst(['author-link', 'author-name'], ['uri-id' => $parentUriId]);

	// The parent post may be unavailable. Passing the then missing values on would
	// raise a type error, and store() ignores empty names and URLs for mentions anyway.
	if (!empty($parent['author-name']) && !empty($parent['author-link'])) {
		self::store($uriId, self::IMPLICIT_MENTION, $parent['author-name'], $parent['author-link']);
	}

	if (DI::config()->get('system', 'disable_implicit_mentions')) {
		return;
	}

	$tags = DBA::select('tag-view', ['name', 'url'], ['uri-id' => $parentUriId, 'type' => [self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION]]);
	while ($tag = DBA::fetch($tags)) {
		self::store($uriId, self::IMPLICIT_MENTION, $tag['name'], $tag['url']);
	}
	DBA::close($tags);
}
/**
 * Retrieves the terms from the provided type(s) associated with the provided item ID.
 *
 * @param int   $uriId
 * @param array $type Tag type(s), defaults to hashtags and all kinds of mentions
 * @return array|bool Array on success, false on error
 * @throws \Exception
 */
public static function getByURIId(int $uriId, array $type = [self::HASHTAG, self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION])
{
	return DBA::selectToArray(
		'tag-view',
		['type', 'name', 'url', 'tag-type'],
		['uri-id' => $uriId, 'type' => $type]
	);
}
/**
 * Checks if the given url is mentioned in the post
 *
 * The URL is compared with Strings::compareLink() against the URL of every
 * stored tag of the given types.
 *
 * @param integer $uriId
 * @param string  $url
 * @param array   $type Tag types to look at, defaults to mention, exclusive mention and audience
 *
 * @return boolean
 */
public static function isMentioned(int $uriId, string $url, array $type = [self::MENTION, self::EXCLUSIVE_MENTION, self::AUDIENCE]): bool
{
	foreach (self::getByURIId($uriId, $type) as $candidate) {
		if (Strings::compareLink($url, $candidate['url'])) {
			return true;
		}
	}

	return false;
}
/**
 * Return a string with all tags and mentions
 *
 * Every tag is rendered as prefix character followed by "[url=<url>]<name>[/url]",
 * the tags are separated by commas.
 *
 * @param integer $uriId
 * @param array   $type Tag type(s)
 * @return string tags and mentions
 * @throws \Exception
 */
public static function getCSVByURIId(int $uriId, array $type = [self::HASHTAG, self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION]): string
{
	$tag_list = [];
	foreach (self::getByURIId($uriId, $type) as $tag) {
		// Callers can ask for types that have no prefix character, these are rendered without one
		$prefix = self::TAG_CHARACTER[$tag['type']] ?? '';

		$tag_list[] = $prefix . '[url=' . $tag['url'] . ']' . $tag['name'] . '[/url]';
	}

	return implode(',', $tag_list);
}
/**
 * Sorts an item's tags into mentions, hashtags and other tags and renders them as HTML links.
 *
 * Tags without URL are linked to the local tag search. Mentions are linked via
 * Contact::magicLinkById() resp. Contact::magicLink().
 *
 * The item is taken by reference for interface compatibility only, this method
 * reads its "uri-id" and doesn't modify it.
 *
 * @param array $item
 * @return array with the keys "tags", "hashtags", "mentions" and "implicit_mentions"
 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
 * @throws \ImagickException
 */
public static function populateFromItem(array &$item): array
{
	$return = [
		'tags'              => [],
		'hashtags'          => [],
		'mentions'          => [],
		'implicit_mentions' => [],
	];

	$searchpath = DI::baseUrl() . '/search?tag=';

	$taglist = DBA::select(
		'tag-view',
		['type', 'name', 'url', 'cid'],
		['uri-id' => $item['uri-id'], 'type' => [self::HASHTAG, self::MENTION, self::EXCLUSIVE_MENTION, self::IMPLICIT_MENTION]]
	);
	while ($tag = DBA::fetch($taglist)) {
		if ($tag['url'] == '') {
			$tag['url'] = $searchpath . rawurlencode($tag['name']);
		}

		$prefix = self::TAG_CHARACTER[$tag['type']];

		switch ($tag['type']) {
			case self::HASHTAG:
				$link = self::renderTagLink($prefix, $tag['url'], $tag['name']);

				$return['hashtags'][] = $link;
				$return['tags'][]     = $link;
				break;

			case self::MENTION:
			case self::EXCLUSIVE_MENTION:
				if (!empty($tag['cid'])) {
					$tag['url'] = Contact::magicLinkById($tag['cid']);
				} else {
					$tag['url'] = Contact::magicLink($tag['url']);
				}

				$link = self::renderTagLink($prefix, $tag['url'], $tag['name']);

				$return['mentions'][] = $link;
				$return['tags'][]     = $link;
				break;

			case self::IMPLICIT_MENTION:
				$return['implicit_mentions'][] = $prefix . $tag['name'];
				break;

			default:
				Logger::warning('Unknown tag type found', $tag);
		}
	}
	DBA::close($taglist);

	return $return;
}

/**
 * Renders a tag as HTML link that is preceded by the tag character
 *
 * URL and name can originate from remote posts, so both are escaped.
 *
 * @param string $prefix Tag character
 * @param string $url    Link target
 * @param string $name   Tag name
 * @return string HTML
 */
private static function renderTagLink(string $prefix, string $url, string $name): string
{
	return '<bdi>' . $prefix . '<a href="' . htmlspecialchars($url, ENT_QUOTES) . '" target="_blank" rel="noopener noreferrer">' . htmlspecialchars($name) . '</a></bdi>';
}
/**
 * Counts posts for given tag
 *
 * Counted are entries of the "tag-search-view" with the given name that either
 * have uid 0, or belong to the given user and aren't global. They additionally
 * have to come from one of the listed networks or belong to a non-zero given user.
 *
 * @param string  $search Tag name
 * @param integer $uid    User id
 * @return integer number of posts
 */
public static function countByTag(string $search, int $uid = 0): int
{
	$sql = "`name` = ? AND (`uid` = ? OR (`uid` = ? AND NOT `global`))\n"
		. "AND (`network` IN (?, ?, ?, ?) OR (`uid` = ? AND `uid` != ?))";

	$networks = [Protocol::ACTIVITYPUB, Protocol::DFRN, Protocol::DIASPORA, Protocol::OSTATUS];

	// Placeholder order: name, uid 0, user, the four networks, user, uid 0
	$condition = array_merge([$sql, $search, 0, $uid], $networks, [$uid, 0]);

	return DBA::count('tag-search-view', $condition);
}
/**
 * Search posts for given tag
 *
 * The result is ordered by descending uri-id.
 *
 * @param string  $search     Tag to search for
 * @param integer $uid        User Id
 * @param integer $start      Starting record
 * @param integer $limit      Maximum count of records
 * @param integer $last_uriid When set, only posts with a lower uri-id are returned
 * @return array with URI-ID
 */
public static function getURIIdListByTag(string $search, int $uid = 0, int $start = 0, int $limit = 100, int $last_uriid = 0): array
{
	$sql = "`name` = ? AND (`uid` = ? OR (`uid` = ? AND NOT `global`))\n"
		. "AND (`network` IN (?, ?, ?, ?) OR (`uid` = ? AND `uid` != ?))";

	$condition = [
		$sql,
		$search, 0, $uid,
		Protocol::ACTIVITYPUB, Protocol::DFRN, Protocol::DIASPORA, Protocol::OSTATUS, $uid, 0,
	];

	if (!empty($last_uriid)) {
		$condition = DBA::mergeConditions($condition, ["`uri-id` < ?", $last_uriid]);
	}

	$rows = DBA::select('tag-search-view', ['uri-id'], $condition, [
		'order' => ['uri-id' => true],
		'limit' => [$start, $limit]
	]);

	$uriIds = [];
	while ($row = DBA::fetch($rows)) {
		$uriIds[] = $row['uri-id'];
	}
	DBA::close($rows);

	return $uriIds;
}
/**
 * Returns a list of the most frequent global hashtags over the given period
 *
 * The list is taken from the cache. It is created with up to 1000 entries when
 * the cache has no (or an empty) entry for the period.
 *
 * @param int $period Period in hours to consider posts
 * @param int $limit  Number of returned tags
 * @param int $offset Page offset in results
 * @return array
 * @throws \Exception
 */
public static function getGlobalTrendingHashtags(int $period, int $limit = 10, int $offset = 0): array
{
	$cached = DI::cache()->get("global_trending_tags-$period");

	$tags = empty($cached) ? self::setGlobalTrendingHashtags($period, 1000) : $cached;

	return array_slice($tags, $offset, $limit);
}
/**
 * Fetch the blocked tags as SQL
 *
 * The comma separated config value "system.blocked_tags" is converted into a
 * "NOT IN" condition with trimmed and escaped tag names.
 *
 * @return string SQL for blocked tag names or empty string
 */
private static function getBlockedSQL(): string
{
	$config = DI::config()->get('system', 'blocked_tags');
	if (empty($config)) {
		return '';
	}

	$quoted = array_map(
		static function ($name) {
			return "'" . DBA::escape(trim($name)) . "'";
		},
		explode(',', $config)
	);

	return ' AND NOT `name` IN (' . implode(',', $quoted) . ')';
}
/**
 * Creates a list of the most frequent global hashtags over the given period
 *
 * A non-empty result is stored in the cache for one hour.
 *
 * @param int $period Period in hours to consider posts
 * @param int $limit  Number of returned tags
 * @return array Rows with the fields "term", "score" and "authors"
 * @throws \Exception
 */
public static function setGlobalTrendingHashtags(int $period, int $limit = 10): array
{
	/*
	 * Get a uri-id that is at least X hours old.
	 * We use the uri-id in the query for the hash tags since this is much faster
	 */
	$oldest = Post::selectFirstThread(
		['uri-id'],
		["`uid` = ? AND `received` < ?", 0, DateTimeFormat::utc('now - ' . $period . ' hour')],
		['order' => ['received' => true]]
	);
	if (empty($oldest['uri-id'])) {
		return [];
	}

	$sql = "SELECT `name` AS `term`, COUNT(*) AS `score`, COUNT(DISTINCT(`author-id`)) as `authors`\n"
		. "FROM `tag-search-view`\n"
		. "WHERE `private` = ? AND `uid` = ? AND `uri-id` > ? " . self::getBlockedSQL() . "\n"
		. "GROUP BY `term` ORDER BY `authors` DESC, `score` DESC LIMIT ?";

	$statement = DBA::p($sql, Item::PUBLIC, 0, $oldest['uri-id'], $limit);
	if (!DBA::isResult($statement)) {
		return [];
	}

	$tags = DBA::toArray($statement);
	DI::cache()->set("global_trending_tags-$period", $tags, Duration::HOUR);

	return $tags;
}
/**
 * Returns a list of the most frequent local hashtags over the given period
 *
 * The list is taken from the cache. It is created with up to 1000 entries when
 * the cache has no (or an empty) entry for the period.
 *
 * @param int $period Period in hours to consider posts
 * @param int $limit  Number of returned tags
 * @param int $offset Page offset in results
 * @return array
 * @throws \Exception
 */
public static function getLocalTrendingHashtags(int $period, $limit = 10, int $offset = 0): array
{
	$cached = DI::cache()->get("local_trending_tags-$period");

	$tags = empty($cached) ? self::setLocalTrendingHashtags($period, 1000) : $cached;

	return array_slice($tags, $offset, $limit);
}
/**
 * Creates a list of the most frequent local hashtags over the given period
 *
 * Only entries that are flagged as "wall" and "origin" are considered. A
 * non-empty result is stored in the cache for one hour.
 *
 * @param int $period Period in hours to consider posts
 * @param int $limit  Number of returned tags
 * @return array Rows with the fields "term", "score" and "authors"
 * @throws \Exception
 */
public static function setLocalTrendingHashtags(int $period, int $limit = 10): array
{
	// Get a uri-id that is at least X hours old.
	// We use the uri-id in the query for the hash tags since this is much faster
	$oldest = Post::selectFirstThread(
		['uri-id'],
		["`uid` = ? AND `received` < ?", 0, DateTimeFormat::utc('now - ' . $period . ' hour')],
		['order' => ['received' => true]]
	);
	if (empty($oldest['uri-id'])) {
		return [];
	}

	$sql = "SELECT `name` AS `term`, COUNT(*) AS `score`, COUNT(DISTINCT(`author-id`)) as `authors`\n"
		. "FROM `tag-search-view`\n"
		. "WHERE `private` = ? AND `wall` AND `origin` AND `uri-id` > ? " . self::getBlockedSQL() . "\n"
		. "GROUP BY `term` ORDER BY `authors` DESC, `score` DESC LIMIT ?";

	$statement = DBA::p($sql, Item::PUBLIC, $oldest['uri-id'], $limit);
	if (!DBA::isResult($statement)) {
		return [];
	}

	$tags = DBA::toArray($statement);
	DI::cache()->set("local_trending_tags-$period", $tags, Duration::HOUR);

	return $tags;
}
/**
 * Check if the provided tag is of one of the provided term types.
 *
 * Types without a prefix character are ignored.
 *
 * @param string $tag      Tag name
 * @param int    ...$types Tag types
 * @return bool Result of Strings::startsWithChars() for the tag and the prefix characters of the types
 */
public static function isType(string $tag, ...$types): bool
{
	$prefixes = [];
	foreach ($types as $candidate) {
		if (!array_key_exists($candidate, self::TAG_CHARACTER)) {
			continue;
		}

		$prefixes[] = self::TAG_CHARACTER[$candidate];
	}

	return Strings::startsWithChars($tag, $prefixes);
}
/**
 * Fetch the users who subscribed to the given tag
 *
 * @param string $tag Term as stored in the "search" table
 * @return array List of user ids, one entry per matching "search" row
 */
private static function getUIDListByTag(string $tag): array
{
	$subscribers = [];

	$rows = DBA::select('search', ['uid'], ['term' => $tag]);
	while ($row = DBA::fetch($rows)) {
		$subscribers[] = $row['uid'];
	}
	DBA::close($rows);

	return $subscribers;
}
/**
 * Fetch the users who subscribed to the tags of the given item
 *
 * @param integer $uriId
 * @return array Subscribed hashtag names of the item, grouped by user id
 */
public static function getUIDListByURIId(int $uriId): array
{
	$hashCharacter = self::TAG_CHARACTER[self::HASHTAG];

	$subscriptions = [];
	foreach (self::getByURIId($uriId, [self::HASHTAG]) as $hashtag) {
		// The subscriptions are looked up with the leading hashtag character
		$subscribers = self::getUIDListByTag($hashCharacter . $hashtag['name']);
		foreach ($subscribers as $uid) {
			$subscriptions[$uid][] = $hashtag['name'];
		}
	}

	return $subscriptions;
}
}