2018-07-31 04:06:22 +02:00
|
|
|
<?php
|
2020-02-09 15:45:36 +01:00
|
|
|
/**
|
2022-01-02 08:27:47 +01:00
|
|
|
* @copyright Copyright (C) 2010-2022, the Friendica project
|
2020-02-09 15:45:36 +01:00
|
|
|
*
|
|
|
|
* @license GNU AGPL version 3 or any later version
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU Affero General Public License as
|
|
|
|
* published by the Free Software Foundation, either version 3 of the
|
|
|
|
* License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU Affero General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
*
|
|
|
|
*/
|
2018-07-31 04:06:22 +02:00
|
|
|
|
|
|
|
namespace Friendica\Util;
|
|
|
|
|
2021-07-05 05:41:05 +00:00
|
|
|
use Friendica\Core\Logger;
|
|
|
|
use Friendica\Core\System;
|
2019-12-15 22:34:11 +01:00
|
|
|
use Friendica\DI;
|
2018-07-31 04:06:22 +02:00
|
|
|
|
|
|
|
/**
 * Proxy utilities class
 *
 * Static helpers that rewrite remote image URLs (either a single URL or the
 * "src" attributes of <img> tags inside an HTML fragment) so that they point
 * to this node's "/proxy/" route instead of the remote host.
 */
class Proxy
{
	/**
	 * Sizes constants
	 */
	const SIZE_MICRO  = 'micro';  // 48
	const SIZE_THUMB  = 'thumb';  // 80
	const SIZE_SMALL  = 'small';  // 300
	const SIZE_MEDIUM = 'medium'; // 600
	const SIZE_LARGE  = 'large';  // 1024

	/**
	 * Pixel Sizes
	 */
	const PIXEL_MICRO  = 48;
	const PIXEL_THUMB  = 80;
	const PIXEL_SMALL  = 300;
	const PIXEL_MEDIUM = 600;
	const PIXEL_LARGE  = 1024;

	/**
	 * Accepted extensions
	 *
	 * Only these (lower-case) extensions are appended to a generated proxy path.
	 *
	 * @var array
	 * @todo Make this configurable?
	 */
	private static $extensions = [
		'jpg',
		'jpeg',
		'gif',
		'png',
	];

	/**
	 * Private constructor
	 */
	private function __construct()
	{
		// No instances from utilities classes
	}

	/**
	 * Transform a remote URL into a local one.
	 *
	 * This function only performs the URL replacement on http(s) URLs and if the
	 * provided URL isn't local. When the "system.proxify_content" config value
	 * is falsy the URL is returned untouched.
	 *
	 * The generated path is "<base>/proxy/<2 hex chars>/<url-safe base64 of URL>[.ext][:size]".
	 * If that path is longer than 250 characters, the short form
	 * "<base>/proxy/<md5 of URL>[.ext]?url=<urlencoded URL>" is returned instead;
	 * note that the short form does not carry the size suffix.
	 *
	 * @param string $url  The URL to proxyfy
	 * @param string $size One of the Proxy::SIZE_* constants
	 * @return string The proxyfied URL or relative path
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	public static function proxifyUrl(string $url, string $size = ''): string
	{
		if (!DI::config()->get('system', 'proxify_content')) {
			return $url;
		}

		// Trim URL first
		$url = trim($url);

		// Quit if not an HTTP/HTTPS link or if local
		if (!in_array(parse_url($url, PHP_URL_SCHEME), ['http', 'https'], true) || self::isLocalImage($url)) {
			return $url;
		}

		// Image URL may have encoded ampersands for display which aren't desirable for proxy
		$url = html_entity_decode($url, ENT_NOQUOTES, 'utf-8');

		$shortpath = hash('md5', $url);

		// First two hash characters act as a directory prefix, followed by the URL-safe base64 of the URL
		$longpath = substr($shortpath, 0, 2) . '/' . strtr(base64_encode($url), '+/', '-_');

		// Extract the URL extension; parse_url() yields null when the URL has no path,
		// so cast to string before handing it to pathinfo()
		$extension = pathinfo((string)parse_url($url, PHP_URL_PATH), PATHINFO_EXTENSION);

		if (in_array($extension, self::$extensions, true)) {
			$shortpath .= '.' . $extension;
			$longpath  .= '.' . $extension;
		}

		$proxypath = DI::baseUrl() . '/proxy/' . $longpath;

		if ($size !== '') {
			$size = ':' . $size;
		}

		Logger::info('Created proxy link', ['url' => $url, 'callstack' => System::callstack(20)]);

		// Too long files aren't supported by Apache
		if (strlen($proxypath) > 250) {
			return DI::baseUrl() . '/proxy/' . $shortpath . '?url=' . urlencode($url);
		}

		return $proxypath . $size;
	}

	/**
	 * "Proxifies" HTML code's image tags
	 *
	 * "Proxifies", means replaces image URLs in given HTML code with those from
	 * proxy storage directory.
	 *
	 * Before the replacement, occurrences of the normalised base URL are
	 * rewritten to the real base URL. If the regular expression engine fails,
	 * the (base-URL-rewritten) HTML is returned without image replacement.
	 *
	 * @param string $html Un-proxified HTML code
	 *
	 * @return string Proxified HTML code
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	public static function proxifyHtml(string $html): string
	{
		$html = str_replace(Strings::normaliseLink(DI::baseUrl()) . '/', DI::baseUrl() . '/', $html);

		// Array callable instead of the 'self::replaceUrl' string form, which is deprecated as of PHP 8.2
		$proxified = preg_replace_callback(
			'/(<img [^>]*src *= *["\'])([^"\']+)(["\'][^>]*>)/siU',
			[self::class, 'replaceUrl'],
			$html
		);

		// preg_replace_callback() returns null on a PCRE error, which would violate the return type
		return $proxified ?? $html;
	}

	/**
	 * Checks if the URL is a local URL.
	 *
	 * URLs starting with "/" and "data:" URIs (case-insensitive) are always
	 * considered local; everything else is decided by Network::isLocalLink().
	 *
	 * @param string $url
	 *
	 * @return boolean
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	public static function isLocalImage(string $url): bool
	{
		if (substr($url, 0, 1) === '/') {
			return true;
		}

		if (strtolower(substr($url, 0, 5)) === 'data:') {
			return true;
		}

		return Network::isLocalLink($url);
	}

	/**
	 * Return the array of query string parameters from a URL
	 *
	 * HTML entities in the query string (e.g. "&amp;") are decoded before it
	 * is parsed. A URL without a (parsable) query string yields an empty array.
	 *
	 * @param string $url URL to parse
	 *
	 * @return array Associative array of query string parameters
	 */
	private static function parseQuery(string $url): array
	{
		$query = parse_url($url, PHP_URL_QUERY);

		// parse_url() returns null without a query string and false on a malformed URL
		if (!is_string($query) || $query === '') {
			return [];
		}

		parse_str(html_entity_decode($query), $arr);

		return $arr;
	}

	/**
	 * Call-back method to replace the URL
	 *
	 * Used by proxifyHtml(): receives the pieces of one matched <img> tag and
	 * returns the tag with its "src" value proxified when it is not local.
	 *
	 * @param array $matches Matches from preg_replace_callback():
	 *                       [1] tag up to and including the opening quote of "src",
	 *                       [2] the "src" value, [3] the closing quote and rest of the tag
	 *
	 * @return string Proxified HTML image tag
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	private static function replaceUrl(array $matches): string
	{
		// if the picture seems to be from another picture cache then take the original source
		$queryvar = self::parseQuery($matches[2]);

		// The "url" parameter may be an array (e.g. "?url[]=..."), which must not reach substr()
		if (!empty($queryvar['url']) && is_string($queryvar['url']) && substr($queryvar['url'], 0, 4) === 'http') {
			// NOTE(review): parse_str() already URL-decodes values, so this decodes a second time - confirm this is intended
			$matches[2] = urldecode($queryvar['url']);
		}

		// Following line changed per bug #431
		if (self::isLocalImage($matches[2])) {
			return $matches[1] . $matches[2] . $matches[3];
		}

		// Return proxified HTML
		return $matches[1] . self::proxifyUrl(htmlspecialchars_decode($matches[2])) . $matches[3];
	}
}
|