2018-07-31 04:06:22 +02:00
|
|
|
<?php
|
|
|
|
/**
 * @file src/Module/Proxy.php
 * Based upon "Privacy Image Cache" by Tobias Hößl <https://github.com/CatoTH/>
 */
|
|
|
|
namespace Friendica\Module;
|
|
|
|
|
|
|
|
use Friendica\BaseModule;
|
2019-10-06 20:48:33 +02:00
|
|
|
use Friendica\Core\Logger;
|
2019-12-15 22:34:11 +01:00
|
|
|
use Friendica\DI;
|
2018-07-31 04:06:22 +02:00
|
|
|
use Friendica\Model\Photo;
|
|
|
|
use Friendica\Object\Image;
|
2019-03-18 23:33:20 +01:00
|
|
|
use Friendica\Util\HTTPSignature;
|
2018-07-31 04:06:22 +02:00
|
|
|
use Friendica\Util\Proxy as ProxyUtils;
|
|
|
|
|
|
|
|
/**
 * Module Proxy
 *
 * Fetches a remote image on behalf of the client, caches it and serves it
 * with long-lived HTTP cache headers.
 *
 * urls:
 * /proxy/[sub1/[sub2/]]<base64url image url>[.ext][:size]
 * /proxy?url=<image url>
 */
class Proxy extends BaseModule
{
    /**
     * Initializer method for this class.
     *
     * Answers conditional requests with "304 Not Modified", otherwise tries to
     * serve the image from the file cache or the database and, as a last
     * resort, fetches it remotely, stores it and outputs it.
     *
     * Pictures are stored in one of the following ways:
     *
     * 1. If a folder "proxy" exists and is writeable, then use this for caching
     * 2. If a cache path is defined, use this
     * 3. If everything else failed, cache into the database
     *
     * Every successful path ends the script (see responseImageHttpCache()).
     *
     * @param array $parameters Not used by this method.
     *
     * @throws \Friendica\Network\HTTPException\BadRequestException          If no image url could be determined.
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException If the image can't be fetched or is invalid.
     */
    public static function init(array $parameters = [])
    {
        if (isset($_SERVER['HTTP_IF_MODIFIED_SINCE']) && isset($_SERVER['HTTP_IF_NONE_MATCH'])) {
            header('HTTP/1.1 304 Not Modified');
            header('Etag: ' . $_SERVER['HTTP_IF_NONE_MATCH']);

            // The previous code set these three headers and removed them right
            // away; only the removal had any effect, so only it is kept.
            header_remove('Last-Modified');
            header_remove('Expires');
            header_remove('Cache-Control');

            /// @TODO Stop here?
            exit();
        }

        // Header names are case-insensitive, one call removes any spelling.
        header_remove('Pragma');

        $direct_cache = self::setupDirectCache();

        $request = self::getRequestInfo();

        if (empty($request['url'])) {
            throw new \Friendica\Network\HTTPException\BadRequestException();
        }

        // Webserver already tried direct cache...

        // Try to use filecache; the script ends here on a cache hit.
        $cachefile = self::responseFromCache($request);

        // Try to use photo from db; the script ends here if it is found.
        self::responseFromDB($request);

        //
        // If script is here, the requested url has never been cached before.
        // Let's fetch it, scale it if required, then save it in cache.
        //

        // It shouldn't happen but it does - spaces in URL
        $request['url'] = str_replace(' ', '+', $request['url']);
        $fetchResult = HTTPSignature::fetchRaw($request['url'], local_user(), true, ['timeout' => 10]);
        $img_str = $fetchResult->getBody();

        // A 4xx return code or an empty body is an error: responseError() throws.
        if ((substr((string)$fetchResult->getReturnCode(), 0, 1) === '4') || empty($img_str)) {
            Logger::info('Error fetching image', ['image' => $request['url'], 'return' => $fetchResult->getReturnCode(), 'empty' => empty($img_str)]);
            self::responseError();
            // stop.
        }

        // Detect the mime type from the fetched bytes directly instead of
        // writing them to a temporary file first.
        $mime = (new \finfo(FILEINFO_MIME_TYPE))->buffer($img_str);

        $image = new Image($img_str, $mime);
        if (!$image->isValid()) {
            Logger::info('The image is invalid', ['image' => $request['url'], 'mime' => $mime]);
            self::responseError();
            // stop.
        }

        // Target file below ./proxy/, only needed (and computed) for direct cache.
        $directCacheFile = '';
        if ($direct_cache) {
            $directCacheFile = DI::app()->getBasePath() . '/proxy/' . ProxyUtils::proxifyUrl($request['url'], true);
        }

        // Store original image
        if ($direct_cache) {
            // direct cache, store under ./proxy/
            file_put_contents($directCacheFile, $image->asString());
        } elseif ($cachefile !== '') {
            // cache file
            file_put_contents($cachefile, $image->asString());
        } else {
            // database
            Photo::store($image, 0, 0, $request['urlhash'], $request['url'], '', 100);
        }

        // reduce quality - if it isn't a GIF
        if ($image->getType() !== 'image/gif') {
            $image->scaleDown($request['size']);
        }

        // Store scaled image next to the original, suffixed with the size type
        if ($direct_cache && $request['sizetype'] != '') {
            file_put_contents($directCacheFile . $request['sizetype'], $image->asString());
        }

        self::responseImageHttpCache($image);
        // stop.
    }

    /**
     * Build info about requested image to be proxied
     *
     * The url is taken from the last available path argument (base64url
     * encoded, optionally followed by a file extension and a size suffix)
     * unless a "url" request parameter is present, which is used verbatim.
     *
     * @return array
     *    [
     *      'url' => requested url ('' if it could not be determined),
     *      'urlhash' => sha1 hash of the url prefixed with 'pic:',
     *      'size' => requested image size (int)
     *      'sizetype' => requested image size (string): ':micro', ':thumb', ':small', ':medium', ':large'
     *    ]
     * @throws \Exception
     */
    private static function getRequestInfo(): array
    {
        $a = DI::app();
        $size = 1024;
        $sizetype = '';

        // Look for filename in the arguments
        // @TODO: Replace with parameter from router
        if (($a->argc > 1) && !isset($_REQUEST['url'])) {
            if (isset($a->argv[3])) {
                $url = $a->argv[3];
            } elseif (isset($a->argv[2])) {
                $url = $a->argv[2];
            } else {
                $url = $a->argv[1];
            }

            /// @TODO: Why? And what about $url in this case?
            /// @TODO: Replace with parameter from router
            if (isset($a->argv[3]) && ($a->argv[3] === 'thumb')) {
                $size = 200;
            }

            // Size suffixes and the pixel size each one requests. No suffix
            // is the tail of another one, so at most one of them can match.
            $sizes = [
                ':micro'  => 48,
                ':thumb'  => 80,
                ':small'  => 300,
                ':medium' => 600,
                ':large'  => 1024,
            ];

            foreach ($sizes as $suffix => $pixels) {
                $length = strlen($suffix);
                if (substr($url, -$length) === $suffix) {
                    $size = $pixels;
                    $sizetype = $suffix;
                    $url = substr($url, 0, -$length);
                    break;
                }
            }

            // Cut everything after the base64 padding ("=.ext" -> "=")
            $pos = strrpos($url, '=.');
            if ($pos) {
                $url = substr($url, 0, $pos + 1);
            }

            $url = str_replace(['.jpg', '.jpeg', '.gif', '.png'], '', $url);

            // base64url -> base64; strict decoding returns false on invalid input
            $url = base64_decode(strtr($url, '-_', '+/'), true);
        } else {
            $url = $_REQUEST['url'] ?? '';
        }

        // A failed decode (false) or an array-valued "url" parameter is not a
        // usable url; report it as empty so the caller rejects the request.
        if (!is_string($url)) {
            $url = '';
        }

        return [
            'url' => $url,
            'urlhash' => 'pic:' . sha1($url),
            'size' => $size,
            'sizetype' => $sizetype,
        ];
    }

    /**
     * setup ./proxy folder for direct cache
     *
     * Tries to create the folder below the application base path if it is
     * missing and the base path is writable.
     *
     * @return bool False if direct cache can't be used.
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException
     */
    private static function setupDirectCache(): bool
    {
        $a = DI::app();
        $basepath = $a->getBasePath();
        $proxyDir = $basepath . '/proxy';

        // If the cache path isn't there, try to create it
        if (!is_dir($proxyDir) && is_writable($basepath)) {
            mkdir($proxyDir);
        }

        // Direct cache requires a working, writable folder in the webroot and
        // is only used when the image url is passed in the path arguments,
        // not when it is passed in the query string.
        return is_dir($proxyDir)
            && is_writable($proxyDir)
            && ($a->argc > 1)
            && !isset($_REQUEST['url']);
    }

    /**
     * Try to reply with image in cachefile
     *
     * If the cache file exists, the script ends here and this function never returns.
     *
     * @param array $request Array from getRequestInfo
     *
     * @return string Cache file name, empty string if cache is not enabled.
     *
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException
     * @throws \ImagickException
     */
    private static function responseFromCache(array $request): string
    {
        // Cast so that callers can rely on a strict comparison with ''.
        $cachefile = (string)get_cachefile(hash('md5', $request['url']));

        if ($cachefile !== '' && file_exists($cachefile)) {
            $img = new Image(file_get_contents($cachefile), mime_content_type($cachefile));
            self::responseImageHttpCache($img);
            // stop.
        }

        return $cachefile;
    }

    /**
     * Try to reply with image in database
     *
     * If the image exists in the database, the script ends here and this function never returns.
     *
     * @param array $request Array from getRequestInfo
     *
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException
     * @throws \ImagickException
     */
    private static function responseFromDB(array $request)
    {
        $photo = Photo::getPhoto($request['urlhash']);

        if ($photo !== false) {
            $img = Photo::getImageForPhoto($photo);
            self::responseImageHttpCache($img);
            // stop.
        }
    }

    /**
     * In case of an error just stop. We don't return content to avoid caching problems
     *
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException Always.
     */
    private static function responseError()
    {
        throw new \Friendica\Network\HTTPException\InternalServerErrorException();
    }

    /**
     * Output the image with cache headers
     *
     * Sends the image with an ETag derived from its content and a one year
     * cache lifetime, then ends the script.
     *
     * @param Image $img
     * @throws \Friendica\Network\HTTPException\InternalServerErrorException If the image is invalid.
     */
    private static function responseImageHttpCache(Image $img)
    {
        if (!$img->isValid()) {
            Logger::info('The cached image is invalid');
            self::responseError();
            // stop.
        }

        // Serialize once; the same bytes feed the ETag and the response body.
        $body = $img->asString();

        header('Content-type: ' . $img->getType());
        header('Last-Modified: ' . gmdate('D, d M Y H:i:s', time()) . ' GMT');
        header('Etag: "' . md5($body) . '"');
        header('Expires: ' . gmdate('D, d M Y H:i:s', time() + (31536000)) . ' GMT');
        header('Cache-Control: max-age=31536000');
        echo $body;
        exit();
    }
}
|