2019-09-30 20:52:05 +02:00
< ? php
/**
 * Name: Photo Track
 * Description: Track which photos are actually being used and delete any others
 * Version: 1.0
 * Author: Matthew Exon <http://mat.exon.name>
 */
/*
 * List of tables and the fields that are checked:
 *
 * contact:      photo thumb micro about
 * fcontact:     photo
 * fsuggest:     photo
 * gcontact:     photo about
 * post-content: body
 *
 * Tables and fields that were part of the original list but are not scanned
 * by phototrack_check_row():
 *
 * item:         body
 * item-content: body
 * mail:         from-photo
 * notify:       photo
 * profile:      photo thumb about
 */
use Friendica\Core\Addon;
use Friendica\Core\Hook;
use Friendica\Core\Logger;
use Friendica\Database\DBA;
use Friendica\DI;
use Friendica\Object\Image;
use Friendica\Util\DateTimeFormat;
use Friendica\Util\Images;
2019-09-30 20:52:05 +02:00
// Default number of rows fetched per table in one search run.
// Can be pre-defined elsewhere, in which case that value is kept.
defined('PHOTOTRACK_DEFAULT_BATCH_SIZE') || define('PHOTOTRACK_DEFAULT_BATCH_SIZE', 1000);

// Default time in *minutes* between searching for photo uses.
// Can be pre-defined elsewhere, in which case that value is kept.
defined('PHOTOTRACK_DEFAULT_SEARCH_INTERVAL') || define('PHOTOTRACK_DEFAULT_SEARCH_INTERVAL', 10);
/**
 * Installs the addon: registers its hooks and creates its database tables.
 *
 * The table definitions are read from database.sql next to this file and are
 * executed one statement at a time. The schema version is only written to the
 * config after every statement succeeded, so a failed run is repeated on the
 * next install.
 */
function phototrack_install()
{
	Hook::register('post_local_end', 'addon/phototrack/phototrack.php', 'phototrack_post_local_end');
	Hook::register('post_remote_end', 'addon/phototrack/phototrack.php', 'phototrack_post_remote_end');
	Hook::register('notifier_end', 'addon/phototrack/phototrack.php', 'phototrack_notifier_end');
	Hook::register('cron', 'addon/phototrack/phototrack.php', 'phototrack_cron');

	if (DI::config()->get('phototrack', 'dbversion') == '0.1') {
		// Tables were already created by an earlier install
		return;
	}

	$schema_file = __DIR__ . '/database.sql';
	$schema = file_get_contents($schema_file);
	if ($schema === false) {
		Logger::warning('Unable to read database schema file: ' . $schema_file);
		return;
	}

	foreach (explode(';', $schema) as $statement) {
		$statement = trim($statement);

		// Splitting on ';' leaves an empty fragment after the last statement.
		// Executing it would fail and abort before the version is stored.
		if ($statement === '') {
			continue;
		}

		if (!DBA::e($statement)) {
			Logger::warning('Unable to create database table: ' . DBA::errorMessage());
			return;
		}
	}

	DI::config()->set('phototrack', 'dbversion', '0.1');
}
/**
 * Uninstalls the addon by unregistering every hook that phototrack_install()
 * registered. The addon's database tables and config values are left in place.
 */
function phototrack_uninstall()
{
	$file = 'addon/phototrack/phototrack.php';

	// Hook name => handler function, same order as in phototrack_install()
	$handlers = [
		'post_local_end'  => 'phototrack_post_local_end',
		'post_remote_end' => 'phototrack_post_remote_end',
		'notifier_end'    => 'phototrack_notifier_end',
		'cron'            => 'phototrack_cron',
	];

	foreach ($handlers as $hook => $function) {
		Hook::unregister($hook, $file, $function);
	}
}
/**
 * Intentionally empty function; it takes no arguments and does nothing.
 * NOTE(review): presumably present so the addon is recognised as providing a
 * module - confirm against the addon loader.
 */
function phototrack_module()
{
}
/**
 * Records that a row of a scanned table has just been checked for photo uses.
 *
 * Updates the "checked" timestamp of the matching phototrack_row_check entry,
 * or inserts a new entry when the row has not been seen before.
 *
 * @param string $table Name of the table the row belongs to
 * @param mixed  $id    Identifier of the row within that table
 */
function phototrack_finished_row($table, $id)
{
	$condition = ['table' => $table, 'row-id' => $id];
	$now = DateTimeFormat::utcNow();

	// Same existence test as phototrack_photo_use()
	if (DBA::isResult(DBA::selectFirst('phototrack_row_check', ['id'], $condition))) {
		DBA::update('phototrack_row_check', ['checked' => $now], $condition);
	} else {
		DBA::insert('phototrack_row_check', ['table' => $table, 'row-id' => $id, 'checked' => $now]);
	}
}
/**
 * Records that a photo is referenced by a field of a database row.
 *
 * The photo name is reduced to its resource id by removing known image file
 * extensions and a trailing "-X" suffix. Nothing is recorded unless the result
 * is 32 characters long and exists as a resource id in the photo table.
 *
 * @param string $photo Photo name, optionally with "-X" suffix and file extension
 * @param string $table Table that references the photo
 * @param string $field Field of that table that references the photo
 * @param mixed  $id    Identifier of the referencing row
 */
function phototrack_photo_use($photo, $table, $field, $id)
{
	Logger::debug('@@@ phototrack_photo_use ' . $photo);

	foreach (Images::supportedTypes() as $extension) {
		$photo = str_replace('.' . $extension, '', $photo);
	}

	// Drop a trailing "-X" suffix (presumably the scale of the photo - confirm)
	if (substr($photo, -2, 1) == '-') {
		$photo = substr($photo, 0, -2);
	}

	if (strlen($photo) != 32) {
		return;
	}

	$r = DBA::selectFirst('photo', ['resource-id'], ['resource-id' => $photo]);
	if (!DBA::isResult($r)) {
		return;
	}

	$use = ['resource-id' => $r['resource-id'], 'table' => $table, 'field' => $field, 'row-id' => $id];
	$now = DateTimeFormat::utcNow();

	if (DBA::isResult(DBA::selectFirst('phototrack_photo_use', ['id'], $use))) {
		DBA::update('phototrack_photo_use', ['checked' => $now], $use);
	} else {
		DBA::insert('phototrack_photo_use', $use + ['checked' => $now]);
	}
}
2023-12-26 17:35:27 +01:00
/**
 * Checks whether a URL points at a photo below this node's base URL and, if
 * so, records the photo as used.
 *
 * The URL must contain the base URL, followed somewhere later by "/photo/"
 * and a run of 32 characters from [0-9a-z], which is taken as the resource id.
 *
 * @param mixed  $a        Passed through by the callers; not used here
 * @param string $table    Table the URL was read from
 * @param string $id_field Name of the identifier column (only logged)
 * @param string $field    Field the URL was read from
 * @param mixed  $id       Identifier of the row
 * @param mixed  $url      URL to inspect; null and non-string values are ignored
 */
function phototrack_check_field_url($a, $table, $id_field, $field, $id, $url)
{
	if (!is_string($url) || $url === '') {
		// Empty database fields cannot reference a photo
		return;
	}

	Logger::info('@@@ phototrack_check_field_url table ' . $table . ' id_field ' . $id_field . ' field ' . $field . ' id ' . $id . ' url ' . $url);

	$baseurl = DI::baseUrl()->get(true);

	$pos = strpos($url, $baseurl);
	if ($pos === false) {
		return;
	}

	// Cut relative to where the base URL was found, not from the string start
	$url = substr($url, $pos + strlen($baseurl));
	Logger::info('@@@ phototrack_check_field_url funny url stuff ' . $url . ' base ' . $baseurl);

	$pos = strpos($url, '/photo/');
	if ($pos === false) {
		return;
	}

	$url = substr($url, $pos + strlen('/photo/'));
	Logger::info('@@@ phototrack_check_field_url more url stuff ' . $url);

	if (preg_match('/([0-9a-z]{32})/', $url, $matches)) {
		$rid = $matches[0];
		Logger::info('@@@ phototrack_check_field_url rid ' . $rid);
		phototrack_photo_use($rid, $table, $field, $id);
	}
}
2023-12-26 17:35:27 +01:00
/**
 * Scans a BBCode text for [img] tags and checks every image URL found for a
 * photo use.
 *
 * Both the URL between "[img]" / "[img=WxH]" and "[/img]" and the value of an
 * "[img=...]" attribute are handed to phototrack_check_field_url(), which
 * ignores anything that is not a photo URL of this node (e.g. "640x480").
 *
 * @param mixed  $a        Passed through to phototrack_check_field_url()
 * @param string $table    Table the text was read from
 * @param string $id_field Name of the identifier column
 * @param string $field    Field the text was read from
 * @param mixed  $id       Identifier of the row
 * @param mixed  $value    BBCode text; null and non-string values are ignored
 */
function phototrack_check_field_bbcode($a, $table, $id_field, $field, $id, $value)
{
	if (!is_string($value) || $value === '') {
		return;
	}

	Logger::info('@@@ phototrack_check_field_bbcode table ' . $table . ' id_field ' . $id_field . ' field ' . $field . ' id ' . $id . ' value ' . $value);

	$urls = [];

	// [img]URL[/img] and [img=WxH]URL[/img]
	if (preg_match_all('/\[img(\=([0-9]*)x([0-9]*))?\](.*?)\[\/img\]/ism', $value, $matches)) {
		$urls = $matches[4];
	}

	// [img=URL]description[/img]: the URL is the attribute value
	if (preg_match_all('/\[img\=([^\[\]]+)\]/ism', $value, $matches)) {
		$urls = array_merge($urls, $matches[1]);
	}

	foreach ($urls as $url) {
		phototrack_check_field_url($a, $table, $id_field, $field, $id, $url);
	}
}
/**
 * Handler registered for the 'post_local_end' hook: scans the body of the
 * given item for photo uses.
 *
 * The item is checked as a 'post-content' row, because that is the only post
 * table phototrack_check_row() has a field list for. The previous table names
 * 'item' and 'item-content' matched no field list, so nothing was scanned.
 *
 * @param mixed $a    Passed through to phototrack_check_row()
 * @param array $item Item data; expected to carry the post body and its ids
 */
function phototrack_post_local_end(&$a, &$item)
{
	if (!is_array($item)) {
		return;
	}

	phototrack_check_row($a, 'post-content', 'uri-id', $item);
}
/**
 * Handler registered for the 'post_remote_end' hook: scans the body of the
 * given item for photo uses.
 *
 * The item is checked as a 'post-content' row, because that is the only post
 * table phototrack_check_row() has a field list for. The previous table names
 * 'item' and 'item-content' matched no field list, so nothing was scanned.
 *
 * @param mixed $a    Passed through to phototrack_check_row()
 * @param array $item Item data; expected to carry the post body and its ids
 */
function phototrack_post_remote_end(&$a, &$item)
{
	if (!is_array($item)) {
		return;
	}

	phototrack_check_row($a, 'post-content', 'uri-id', $item);
}
/**
 * Handler registered for the 'notifier_end' hook. Intentionally does nothing.
 *
 * @param mixed $item Hook data; ignored
 */
function phototrack_notifier_end($item)
{
}
2023-12-26 17:35:27 +01:00
/**
 * Checks every photo-carrying field of one database row and then marks the
 * row as checked.
 *
 * Tables without a field list are not scanned, but the row is still marked as
 * checked.
 *
 * @param mixed  $a        Passed through to the field checkers
 * @param string $table    Table the row was read from
 * @param string $id_field Name of the column that identifies the row
 * @param array  $row      The row, keyed by column name
 */
function phototrack_check_row($a, $table, $id_field, $row)
{
	// Field name => kind of content, per table
	$fields_by_table = [
		'post-content' => ['body' => 'bbcode'],
		'contact'      => ['photo' => 'url', 'thumb' => 'url', 'micro' => 'url', 'about' => 'bbcode'],
		'fcontact'     => ['photo' => 'url'],
		'fsuggest'     => ['photo' => 'url'],
		'gcontact'     => ['photo' => 'url', 'about' => 'bbcode'],
	];

	// Not every table is keyed by "id" (post-content is searched by "uri-id"),
	// so the identifier has to be read from the column the caller named.
	if (!is_array($row) || !isset($row[$id_field])) {
		Logger::warning('phototrack: row of table ' . $table . ' has no ' . $id_field . ' field');
		return;
	}
	$id = $row[$id_field];

	$fields = isset($fields_by_table[$table]) ? $fields_by_table[$table] : [];

	foreach ($fields as $field => $type) {
		if (!isset($row[$field])) {
			// Missing or NULL field: nothing to scan
			continue;
		}

		if ($type === 'bbcode') {
			phototrack_check_field_bbcode($a, $table, $id_field, $field, $id, $row[$field]);
		} elseif ($type === 'url') {
			phototrack_check_field_url($a, $table, $id_field, $field, $id, $row[$field]);
		}
	}

	phototrack_finished_row($table, $id);
}
/**
 * Returns the number of rows to process per table in one run.
 *
 * Uses the 'phototrack' / 'batch_size' config value when it is a positive
 * number, otherwise PHOTOTRACK_DEFAULT_BATCH_SIZE.
 *
 * @return int Always an integer, so the value is safe to embed in a LIMIT clause
 */
function phototrack_batch_size()
{
	// The config value is cast because callers interpolate it into SQL
	$batch_size = intval(DI::config()->get('phototrack', 'batch_size'));

	return ($batch_size > 0) ? $batch_size : PHOTOTRACK_DEFAULT_BATCH_SIZE;
}
2023-12-26 17:35:27 +01:00
/**
 * Checks one batch of rows of a table for photo uses.
 *
 * Selected are rows that have no phototrack_row_check entry yet, or whose
 * entry is older than one month, oldest first, limited to the batch size.
 *
 * @param mixed  $a        Passed through to phototrack_check_row()
 * @param string $table    Table to search; must be a trusted identifier
 * @param string $id_field Column identifying a row; must be a trusted identifier
 *
 * @return int Number of rows of this table that still have to be checked
 */
function phototrack_search_table($a, $table, $id_field)
{
	$batch_size = intval(phototrack_batch_size());

	// Shared by the batch query and the count query. The id column is quoted
	// because names like "uri-id" would otherwise be parsed as a subtraction.
	$from = "FROM `$table` LEFT OUTER JOIN phototrack_row_check"
		. " ON ( phototrack_row_check.`table` = ? AND phototrack_row_check.`row-id` = `$table`.`$id_field` )"
		. " WHERE ( ( phototrack_row_check.checked IS NULL )"
		. " OR ( phototrack_row_check.checked < DATE_SUB(NOW(), INTERVAL 1 MONTH) ) )";

	$searched = 0;
	$rows = DBA::p("SELECT `$table`.* $from ORDER BY phototrack_row_check.checked LIMIT $batch_size", $table);
	if (DBA::isResult($rows)) {
		while ($row = DBA::fetch($rows)) {
			phototrack_check_row($a, $table, $id_field, $row);
			$searched++;
		}
	}
	if (is_object($rows)) {
		DBA::close($rows);
	}

	// Counted after the batch was processed, so rows just checked are excluded.
	// The column needs an alias to be readable as 'count', and the single
	// result row must only be fetched once.
	$remaining = 0;
	$count = DBA::p("SELECT COUNT(*) AS `count` $from", $table);
	if (DBA::isResult($count)) {
		$result = DBA::fetch($count);
		if (is_array($result) && isset($result['count'])) {
			$remaining = intval($result['count']);
		}
	}
	if (is_object($count)) {
		DBA::close($count);
	}

	Logger::info('phototrack: searched ' . $searched . ' rows in table ' . $table . ', ' . $remaining . ' still remaining to search');

	return $remaining;
}
/**
 * Decides whether a search run is due.
 *
 * A run is due when the stored number of remaining items exceeds ten batches,
 * or when the configured search interval (in minutes, defaulting to
 * PHOTOTRACK_DEFAULT_SEARCH_INTERVAL) has passed since the last search.
 *
 * @return bool true when a search should run now
 */
function phototrack_cron_time()
{
	$backlog = DI::config()->get('phototrack', 'remaining_items');
	$backlog_limit = 10 * phototrack_batch_size();

	// A large backlog overrides the interval
	if ($backlog > $backlog_limit) {
		Logger::debug('phototrack: more than ' . $backlog_limit . ' items remaining');
		return true;
	}

	$last_search = DI::config()->get('phototrack', 'last_search');
	$interval_minutes = intval(DI::config()->get('phototrack', 'search_interval')) ?: PHOTOTRACK_DEFAULT_SEARCH_INTERVAL;

	// Without a stored last search there is nothing to wait for
	$too_early = $last_search && (($last_search + ($interval_minutes * 60)) > time());
	if ($too_early) {
		Logger::debug('phototrack: search interval not reached');
		return false;
	}

	Logger::debug('@@@ phototrack: search interval reached last ' . $last_search . ' search interval ' . $interval_minutes);

	return true;
}
/**
 * Handler registered for the 'cron' hook.
 *
 * Currently disabled: it returns immediately, so the code below the return is
 * never executed. When reached, that code would search every tracked table in
 * batches, store the number of rows left to search, and call phototrack_tidy()
 * once nothing is left.
 *
 * @param mixed $a Passed through to phototrack_search_table()
 * @param mixed $b Hook data; not used
 */
function phototrack_cron($a, $b)
{
	return; // @@@ something is broken

	if (!phototrack_cron_time()) {
		return;
	}

	DI::config()->set('phototrack', 'last_search', time());

	// Table => column that identifies a row, in search order
	$tables = [
		'post-content' => 'uri-id',
		'contact'      => 'id',
		'fcontact'     => 'id',
		'fsuggest'     => 'id',
		'gcontact'     => 'id',
	];

	$remaining = 0;
	foreach ($tables as $table => $id_field) {
		$remaining += phototrack_search_table($a, $table, $id_field);
	}

	DI::config()->set('phototrack', 'remaining_items', $remaining);

	if ($remaining === 0) {
		phototrack_tidy();
	}
}
/**
 * Deletes photos that are not recorded as used, and expires old use records.
 *
 * 1. Up to one batch of resource ids whose photo rows were created more than
 *    two months ago and that have no phototrack_photo_use entry are removed
 *    from the photo table.
 * 2. phototrack_photo_use entries not confirmed for two months are removed.
 *
 * NOTE(review): rows are deleted straight from the photo table; whether image
 * data stored elsewhere needs separate cleanup is not visible from this file.
 */
function phototrack_tidy()
{
	$batch_size = intval(phototrack_batch_size());

	// A run that aborted before the final DROP would leave stale rows behind
	DBA::e('DROP TABLE IF EXISTS `phototrack-temp`');
	DBA::e('CREATE TABLE IF NOT EXISTS `phototrack-temp` (`resource-id` char(255) not null)');
	DBA::e('INSERT INTO `phototrack-temp` SELECT DISTINCT(`resource-id`) FROM photo WHERE photo.`created` < DATE_SUB(NOW(), INTERVAL 2 MONTH)');

	// Collect the ids first so the statement is closed before rows are deleted.
	// DBA statements have to be read with DBA::fetch().
	$unused = [];
	$rows = DBA::p('SELECT `phototrack-temp`.`resource-id` FROM `phototrack-temp` LEFT OUTER JOIN phototrack_photo_use ON (`phototrack-temp`.`resource-id` = phototrack_photo_use.`resource-id`) WHERE phototrack_photo_use.id IS NULL LIMIT ' . $batch_size);
	if (DBA::isResult($rows)) {
		while ($row = DBA::fetch($rows)) {
			$unused[] = $row['resource-id'];
		}
	}
	if (is_object($rows)) {
		DBA::close($rows);
	}

	DBA::e('DROP TABLE `phototrack-temp`');

	foreach ($unused as $resource_id) {
		Logger::debug('phototrack: remove photo ' . $resource_id);
		DBA::delete('photo', ['resource-id' => $resource_id]);
	}
	if (count($unused) > 0) {
		Logger::info('phototrack_tidy: deleted ' . count($unused) . ' photos');
	}

	$expired = [];
	$rows = DBA::p('SELECT id FROM phototrack_photo_use WHERE checked < DATE_SUB(NOW(), INTERVAL 2 MONTH)');
	if (DBA::isResult($rows)) {
		while ($row = DBA::fetch($rows)) {
			$expired[] = $row['id'];
		}
	}
	if (is_object($rows)) {
		DBA::close($rows);
	}

	foreach ($expired as $use_id) {
		DBA::delete('phototrack_photo_use', ['id' => $use_id]);
	}
	Logger::info('phototrack_tidy: deleted ' . count($expired) . ' phototrack_photo_use rows');
}