2015-09-10 21:32:56 +00:00
< ? php
if ( ! file_exists ( " boot.php " ) AND ( sizeof ( $_SERVER [ " argv " ]) != 0 )) {
$directory = dirname ( $_SERVER [ " argv " ][ 0 ]);
if ( substr ( $directory , 0 , 1 ) != " / " )
$directory = $_SERVER [ " PWD " ] . " / " . $directory ;
$directory = realpath ( $directory . " /.. " );
chdir ( $directory );
}
require_once ( " boot.php " );
function cron_run ( & $argv , & $argc ){
global $a , $db ;
if ( is_null ( $a )) {
$a = new App ;
}
if ( is_null ( $db )) {
@ include ( " .htconfig.php " );
require_once ( " include/dba.php " );
$db = new dba ( $db_host , $db_user , $db_pass , $db_data );
unset ( $db_host , $db_user , $db_pass , $db_data );
};
require_once ( 'include/session.php' );
require_once ( 'include/datetime.php' );
require_once ( 'include/items.php' );
require_once ( 'include/Contact.php' );
require_once ( 'include/email.php' );
require_once ( 'include/socgraph.php' );
require_once ( 'mod/nodeinfo.php' );
2016-04-03 11:48:31 +00:00
require_once ( 'include/post_update.php' );
2015-09-10 21:32:56 +00:00
load_config ( 'config' );
load_config ( 'system' );
2016-03-07 23:20:06 +00:00
// Don't check this stuff if the function is called by the poller
if ( App :: callstack () != " poller_run " ) {
2016-03-08 19:28:09 +00:00
if ( App :: maxload_reached ())
return ;
2016-03-08 21:28:49 +00:00
if ( App :: is_already_running ( 'cron' , 'include/cron.php' , 540 ))
2016-03-08 19:28:09 +00:00
return ;
2015-09-10 21:32:56 +00:00
}
2015-09-11 19:35:58 +00:00
$last = get_config ( 'system' , 'last_cron' );
$poll_interval = intval ( get_config ( 'system' , 'cron_interval' ));
if ( ! $poll_interval )
$poll_interval = 10 ;
if ( $last ) {
$next = $last + ( $poll_interval * 60 );
if ( $next > time ()) {
logger ( 'cron intervall not reached' );
return ;
}
}
2015-09-10 21:32:56 +00:00
$a -> set_baseurl ( get_config ( 'system' , 'url' ));
load_hooks ();
logger ( 'cron: start' );
2015-09-11 19:35:58 +00:00
// run queue delivery process in the background
2016-08-27 21:05:38 +00:00
proc_run ( PRIORITY_NEGLIGIBLE , " include/queue.php " );
2015-09-11 19:35:58 +00:00
// run the process to discover global contacts in the background
2016-08-01 05:48:43 +00:00
proc_run ( PRIORITY_LOW , " include/discover_poco.php " );
2015-09-11 19:35:58 +00:00
// run the process to update locally stored global contacts in the background
2016-08-01 05:48:43 +00:00
proc_run ( PRIORITY_LOW , " include/discover_poco.php " , " checkcontact " );
2015-09-11 19:35:58 +00:00
2016-08-03 08:03:05 +00:00
// Expire and remove user entries
cron_expire_and_remove_users ();
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// If the worker is active, split the jobs in several sub processes
if ( get_config ( " system " , " worker " )) {
// Check OStatus conversations
proc_run ( PRIORITY_MEDIUM , " include/cronjobs.php " , " ostatus_mentions " );
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// Check every conversation
proc_run ( PRIORITY_MEDIUM , " include/cronjobs.php " , " ostatus_conversations " );
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// Call possible post update functions
proc_run ( PRIORITY_LOW , " include/cronjobs.php " , " post_update " );
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// update nodeinfo data
proc_run ( PRIORITY_LOW , " include/cronjobs.php " , " nodeinfo " );
} else {
// Check OStatus conversations
// Check only conversations with mentions (for a longer time)
ostatus :: check_conversations ( true );
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// Check every conversation
ostatus :: check_conversations ( false );
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// Call possible post update functions
// see include/post_update.php for more details
post_update ();
2015-09-10 21:32:56 +00:00
2016-08-03 08:03:05 +00:00
// update nodeinfo data
nodeinfo_cron ();
}
2015-09-10 21:32:56 +00:00
// once daily run birthday_updates and then expire in background
$d1 = get_config ( 'system' , 'last_expire_day' );
$d2 = intval ( datetime_convert ( 'UTC' , 'UTC' , 'now' , 'd' ));
if ( $d2 != intval ( $d1 )) {
update_contact_birthdays ();
2016-08-01 05:48:43 +00:00
proc_run ( PRIORITY_LOW , " include/discover_poco.php " , " suggestions " );
2015-09-10 21:32:56 +00:00
set_config ( 'system' , 'last_expire_day' , $d2 );
2015-11-07 16:52:52 +00:00
2016-08-01 05:48:43 +00:00
proc_run ( PRIORITY_LOW , 'include/expire.php' );
2016-10-19 21:06:37 +00:00
proc_run ( PRIORITY_LOW , 'include/dbclean.php' );
2015-09-10 21:32:56 +00:00
}
2016-01-15 22:27:25 +00:00
// Clear cache entries
cron_clear_cache ( $a );
2015-09-10 21:32:56 +00:00
2016-01-15 22:27:25 +00:00
// Repair missing Diaspora values in contacts
cron_repair_diaspora ( $a );
2016-01-10 22:08:25 +00:00
2016-01-23 21:05:27 +00:00
// Repair entries in the database
cron_repair_database ();
2016-08-02 04:28:34 +00:00
// Poll contacts
cron_poll_contacts ( $argc , $argv );
logger ( 'cron: end' );
set_config ( 'system' , 'last_cron' , time ());
return ;
}
2016-08-03 08:03:05 +00:00
/**
* @ brief Expire and remove user entries
*/
function cron_expire_and_remove_users () {
// expire any expired accounts
q ( " UPDATE user SET `account_expired` = 1 where `account_expired` = 0
AND `account_expires_on` != '0000-00-00 00:00:00'
AND `account_expires_on` < UTC_TIMESTAMP () " );
// delete user and contact records for recently removed accounts
$r = q ( " SELECT * FROM `user` WHERE `account_removed` AND `account_expires_on` < UTC_TIMESTAMP() - INTERVAL 3 DAY " );
if ( $r ) {
foreach ( $r as $user ) {
q ( " DELETE FROM `contact` WHERE `uid` = %d " , intval ( $user [ 'uid' ]));
q ( " DELETE FROM `user` WHERE `uid` = %d " , intval ( $user [ 'uid' ]));
}
}
}
2016-08-02 04:28:34 +00:00
/**
2016-08-02 08:19:10 +00:00
* @ brief Poll contacts for unreceived messages
2016-08-02 04:28:34 +00:00
*
2016-08-02 08:19:10 +00:00
* @ param Integer $argc Number of command line arguments
* @ param Array $argv Array of command line arguments
2016-08-02 04:28:34 +00:00
*/
function cron_poll_contacts ( $argc , $argv ) {
2015-09-10 21:32:56 +00:00
$manual_id = 0 ;
$generation = 0 ;
$force = false ;
$restart = false ;
2016-08-02 04:28:34 +00:00
if (( $argc > 1 ) && ( $argv [ 1 ] == 'force' ))
2015-09-10 21:32:56 +00:00
$force = true ;
2016-08-02 04:28:34 +00:00
if (( $argc > 1 ) && ( $argv [ 1 ] == 'restart' )) {
2015-09-10 21:32:56 +00:00
$restart = true ;
$generation = intval ( $argv [ 2 ]);
2016-08-02 04:28:34 +00:00
if ( ! $generation )
2015-09-10 21:32:56 +00:00
killme ();
}
2016-08-02 04:28:34 +00:00
if (( $argc > 1 ) && intval ( $argv [ 1 ])) {
2015-09-10 21:32:56 +00:00
$manual_id = intval ( $argv [ 1 ]);
$force = true ;
}
$interval = intval ( get_config ( 'system' , 'poll_interval' ));
2016-08-02 04:28:34 +00:00
if ( ! $interval )
2015-09-10 21:32:56 +00:00
$interval = (( get_config ( 'system' , 'delivery_interval' ) === false ) ? 3 : intval ( get_config ( 'system' , 'delivery_interval' )));
2015-09-12 16:08:03 +00:00
// If we are using the worker we don't need a delivery interval
if ( get_config ( " system " , " worker " ))
$interval = false ;
2015-09-10 21:32:56 +00:00
$sql_extra = (( $manual_id ) ? " AND `id` = $manual_id " : " " );
reload_plugins ();
$d = datetime_convert ();
// Only poll from those with suitable relationships,
// and which have a polling address and ignore Diaspora since
// we are unable to match those posts with a Diaspora GUID and prevent duplicates.
2016-08-03 08:03:05 +00:00
$abandon_days = intval ( get_config ( 'system' , 'account_abandon_days' ));
if ( $abandon_days < 1 )
$abandon_days = 0 ;
2015-09-10 21:32:56 +00:00
$abandon_sql = (( $abandon_days )
? sprintf ( " AND `user`.`login_date` > UTC_TIMESTAMP() - INTERVAL %d DAY " , intval ( $abandon_days ))
: ''
);
$contacts = q ( " SELECT `contact`.`id` FROM `contact` INNER JOIN `user` ON `user`.`uid` = `contact`.`uid`
WHERE `rel` IN ( % d , % d ) AND `poll` != '' AND `network` IN ( '%s' , '%s' , '%s' , '%s' , '%s' , '%s' )
$sql_extra
AND NOT `self` AND NOT `contact` . `blocked` AND NOT `contact` . `readonly` AND NOT `contact` . `archive`
AND NOT `user` . `account_expired` AND NOT `user` . `account_removed` $abandon_sql ORDER BY RAND () " ,
intval ( CONTACT_IS_SHARING ),
intval ( CONTACT_IS_FRIEND ),
dbesc ( NETWORK_DFRN ),
dbesc ( NETWORK_ZOT ),
dbesc ( NETWORK_OSTATUS ),
dbesc ( NETWORK_FEED ),
dbesc ( NETWORK_MAIL ),
dbesc ( NETWORK_MAIL2 )
);
2016-08-02 04:28:34 +00:00
if ( ! count ( $contacts )) {
2015-09-10 21:32:56 +00:00
return ;
}
2016-08-02 04:28:34 +00:00
foreach ( $contacts as $c ) {
2015-09-10 21:32:56 +00:00
$res = q ( " SELECT * FROM `contact` WHERE `id` = %d LIMIT 1 " ,
intval ( $c [ 'id' ])
);
if (( ! $res ) || ( ! count ( $res )))
continue ;
foreach ( $res as $contact ) {
$xml = false ;
if ( $manual_id )
$contact [ 'last-update' ] = '0000-00-00 00:00:00' ;
if ( in_array ( $contact [ 'network' ], array ( NETWORK_DFRN , NETWORK_ZOT , NETWORK_OSTATUS )))
$contact [ 'priority' ] = 2 ;
if ( $contact [ 'subhub' ] AND in_array ( $contact [ 'network' ], array ( NETWORK_DFRN , NETWORK_ZOT , NETWORK_OSTATUS ))) {
// We should be getting everything via a hub. But just to be sure, let's check once a day.
// (You can make this more or less frequent if desired by setting 'pushpoll_frequency' appropriately)
// This also lets us update our subscription to the hub, and add or replace hubs in case it
// changed. We will only update hubs once a day, regardless of 'pushpoll_frequency'.
$poll_interval = get_config ( 'system' , 'pushpoll_frequency' );
$contact [ 'priority' ] = (( $poll_interval !== false ) ? intval ( $poll_interval ) : 3 );
}
if ( $contact [ 'priority' ] AND ! $force ) {
$update = false ;
$t = $contact [ 'last-update' ];
/**
* Based on $contact [ 'priority' ], should we poll this site now ? Or later ?
*/
switch ( $contact [ 'priority' ]) {
case 5 :
if ( datetime_convert ( 'UTC' , 'UTC' , 'now' ) > datetime_convert ( 'UTC' , 'UTC' , $t . " + 1 month " ))
$update = true ;
break ;
case 4 :
if ( datetime_convert ( 'UTC' , 'UTC' , 'now' ) > datetime_convert ( 'UTC' , 'UTC' , $t . " + 1 week " ))
$update = true ;
break ;
case 3 :
if ( datetime_convert ( 'UTC' , 'UTC' , 'now' ) > datetime_convert ( 'UTC' , 'UTC' , $t . " + 1 day " ))
$update = true ;
break ;
case 2 :
if ( datetime_convert ( 'UTC' , 'UTC' , 'now' ) > datetime_convert ( 'UTC' , 'UTC' , $t . " + 12 hour " ))
$update = true ;
break ;
case 1 :
default :
if ( datetime_convert ( 'UTC' , 'UTC' , 'now' ) > datetime_convert ( 'UTC' , 'UTC' , $t . " + 1 hour " ))
$update = true ;
break ;
}
2016-08-02 04:28:34 +00:00
if ( ! $update )
2015-09-10 21:32:56 +00:00
continue ;
}
logger ( " Polling " . $contact [ " network " ] . " " . $contact [ " id " ] . " " . $contact [ " nick " ] . " " . $contact [ " name " ]);
2016-08-01 05:48:43 +00:00
proc_run ( PRIORITY_MEDIUM , 'include/onepoll.php' , $contact [ 'id' ]);
2015-09-10 21:32:56 +00:00
if ( $interval )
@ time_sleep_until ( microtime ( true ) + ( float ) $interval );
}
}
}
2016-01-15 22:27:25 +00:00
/**
* @ brief Clear cache entries
*
* @ param App $a
*/
function cron_clear_cache ( & $a ) {
$last = get_config ( 'system' , 'cache_last_cleared' );
if ( $last ) {
$next = $last + ( 3600 ); // Once per hour
$clear_cache = ( $next <= time ());
} else
$clear_cache = true ;
if ( ! $clear_cache )
return ;
// clear old cache
Cache :: clear ();
// clear old item cache files
clear_cache ();
// clear cache for photos
clear_cache ( $a -> get_basepath (), $a -> get_basepath () . " /photo " );
// clear smarty cache
clear_cache ( $a -> get_basepath () . " /view/smarty3/compiled " , $a -> get_basepath () . " /view/smarty3/compiled " );
// clear cache for image proxy
if ( ! get_config ( " system " , " proxy_disabled " )) {
clear_cache ( $a -> get_basepath (), $a -> get_basepath () . " /proxy " );
$cachetime = get_config ( 'system' , 'proxy_cache_time' );
if ( ! $cachetime ) $cachetime = PROXY_DEFAULT_TIME ;
q ( 'DELETE FROM `photo` WHERE `uid` = 0 AND `resource-id` LIKE "pic:%%" AND `created` < NOW() - INTERVAL %d SECOND' , $cachetime );
}
// Delete the cached OEmbed entries that are older than one year
2016-10-19 21:06:37 +00:00
q ( " DELETE FROM `oembed` WHERE `created` < NOW() - INTERVAL 3 MONTH " );
2016-01-15 22:27:25 +00:00
// Delete the cached "parse_url" entries that are older than one year
2016-10-19 21:06:37 +00:00
q ( " DELETE FROM `parsed_url` WHERE `created` < NOW() - INTERVAL 3 MONTH " );
2016-01-15 22:27:25 +00:00
// Maximum table size in megabyte
$max_tablesize = intval ( get_config ( 'system' , 'optimize_max_tablesize' )) * 1000000 ;
if ( $max_tablesize == 0 )
$max_tablesize = 100 * 1000000 ; // Default are 100 MB
2016-04-01 19:09:52 +00:00
if ( $max_tablesize > 0 ) {
// Minimum fragmentation level in percent
$fragmentation_level = intval ( get_config ( 'system' , 'optimize_fragmentation' )) / 100 ;
if ( $fragmentation_level == 0 )
$fragmentation_level = 0.3 ; // Default value is 30%
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// Optimize some tables that need to be optimized
$r = q ( " SHOW TABLE STATUS " );
foreach ( $r as $table ) {
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// Don't optimize tables that are too large
if ( $table [ " Data_length " ] > $max_tablesize )
continue ;
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// Don't optimize empty tables
if ( $table [ " Data_length " ] == 0 )
continue ;
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// Calculate fragmentation
$fragmentation = $table [ " Data_free " ] / ( $table [ " Data_length " ] + $table [ " Index_length " ]);
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
logger ( " Table " . $table [ " Name " ] . " - Fragmentation level: " . round ( $fragmentation * 100 , 2 ), LOGGER_DEBUG );
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// Don't optimize tables that needn't to be optimized
if ( $fragmentation < $fragmentation_level )
continue ;
2016-01-15 22:27:25 +00:00
2016-04-01 19:09:52 +00:00
// So optimize it
logger ( " Optimize Table " . $table [ " Name " ], LOGGER_DEBUG );
q ( " OPTIMIZE TABLE `%s` " , dbesc ( $table [ " Name " ]));
}
2016-01-15 22:27:25 +00:00
}
set_config ( 'system' , 'cache_last_cleared' , time ());
}
/**
* @ brief Repair missing values in Diaspora contacts
*
* @ param App $a
*/
function cron_repair_diaspora ( & $a ) {
$r = q ( " SELECT `id`, `url` FROM `contact`
WHERE `network` = '%s' AND ( `batch` = '' OR `notify` = '' OR `poll` = '' OR pubkey = '' )
ORDER BY RAND () LIMIT 50 " , dbesc(NETWORK_DIASPORA));
if ( $r ) {
foreach ( $r AS $contact ) {
if ( poco_reachable ( $contact [ " url " ])) {
$data = probe_url ( $contact [ " url " ]);
if ( $data [ " network " ] == NETWORK_DIASPORA ) {
logger ( " Repair contact " . $contact [ " id " ] . " " . $contact [ " url " ], LOGGER_DEBUG );
q ( " UPDATE `contact` SET `batch` = '%s', `notify` = '%s', `poll` = '%s', pubkey = '%s' WHERE `id` = %d " ,
dbesc ( $data [ " batch " ]), dbesc ( $data [ " notify " ]), dbesc ( $data [ " poll " ]), dbesc ( $data [ " pubkey " ]),
intval ( $contact [ " id " ]));
}
}
}
}
}
2016-01-23 21:05:27 +00:00
/**
* @ brief Do some repairs in database entries
*
*/
function cron_repair_database () {
// Set the parent if it wasn't set. (Shouldn't happen - but does sometimes)
// This call is very "cheap" so we can do it at any time without a problem
q ( " UPDATE `item` INNER JOIN `item` AS `parent` ON `parent`.`uri` = `item`.`parent-uri` AND `parent`.`uid` = `item`.`uid` SET `item`.`parent` = `parent`.`id` WHERE `item`.`parent` = 0 " );
2016-04-02 13:41:55 +00:00
// There was an issue where the nick vanishes from the contact table
q ( " UPDATE `contact` INNER JOIN `user` ON `contact`.`uid` = `user`.`uid` SET `nick` = `nickname` WHERE `self` AND `nick`='' " );
2016-05-05 13:38:28 +00:00
// Update the global contacts for local users
$r = q ( " SELECT `uid` FROM `user` WHERE `verified` AND NOT `blocked` AND NOT `account_removed` AND NOT `account_expired` " );
if ( $r )
foreach ( $r AS $user )
update_gcontact_for_user ( $user [ " uid " ]);
2016-01-23 21:05:27 +00:00
/// @todo
2016-01-24 06:57:36 +00:00
/// - remove thread entries without item
/// - remove sign entries without item
/// - remove children when parent got lost
/// - set contact-id in item when not present
2016-01-23 21:05:27 +00:00
}
2015-09-10 21:32:56 +00:00
if ( array_search ( __file__ , get_included_files ()) === 0 ){
2015-09-12 18:22:58 +00:00
cron_run ( $_SERVER [ " argv " ], $_SERVER [ " argc " ]);
killme ();
2015-09-10 21:32:56 +00:00
}