Speed up of OStatus transmission/Ignoring "created" with remote self

This commit is contained in:
Michael 2017-08-03 05:42:44 +00:00
parent 390e34d587
commit a80329b416
4 changed files with 100 additions and 85 deletions

View file

@ -623,11 +623,11 @@ function item_store($arr, $force_parent = false, $notify = false, $dontcache = f
$arr['owner-name'] = ((x($arr, 'owner-name')) ? trim($arr['owner-name']) : ''); $arr['owner-name'] = ((x($arr, 'owner-name')) ? trim($arr['owner-name']) : '');
$arr['owner-link'] = ((x($arr, 'owner-link')) ? notags(trim($arr['owner-link'])) : ''); $arr['owner-link'] = ((x($arr, 'owner-link')) ? notags(trim($arr['owner-link'])) : '');
$arr['owner-avatar'] = ((x($arr, 'owner-avatar')) ? notags(trim($arr['owner-avatar'])) : ''); $arr['owner-avatar'] = ((x($arr, 'owner-avatar')) ? notags(trim($arr['owner-avatar'])) : '');
$arr['created'] = ((x($arr, 'created') !== false) ? datetime_convert('UTC','UTC', $arr['created']) : datetime_convert());
$arr['edited'] = ((x($arr, 'edited') !== false) ? datetime_convert('UTC','UTC', $arr['edited']) : datetime_convert());
$arr['commented'] = ((x($arr, 'commented') !== false) ? datetime_convert('UTC','UTC', $arr['commented']) : datetime_convert());
$arr['received'] = ((x($arr, 'received') !== false) ? datetime_convert('UTC','UTC', $arr['received']) : datetime_convert()); $arr['received'] = ((x($arr, 'received') !== false) ? datetime_convert('UTC','UTC', $arr['received']) : datetime_convert());
$arr['changed'] = ((x($arr, 'changed') !== false) ? datetime_convert('UTC','UTC', $arr['changed']) : datetime_convert()); $arr['created'] = ((x($arr, 'created') !== false) ? datetime_convert('UTC','UTC', $arr['created']) : $arr['received']);
$arr['edited'] = ((x($arr, 'edited') !== false) ? datetime_convert('UTC','UTC', $arr['edited']) : $arr['created']);
$arr['changed'] = ((x($arr, 'changed') !== false) ? datetime_convert('UTC','UTC', $arr['changed']) : $arr['created']);
$arr['commented'] = ((x($arr, 'commented') !== false) ? datetime_convert('UTC','UTC', $arr['commented']) : $arr['created']);
$arr['title'] = ((x($arr, 'title')) ? trim($arr['title']) : ''); $arr['title'] = ((x($arr, 'title')) ? trim($arr['title']) : '');
$arr['location'] = ((x($arr, 'location')) ? trim($arr['location']) : ''); $arr['location'] = ((x($arr, 'location')) ? trim($arr['location']) : '');
$arr['coord'] = ((x($arr, 'coord')) ? notags(trim($arr['coord'])) : ''); $arr['coord'] = ((x($arr, 'coord')) ? notags(trim($arr['coord'])) : '');
@ -1640,6 +1640,9 @@ function item_is_remote_self($contact, &$datarray) {
$datarray['author-name'] = $datarray['owner-name']; $datarray['author-name'] = $datarray['owner-name'];
$datarray['author-link'] = $datarray['owner-link']; $datarray['author-link'] = $datarray['owner-link'];
$datarray['author-avatar'] = $datarray['owner-avatar']; $datarray['author-avatar'] = $datarray['owner-avatar'];
unset($datarray['created']);
unset($datarray['edited']);
} }
if ($contact['network'] != NETWORK_FEED) { if ($contact['network'] != NETWORK_FEED) {

View file

@ -21,6 +21,7 @@ require_once 'include/follow.php';
require_once 'include/api.php'; require_once 'include/api.php';
require_once 'mod/proxy.php'; require_once 'mod/proxy.php';
require_once 'include/xml.php'; require_once 'include/xml.php';
require_once 'include/cache.php';
/** /**
* @brief This class contain functions for the OStatus protocol * @brief This class contain functions for the OStatus protocol
@ -195,7 +196,7 @@ class ostatus {
link_gcontact($gcid, $contact["uid"], $contact["id"]); link_gcontact($gcid, $contact["uid"], $contact["id"]);
} }
return($author); return $author;
} }
/** /**
@ -677,14 +678,14 @@ class ostatus {
if ((count($elements) == 4) && ($elements[2] == "post")) if ((count($elements) == 4) && ($elements[2] == "post"))
return "http://".$server[0]."/notice/".$elements[3]; return "http://".$server[0]."/notice/".$elements[3];
if ((count($conversation) != 2) || ($conversation[1] =="")) if ((count($conversation) != 2) || ($conversation[1] =="")) {
return $href; return $href;
}
if ($elements[3] == "objectType=thread") if ($elements[3] == "objectType=thread") {
return "http://".$server[0]."/conversation/".$conversation[1]; return "http://".$server[0]."/conversation/".$conversation[1];
else } else {
return "http://".$server[0]."/notice/".$conversation[1]; return "http://".$server[0]."/notice/".$conversation[1];
}
return $href; return $href;
} }
@ -946,9 +947,9 @@ class ostatus {
STRAIGHT_JOIN `item` ON `item`.`parent` = `thritem`.`parent` STRAIGHT_JOIN `item` ON `item`.`parent` = `thritem`.`parent`
WHERE `term`.`uid` = %d AND `term`.`otype` = %d AND `term`.`type` = %d AND `term`.`url` = '%s'", WHERE `term`.`uid` = %d AND `term`.`otype` = %d AND `term`.`type` = %d AND `term`.`url` = '%s'",
intval($uid), intval(TERM_OBJ_POST), intval(TERM_CONVERSATION), dbesc($conversation_url)); intval($uid), intval(TERM_OBJ_POST), intval(TERM_CONVERSATION), dbesc($conversation_url));
if ($parents) if ($parents) {
$parent = $parents[0]; $parent = $parents[0];
elseif (count($item) > 0) { } elseif (count($item) > 0) {
$parent = $item; $parent = $item;
$parent["type"] = "remote"; $parent["type"] = "remote";
$parent["verb"] = ACTIVITY_POST; $parent["verb"] = ACTIVITY_POST;
@ -956,9 +957,9 @@ class ostatus {
} else { } else {
// Preset the parent // Preset the parent
$r = q("SELECT `id` FROM `contact` WHERE `self` AND `uid`=%d", $uid); $r = q("SELECT `id` FROM `contact` WHERE `self` AND `uid`=%d", $uid);
if (!$r) if (!dbm::is_result($r)) {
return(-2); return -2;
}
$parent = array(); $parent = array();
$parent["id"] = 0; $parent["id"] = 0;
$parent["parent"] = 0; $parent["parent"] = 0;
@ -985,9 +986,9 @@ class ostatus {
} elseif (!$conv_arr["success"] && (substr($conv, 0, 8) == "https://")) { } elseif (!$conv_arr["success"] && (substr($conv, 0, 8) == "https://")) {
$conv = str_replace("https://", "http://", $conv); $conv = str_replace("https://", "http://", $conv);
$conv_as = fetch_url($conv."?page=".$pageno); $conv_as = fetch_url($conv."?page=".$pageno);
} else } else {
$conv_as = $conv_arr["body"]; $conv_as = $conv_arr["body"];
}
$conv_as = str_replace(',"statusnet:notice_info":', ',"statusnet_notice_info":', $conv_as); $conv_as = str_replace(',"statusnet:notice_info":', ',"statusnet_notice_info":', $conv_as);
$conv_as = json_decode($conv_as); $conv_as = json_decode($conv_as);
@ -1015,9 +1016,10 @@ class ostatus {
self::store_conversation($item_id, $conversation_url); self::store_conversation($item_id, $conversation_url);
} }
return($item_stored); return $item_stored;
} else } else {
return(-3); return -3;
}
} }
$items = array_reverse($items); $items = array_reverse($items);
@ -1197,17 +1199,17 @@ class ostatus {
$arr['conversation-uri'] = $single_conv->status_net->conversation; $arr['conversation-uri'] = $single_conv->status_net->conversation;
} }
if (isset($single_conv->status_net->notice_info->source)) if (isset($single_conv->status_net->notice_info->source)) {
$arr["app"] = strip_tags($single_conv->status_net->notice_info->source); $arr["app"] = strip_tags($single_conv->status_net->notice_info->source);
elseif (isset($single_conv->statusnet->notice_info->source)) } elseif (isset($single_conv->statusnet->notice_info->source)) {
$arr["app"] = strip_tags($single_conv->statusnet->notice_info->source); $arr["app"] = strip_tags($single_conv->statusnet->notice_info->source);
elseif (isset($single_conv->statusnet_notice_info->source)) } elseif (isset($single_conv->statusnet_notice_info->source)) {
$arr["app"] = strip_tags($single_conv->statusnet_notice_info->source); $arr["app"] = strip_tags($single_conv->statusnet_notice_info->source);
elseif (isset($single_conv->provider->displayName)) } elseif (isset($single_conv->provider->displayName)) {
$arr["app"] = $single_conv->provider->displayName; $arr["app"] = $single_conv->provider->displayName;
else } else {
$arr["app"] = "OStatus"; $arr["app"] = "OStatus";
}
$arr["source"] = json_encode($single_conv); $arr["source"] = json_encode($single_conv);
$arr["protocol"] = PROTOCOL_GS_CONVERSATION; $arr["protocol"] = PROTOCOL_GS_CONVERSATION;
@ -1324,7 +1326,7 @@ class ostatus {
} }
} }
return($item_stored); return $item_stored;
} }
/** /**
@ -1367,16 +1369,16 @@ class ostatus {
// Skip if it isn't a pure repeated messages // Skip if it isn't a pure repeated messages
// Does it start with a share? // Does it start with a share?
if (strpos($body, "[share") > 0) if (strpos($body, "[share") > 0)
return(""); return "";
// Does it end with a share? // Does it end with a share?
if (strlen($body) > (strrpos($body, "[/share]") + 8)) if (strlen($body) > (strrpos($body, "[/share]") + 8))
return(""); return "";
$attributes = preg_replace("/\[share(.*?)\]\s?(.*?)\s?\[\/share\]\s?/ism","$1",$body); $attributes = preg_replace("/\[share(.*?)\]\s?(.*?)\s?\[\/share\]\s?/ism","$1",$body);
// Skip if there is no shared message in there // Skip if there is no shared message in there
if ($body == $attributes) if ($body == $attributes)
return(false); return false;
$guid = ""; $guid = "";
preg_match("/guid='(.*?)'/ism", $attributes, $matches); preg_match("/guid='(.*?)'/ism", $attributes, $matches);
@ -1543,7 +1545,7 @@ class ostatus {
break; break;
} }
if (($siteinfo["type"] != "photo") && isset($siteinfo["image"])) { if (!Config::get('system', 'ostatus_not_attach_preview') && ($siteinfo["type"] != "photo") && isset($siteinfo["image"])) {
$imgdata = get_photo_info($siteinfo["image"]); $imgdata = get_photo_info($siteinfo["image"]);
$attributes = array("rel" => "enclosure", $attributes = array("rel" => "enclosure",
"href" => $siteinfo["image"], "href" => $siteinfo["image"],
@ -1586,9 +1588,9 @@ class ostatus {
private function add_author($doc, $owner) { private function add_author($doc, $owner) {
$r = q("SELECT `homepage`, `publish` FROM `profile` WHERE `uid` = %d AND `is-default` LIMIT 1", intval($owner["uid"])); $r = q("SELECT `homepage`, `publish` FROM `profile` WHERE `uid` = %d AND `is-default` LIMIT 1", intval($owner["uid"]));
if ($r) if (dbm::is_result($r)) {
$profile = $r[0]; $profile = $r[0];
}
$author = $doc->createElement("author"); $author = $doc->createElement("author");
xml::add_element($doc, $author, "id", $owner["url"]); xml::add_element($doc, $author, "id", $owner["url"]);
xml::add_element($doc, $author, "activity:object-type", ACTIVITY_OBJ_PERSON); xml::add_element($doc, $author, "activity:object-type", ACTIVITY_OBJ_PERSON);
@ -1743,22 +1745,22 @@ class ostatus {
$r = q("SELECT * FROM `contact` WHERE `nurl` = '%s' AND `uid` IN (0, %d) ORDER BY `uid` DESC LIMIT 1", $r = q("SELECT * FROM `contact` WHERE `nurl` = '%s' AND `uid` IN (0, %d) ORDER BY `uid` DESC LIMIT 1",
dbesc(normalise_link($url)), intval($owner["uid"])); dbesc(normalise_link($url)), intval($owner["uid"]));
if ($r) { if (dbm::is_result($r)) {
$contact = $r[0]; $contact = $r[0];
$contact["uid"] = -1; $contact["uid"] = -1;
} }
if (!$r) { if (!dbm::is_result($r)) {
$r = q("SELECT * FROM `gcontact` WHERE `nurl` = '%s' LIMIT 1", $r = q("SELECT * FROM `gcontact` WHERE `nurl` = '%s' LIMIT 1",
dbesc(normalise_link($url))); dbesc(normalise_link($url)));
if ($r) { if (dbm::is_result($r)) {
$contact = $r[0]; $contact = $r[0];
$contact["uid"] = -1; $contact["uid"] = -1;
$contact["success_update"] = $contact["updated"]; $contact["success_update"] = $contact["updated"];
} }
} }
if (!$r) if (!dbm::is_result($r))
$contact = owner; $contact = owner;
if (!isset($contact["poll"])) { if (!isset($contact["poll"])) {
@ -1797,11 +1799,11 @@ class ostatus {
$r = q("SELECT * FROM `item` WHERE `uid` = %d AND `guid` = '%s' AND NOT `private` AND `network` IN ('%s', '%s', '%s') LIMIT 1", $r = q("SELECT * FROM `item` WHERE `uid` = %d AND `guid` = '%s' AND NOT `private` AND `network` IN ('%s', '%s', '%s') LIMIT 1",
intval($owner["uid"]), dbesc($repeated_guid), intval($owner["uid"]), dbesc($repeated_guid),
dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA), dbesc(NETWORK_OSTATUS)); dbesc(NETWORK_DFRN), dbesc(NETWORK_DIASPORA), dbesc(NETWORK_OSTATUS));
if ($r) if (dbm::is_result($r)) {
$repeated_item = $r[0]; $repeated_item = $r[0];
else } else {
return false; return false;
}
$contact = self::contact_entry($repeated_item['author-link'], $owner); $contact = self::contact_entry($repeated_item['author-link'], $owner);
$parent_item = (($item['thr-parent']) ? $item['thr-parent'] : $item['parent-uri']); $parent_item = (($item['thr-parent']) ? $item['thr-parent'] : $item['parent-uri']);
@ -2227,19 +2229,33 @@ class ostatus {
* *
* @return string XML feed * @return string XML feed
*/ */
public static function feed(App $a, $owner_nick, $last_update) { public static function feed(App $a, $owner_nick, &$last_update) {
$stamp = microtime(true);
$cachekey = "ostatus:feed:".$owner_nick.":".$last_update;
$previous_created = $last_update;
$result = Cache::get($cachekey);
if (!is_null($result)) {
logger('Feed duration: '.number_format(microtime(true) - $stamp, 3).' - '.$owner_nick.' - '.$previous_created.' (cached)', LOGGER_DEBUG);
$last_update = $result['last_update'];
return $result['feed'];
}
$r = q("SELECT `contact`.*, `user`.`nickname`, `user`.`timezone`, `user`.`page-flags` $r = q("SELECT `contact`.*, `user`.`nickname`, `user`.`timezone`, `user`.`page-flags`
FROM `contact` INNER JOIN `user` ON `user`.`uid` = `contact`.`uid` FROM `contact` INNER JOIN `user` ON `user`.`uid` = `contact`.`uid`
WHERE `contact`.`self` AND `user`.`nickname` = '%s' LIMIT 1", WHERE `contact`.`self` AND `user`.`nickname` = '%s' LIMIT 1",
dbesc($owner_nick)); dbesc($owner_nick));
if (!$r) if (!dbm::is_result($r)) {
return; return;
}
$owner = $r[0]; $owner = $r[0];
if (!strlen($last_update)) if (!strlen($last_update)) {
$last_update = 'now -30 days'; $last_update = 'now -30 days';
}
$check_date = datetime_convert('UTC','UTC',$last_update,'Y-m-d H:i:s'); $check_date = datetime_convert('UTC','UTC',$last_update,'Y-m-d H:i:s');
$authorid = get_contact($owner["url"], 0); $authorid = get_contact($owner["url"], 0);
@ -2255,28 +2271,6 @@ class ostatus {
intval($authorid), dbesc($check_date), intval($authorid), dbesc($check_date),
dbesc(NETWORK_OSTATUS), dbesc(NETWORK_DFRN)); dbesc(NETWORK_OSTATUS), dbesc(NETWORK_DFRN));
/* 2016-10-23: The old query will be kept until we are sure that the query above is a good and fast replacement
$items = q("SELECT `item`.*, `item`.`id` AS `item_id` FROM `item`
STRAIGHT_JOIN `thread` ON `thread`.`iid` = `item`.`parent`
LEFT JOIN `item` AS `thritem` ON `thritem`.`uri`=`item`.`thr-parent` AND `thritem`.`uid`=`item`.`uid`
WHERE `item`.`uid` = %d AND `item`.`received` > '%s' AND NOT `item`.`private` AND NOT `item`.`deleted`
AND `item`.`allow_cid` = '' AND `item`.`allow_gid` = '' AND `item`.`deny_cid` = '' AND `item`.`deny_gid` = ''
AND ((`item`.`wall` AND (`item`.`parent` = `item`.`id`))
OR (`item`.`network` = '%s' AND ((`thread`.`network` IN ('%s', '%s')) OR (`thritem`.`network` IN ('%s', '%s')))) AND `thread`.`mention`)
AND ((`item`.`owner-link` IN ('%s', '%s') AND (`item`.`parent` = `item`.`id`))
OR (`item`.`author-link` IN ('%s', '%s')))
ORDER BY `item`.`id` DESC
LIMIT 0, 300",
intval($owner["uid"]), dbesc($check_date), dbesc(NETWORK_DFRN),
//dbesc(NETWORK_OSTATUS), dbesc(NETWORK_OSTATUS),
//dbesc(NETWORK_OSTATUS), dbesc(NETWORK_OSTATUS),
dbesc(NETWORK_OSTATUS), dbesc(NETWORK_DFRN),
dbesc(NETWORK_OSTATUS), dbesc(NETWORK_DFRN),
dbesc($owner["nurl"]), dbesc(str_replace("http://", "https://", $owner["nurl"])),
dbesc($owner["nurl"]), dbesc(str_replace("http://", "https://", $owner["nurl"]))
);
*/
$doc = new DOMDocument('1.0', 'utf-8'); $doc = new DOMDocument('1.0', 'utf-8');
$doc->formatOutput = true; $doc->formatOutput = true;
@ -2288,9 +2282,20 @@ class ostatus {
} }
$entry = self::entry($doc, $item, $owner); $entry = self::entry($doc, $item, $owner);
$root->appendChild($entry); $root->appendChild($entry);
if ($last_update < $item['created']) {
$last_update = $item['created'];
}
} }
return(trim($doc->saveXML())); $feeddata = trim($doc->saveXML());
$msg = array('feed' => $feeddata, 'last_update' => $last_update);
Cache::set($cachekey, $msg, CACHE_QUARTER_HOUR);
logger('Feed duration: '.number_format(microtime(true) - $stamp, 3).' - '.$owner_nick.' - '.$previous_created, LOGGER_DEBUG);
return $feeddata;
} }
/** /**
@ -2314,6 +2319,6 @@ class ostatus {
$doc->appendChild($entry); $doc->appendChild($entry);
return(trim($doc->saveXML())); return trim($doc->saveXML());
} }
} }

View file

@ -273,7 +273,9 @@ function poller_exec_function($queue, $funcname, $argv) {
$argc = count($argv); $argc = count($argv);
logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." ".$queue["parameter"]); $new_process_id = uniqid("wrk", true);
logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." ".$queue["parameter"]." - Process PID: ".$new_process_id);
$stamp = (float)microtime(true); $stamp = (float)microtime(true);
@ -295,7 +297,7 @@ function poller_exec_function($queue, $funcname, $argv) {
// For better logging create a new process id for every worker call // For better logging create a new process id for every worker call
// But preserve the old one for the worker // But preserve the old one for the worker
$old_process_id = $a->process_id; $old_process_id = $a->process_id;
$a->process_id = uniqid("wrk", true); $a->process_id = $new_process_id;
$a->queue = $queue; $a->queue = $queue;
$up_duration = number_format(microtime(true) - $poller_up_start, 3); $up_duration = number_format(microtime(true) - $poller_up_start, 3);
@ -330,7 +332,7 @@ function poller_exec_function($queue, $funcname, $argv) {
logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 2 minutes (".round($duration/60, 3).")", LOGGER_DEBUG); logger("Prio ".$queue["priority"].": ".$queue["parameter"]." - longer than 2 minutes (".round($duration/60, 3).")", LOGGER_DEBUG);
} }
logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - done in ".$duration." seconds."); logger("Process ".$mypid." - Prio ".$queue["priority"]." - ID ".$queue["id"].": ".$funcname." - done in ".$duration." seconds. Process PID: ".$new_process_id);
// Write down the performance values into the log // Write down the performance values into the log
if (Config::get("system", "profiler")) { if (Config::get("system", "profiler")) {

View file

@ -14,7 +14,7 @@ function pubsubpublish_run(&$argv, &$argc){
} else { } else {
// We'll push to each subscriber that has push > 0, // We'll push to each subscriber that has push > 0,
// i.e. there has been an update (set in notifier.php). // i.e. there has been an update (set in notifier.php).
$r = q("SELECT `id`, `callback_url` FROM `push_subscriber` WHERE `push` > 0"); $r = q("SELECT `id`, `callback_url` FROM `push_subscriber` WHERE `push` > 0 ORDER BY `last_update` DESC");
foreach ($r as $rr) { foreach ($r as $rr) {
logger("Publish feed to ".$rr["callback_url"], LOGGER_DEBUG); logger("Publish feed to ".$rr["callback_url"], LOGGER_DEBUG);
@ -43,7 +43,13 @@ function handle_pubsubhubbub($id) {
logger("Generate feed of user ".$rr['nickname']." to ".$rr['callback_url']." - last updated ".$rr['last_update'], LOGGER_DEBUG); logger("Generate feed of user ".$rr['nickname']." to ".$rr['callback_url']." - last updated ".$rr['last_update'], LOGGER_DEBUG);
$params = ostatus::feed($a, $rr['nickname'], $rr['last_update']); $last_update = $rr['last_update'];
$params = ostatus::feed($a, $rr['nickname'], $last_update);
if (!$params) {
return;
}
$hmac_sig = hash_hmac("sha1", $params, $rr['secret']); $hmac_sig = hash_hmac("sha1", $params, $rr['secret']);
$headers = array("Content-type: application/atom+xml", $headers = array("Content-type: application/atom+xml",
@ -60,10 +66,9 @@ function handle_pubsubhubbub($id) {
if ($ret >= 200 && $ret <= 299) { if ($ret >= 200 && $ret <= 299) {
logger('successfully pushed to '.$rr['callback_url']); logger('successfully pushed to '.$rr['callback_url']);
// set last_update to "now", and reset push=0 // set last_update to the "created" date of the last item, and reset push=0
$date_now = datetime_convert('UTC','UTC','now','Y-m-d H:i:s');
q("UPDATE `push_subscriber` SET `push` = 0, last_update = '%s' WHERE id = %d", q("UPDATE `push_subscriber` SET `push` = 0, last_update = '%s' WHERE id = %d",
dbesc($date_now), dbesc($last_update),
intval($rr['id'])); intval($rr['id']));
} else { } else {