streams/include/oembed.php

403 lines
10 KiB
PHP
Raw Normal View History

2013-02-26 01:09:40 +00:00
<?php /** @file */
2016-05-03 05:28:27 +00:00
2016-06-23 12:18:58 +00:00
use Zotlabs\Lib as Zlib;
2016-08-12 00:33:28 +00:00
require_once('include/hubloc.php');
function oembed_replacecb($matches){
2014-01-24 07:46:43 +00:00
$embedurl=$matches[1];
2015-08-05 03:07:55 +00:00
2016-05-03 05:28:27 +00:00
$result = oembed_action($embedurl);
if($result['action'] === 'block') {
return '<a href="' . $result['url'] . '">' . $result['url'] . '</a>';
}
2016-05-03 05:28:27 +00:00
$j = oembed_fetch_url($result['url']);
$s = oembed_format_object($j);
return $s;
}
function oembed_action($embedurl) {
$host = '';
2016-05-03 05:28:27 +00:00
$action = 'filter';
2016-05-03 05:28:27 +00:00
$embedurl = trim(str_replace('&amp;','&', $embedurl));
2016-05-03 05:28:27 +00:00
logger('oembed_action: ' . $embedurl, LOGGER_DEBUG, LOG_INFO);
2016-05-03 05:28:27 +00:00
if(strpos($embedurl,'http://') === 0) {
if(intval(get_config('system','embed_sslonly'))) {
$action = 'block';
}
}
// site white/black list
if(($x = get_config('system','embed_deny'))) {
if(($x) && (! is_array($x)))
$x = explode("\n",$x);
if($x) {
foreach($x as $ll) {
$t = trim($ll);
if(($t) && (strpos($embedurl,$t) !== false)) {
$action = 'block';
break;
}
}
}
}
$found = false;
if(($x = get_config('system','embed_allow'))) {
if(($x) && (! is_array($x)))
$x = explode("\n",$x);
if($x) {
foreach($x as $ll) {
$t = trim($ll);
2016-05-03 05:28:27 +00:00
if(($t) && (strpos($embedurl,$t) !== false) && ($action !== 'block')) {
$found = true;
$action = 'allow';
break;
}
}
}
if((! $found) && ($action !== 'block')) {
$action = 'filter';
}
}
// allow individual members to block something that wasn't blocked already.
// They cannot over-ride the site to allow or change the filtering on an
2016-05-03 05:28:27 +00:00
// embed that is not allowed by the site admin.
2015-08-05 03:07:55 +00:00
if(local_channel()) {
if(($x = get_pconfig(local_channel(),'system','embed_deny'))) {
if(($x) && (! is_array($x)))
$x = explode("\n",$x);
if($x) {
foreach($x as $ll) {
$t = trim($ll);
if(($t) && (strpos($embedurl,$t) !== false)) {
$action = 'block';
2015-08-05 03:07:55 +00:00
break;
}
}
}
}
}
2016-05-03 05:28:27 +00:00
$arr = array('url' => $embedurl, 'action' => $action);
call_hooks('oembed_action',$arr);
logger('action: ' . $arr['action'] . ' url: ' . $arr['url'], LOGGER_DEBUG,LOG_DEBUG);
2016-05-03 05:28:27 +00:00
return $arr;
}
// if the url is embeddable with oembed, return the bbcode link.
function oembed_process($url) {
$j = oembed_fetch_url($url);
logger('oembed_process: ' . print_r($j,true));
if($j && $j->type !== 'error')
return '[embed]' . $url . '[/embed]';
return false;
}
function oembed_fetch_url($embedurl){
// These media files should now be caught in bbcode.php
// left here as a fallback in case this is called from another source
$noexts = array(".mp3",".mp4",".ogg",".ogv",".oga",".ogm",".webm",".opus");
2016-05-03 05:28:27 +00:00
$result = oembed_action($embedurl);
2016-05-03 05:28:27 +00:00
$embedurl = $result['url'];
$action = $result['action'];
foreach($noexts as $ext) {
if(strpos(strtolower($embedurl),$ext) !== false) {
$action = 'block';
}
}
$txt = null;
2016-08-12 00:33:28 +00:00
// we should try to cache this and avoid a lookup on each render
$zrl = is_matrix_url($embedurl);
if($action !== 'block') {
2016-06-23 12:18:58 +00:00
$txt = Zlib\Cache::get('[' . App::$videowidth . '] ' . $embedurl);
if(strstr($txt,'youtu') && strstr(z_root(),'https:')) {
$txt = str_replace('http:','https:',$txt);
}
}
if(is_null($txt)) {
$txt = "";
$furl = $embedurl;
2016-08-12 00:33:28 +00:00
logger('local_channel: ' . local_channel());
2016-08-12 00:33:28 +00:00
if(local_channel() && $zrl)
$furl = zid($furl);
if ($action !== 'block') {
// try oembed autodiscovery
$redirects = 0;
$result = z_fetch_url($furl, false, $redirects, array('timeout' => 15, 'accept_content' => "text/*", 'novalidate' => true ));
2013-02-26 04:13:30 +00:00
if($result['success'])
$html_text = $result['body'];
if($html_text) {
$dom = @DOMDocument::loadHTML($html_text);
if ($dom){
$xpath = new DOMXPath($dom);
$attr = "oembed";
$xattr = oe_build_xpath("class","oembed");
2016-01-31 23:55:27 +00:00
$entries = $xpath->query("//link[@type='application/json+oembed']");
foreach($entries as $e){
$href = $e->getAttributeNode("href")->nodeValue;
2016-03-31 23:06:03 +00:00
$x = z_fetch_url($href . '&maxwidth=' . App::$videowidth);
$txt = $x['body'];
break;
}
// soundcloud is now using text/json+oembed instead of application/json+oembed,
// others may be also
$entries = $xpath->query("//link[@type='text/json+oembed']");
foreach($entries as $e){
$href = $e->getAttributeNode("href")->nodeValue;
2016-03-31 23:06:03 +00:00
$x = z_fetch_url($href . '&maxwidth=' . App::$videowidth);
$txt = $x['body'];
break;
}
}
}
}
2013-06-03 23:53:53 +00:00
if ($txt==false || $txt=="") {
2016-03-31 23:06:03 +00:00
$x = array('url' => $embedurl,'videowidth' => App::$videowidth);
2013-06-03 23:53:53 +00:00
call_hooks('oembed_probe',$x);
if(array_key_exists('embed',$x))
$txt = $x['embed'];
}
$txt=trim($txt);
if ($txt[0]!="{") $txt='{"type":"error"}';
//save in cache
if(! get_config('system','oembed_cache_disable'))
2016-06-23 12:18:58 +00:00
Zlib\Cache::set('[' . App::$videowidth . '] ' . $embedurl,$txt);
2011-10-24 11:02:38 +00:00
}
$j = json_decode($txt);
2016-05-03 05:28:27 +00:00
if($action === 'filter') {
if($j->html) {
$orig = $j->html;
$allow_position = (($zrl) ? true : false);
$j->html = purify_html($j->html,$allow_position);
if($j->html != $orig) {
logger('oembed html was purified. original: ' . $orig . ' purified: ' . $j->html, LOGGER_DEBUG, LOG_INFO);
}
2016-08-12 00:33:28 +00:00
$orig_len = mb_strlen(preg_replace('/\s+/','',$orig));
$new_len = mb_strlen(preg_replace('/\s+/','',$j->html));
if(stripos($orig,'<script') || (! $new_len))
$j->type = 'error';
elseif($orig_len) {
$ratio = $new_len / $orig_len;
2016-08-12 00:33:28 +00:00
if($ratio < 0.5) {
$j->type = 'error';
2016-08-12 00:33:28 +00:00
logger('oembed html truncated: ' . $ratio, LOGGER_DEBUG, LOG_INFO);
}
}
}
}
$j->embedurl = $embedurl;
2016-08-12 00:33:28 +00:00
// logger('fetch return: ' . print_r($j,true));
return $j;
}
function oembed_format_object($j){
2016-05-25 03:49:23 +00:00
2012-06-07 12:49:33 +00:00
$embedurl = $j->embedurl;
2014-10-09 03:37:46 +00:00
// logger('format: ' . print_r($j,true));
2014-10-09 03:37:46 +00:00
$jhtml = oembed_iframe($j->embedurl,(isset($j->width) ? $j->width : null), (isset($j->height) ? $j->height : null));
2014-01-24 07:46:43 +00:00
$ret="<span class='oembed ".$j->type."'>";
switch ($j->type) {
case "video": {
if (isset($j->thumbnail_url)) {
2011-10-24 15:31:14 +00:00
$tw = (isset($j->thumbnail_width)) ? $j->thumbnail_width:200;
$th = (isset($j->thumbnail_height)) ? $j->thumbnail_height:180;
$tr = $tw/$th;
$th=120; $tw = $th*$tr;
$tpl=get_markup_template('oembed_video.tpl');
if(strstr($embedurl,'youtu') && strstr(z_root(),'https:')) {
$embedurl = str_replace('http:','https:',$embedurl);
$j->thumbnail_url = str_replace('http:','https:', $j->thumbnail_url);
$jhtml = str_replace('http:','https:', $jhtml);
$j->html = str_replace('http:','https:', $j->html);
}
$ret.=replace_macros($tpl, array(
2016-03-31 05:13:24 +00:00
'$baseurl' => z_root(),
'$embedurl'=>$embedurl,
'$escapedhtml'=>base64_encode($jhtml),
'$tw'=>$tw,
'$th'=>$th,
'$turl'=>$j->thumbnail_url,
));
} else {
$ret=$jhtml;
}
$ret.="<br>";
}; break;
case "photo": {
$ret.= "<img width='".$j->width."' src='".$j->url."'>";
$ret.="<br>";
}; break;
case "link": {
2016-01-31 23:55:27 +00:00
if($j->thumbnail_url) {
2016-02-01 00:33:25 +00:00
if(is_matrix_url($embedurl)) {
$embedurl = zid($embedurl);
$j->thumbnail_url = zid($j->thumbnail_url);
}
2016-01-31 23:55:27 +00:00
$ret = '<a href="' . $embedurl . '" ><img src="' . $j->thumbnail_url . '" alt="thumbnail" /></a><br /><br />';
}
//$ret = "<a href='".$embedurl."'>".$j->title."</a>";
}; break;
case "rich": {
// not so safe..
$ret.= $jhtml;
}; break;
}
// add link to source if not present in "rich" type
if ( $j->type!='rich' || !strpos($j->html,$embedurl) ){
$embedlink = (isset($j->title))?$j->title:$embedurl;
$ret .= '<br />' . "<a href='$embedurl' rel='oembed'>$embedlink</a>";
2016-02-02 07:09:45 +00:00
$ret .= "<br />";
if (isset($j->author_name)) $ret.=" by ".$j->author_name;
if (isset($j->provider_name)) $ret.=" on ".$j->provider_name;
} else {
// add <a> for html2bbcode conversion
2016-02-02 07:09:45 +00:00
$ret .= "<br /><a href='$embedurl' rel='oembed'>$embedurl</a>";
}
$ret.="<br style='clear:left'></span>";
return mb_convert_encoding($ret, 'HTML-ENTITIES', mb_detect_encoding($ret));
}
function oembed_iframe($src,$width,$height) {
$scroll = ' scrolling="no" ';
if(! $width || strstr($width,'%')) {
$width = '640';
$scroll = ' scrolling="auto" ';
}
if(! $height || strstr($height,'%')) {
$height = '300';
$scroll = ' scrolling="auto" ';
}
// try and leave some room for the description line.
$height = intval($height) + 80;
$width = intval($width) + 40;
2014-10-09 03:37:46 +00:00
$s = z_root() . '/oembed/' . base64url_encode($src);
2014-10-09 03:37:46 +00:00
// Make sure any children are sandboxed within their own iframe.
return '<iframe ' . $scroll . 'height="' . $height . '" width="' . $width . '" src="' . $s . '" frameborder="no" >'
2014-10-09 03:37:46 +00:00
. t('Embedded content') . '</iframe>';
}
function oembed_bbcode2html($text){
$stopoembed = get_config("system","no_oembed");
2011-01-31 10:00:35 +00:00
if ($stopoembed == true){
return preg_replace("/\[embed\](.+?)\[\/embed\]/is", "<!-- oembed $1 --><i>". t('Embedding disabled') ." : $1</i><!-- /oembed $1 -->" ,$text);
}
return preg_replace_callback("/\[embed\](.+?)\[\/embed\]/is", 'oembed_replacecb' ,$text);
}
function oe_build_xpath($attr, $value){
// http://westhoffswelt.de/blog/0036_xpath_to_select_html_by_class.html
return "contains( normalize-space( @$attr ), ' $value ' ) or substring( normalize-space( @$attr ), 1, string-length( '$value' ) + 1 ) = '$value ' or substring( normalize-space( @$attr ), string-length( @$attr ) - string-length( '$value' ) ) = ' $value' or @$attr = '$value'";
}
function oe_get_inner_html( $node ) {
$innerHTML= '';
$children = $node->childNodes;
foreach ($children as $child) {
$innerHTML .= $child->ownerDocument->saveXML( $child );
}
return $innerHTML;
}
/**
* Find <span class='oembed'>..<a href='url' rel='oembed'>..</a></span>
* and replace it with [embed]url[/embed]
*/
function oembed_html2bbcode($text) {
// start parser only if 'oembed' is in text
if (strpos($text, "oembed")){
// convert non ascii chars to html entities
$html_text = mb_convert_encoding($text, 'HTML-ENTITIES', mb_detect_encoding($text));
// If it doesn't parse at all, just return the text.
$dom = @DOMDocument::loadHTML($html_text);
if(! $dom)
return $text;
$xpath = new DOMXPath($dom);
$attr = "oembed";
$xattr = oe_build_xpath("class","oembed");
$entries = $xpath->query("//span[$xattr]");
$xattr = "@rel='oembed'";//oe_build_xpath("rel","oembed");
foreach($entries as $e) {
$href = $xpath->evaluate("a[$xattr]/@href", $e)->item(0)->nodeValue;
if(!is_null($href)) $e->parentNode->replaceChild(new DOMText("[embed]".$href."[/embed]"), $e);
}
return oe_get_inner_html( $dom->getElementsByTagName("body")->item(0) );
} else {
2011-02-09 04:55:34 +00:00
return $text;
}
}
2011-10-24 11:02:38 +00:00