599 lines
20 KiB
PHP
599 lines
20 KiB
PHP
<?php
|
|
/**
|
|
* OEMBED PLUGIN
|
|
*
|
|
* Version history
|
|
* 2008-07-31 - release v0.6 by Dwayne Bent <dbb.pub0@liqd.org>
|
|
* 2019-09-01 - resuscitation & realignment with "Greebo"
|
|
*
|
|
* Licensed under the GPL 2 [http://www.gnu.org/licenses/gpl.html]
|
|
*
|
|
**/
|
|
|
|
if(!defined('DOKU_INC')) define('DOKU_INC',realpath(dirname(__FILE__).'/../../').'/');
|
|
if(!defined('DOKU_PLUGIN')) define('DOKU_PLUGIN',DOKU_INC.'lib/plugins/');
|
|
define('OEMBED_BASE',DOKU_PLUGIN.'oembed/');
|
|
require_once(DOKU_PLUGIN.'syntax.php');
|
|
require_once(DOKU_INC.'inc/HTTP/HTTPClient.php');
|
|
|
|
class syntax_plugin_oembed extends DokuWiki_Syntax_Plugin {
|
|
var $errors = array();
|
|
var $version = '1.0';
|
|
var $regex_master = '/^{{>\s*(?<url>.+?)(?:\s+(?<params>.+?))??\s*}}$/';
|
|
|
|
function getType(){
|
|
return 'substition';
|
|
}
|
|
|
|
function getAllowedTypes() {
|
|
return array();
|
|
}
|
|
|
|
function getPType(){
|
|
return 'block';
|
|
}
|
|
|
|
function getSort(){
|
|
return 285;
|
|
}
|
|
|
|
function connectTo($mode) {
|
|
$this->Lexer->addSpecialPattern('{{>.+?}}', $mode, 'plugin_oembed');
|
|
}
|
|
|
|
function handle($match, $state, $pos, Doku_Handler $handler){
|
|
if($state == DOKU_LEXER_SPECIAL){
|
|
if($parsed_tag = $this->parseTag($match)){
|
|
$oembed_data = $this->resolve($parsed_tag);
|
|
return array('oembed_data' => $oembed_data,
|
|
'tag' => $parsed_tag,
|
|
'errors' => $this->errors);
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
function render($mode, Doku_Renderer $renderer, $data) {
|
|
if($mode == 'xhtml'){
|
|
$renderer->doc .= $this->renderXHTML($data);
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/***************************************************************************
|
|
* PARSE FUNCTIONS
|
|
* Convert input strings to a usable form
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Parse the entire matched string
|
|
*
|
|
* $tag: The entire matched string
|
|
*
|
|
* returns:
|
|
* false on error otherwise
|
|
* array of parsed data:
|
|
* url: the target url
|
|
* params: array of parsed parameters, see parseParams()
|
|
*/
|
|
function parseTag($tag){
|
|
if(preg_match($this->regex_master, $tag, $matches)){
|
|
return array('url' => $matches['url'],
|
|
'params' => $this->parseParams($matches['params']));
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Parse the tag parameters
|
|
*
|
|
* $params: whitespace delimited list of parameters (no trailing or leading
|
|
* whitespace)
|
|
*
|
|
* returns:
|
|
* array of parsed parameters:
|
|
* provider: array of provider parameters:
|
|
* name => value
|
|
* plugin: array of plugin parameters
|
|
* name => value
|
|
*/
|
|
function parseParams($params){
|
|
$parsed_params = array('provider' => array(), 'plugin' => array());
|
|
|
|
if($params != null){
|
|
foreach(preg_split('/\s+/', $params) as $param){
|
|
if(preg_match('/^(?<type>!|\?)(?<name>\S+?)(?:=(?<value>\S+?))?$/', $param, $matches)){
|
|
if($matches['type'] == '?'){
|
|
$parsed_params['provider'][$matches['name']] = $matches['value'];
|
|
}
|
|
else if($matches['type'] == '!'){
|
|
$parsed_params['plugin'][$matches['name']] = $matches['value'];
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return $parsed_params;
|
|
}
|
|
|
|
/*
|
|
* Parse an HTTP response containing OEmbed data
|
|
*
|
|
* $response: array of HTTP response data
|
|
* status: numerical HTTP status code
|
|
* headers: array of HTTP headers
|
|
* name => value
|
|
* body: body of the response
|
|
*
|
|
* returns: false on error or array of parsed oembed data:
|
|
* name => value
|
|
*/
|
|
function parseResponse($response){
|
|
if($response['status'] != 200) return $this->error("Provider returned HTTP Status {$response['status']} for {$tag['url']}");
|
|
if(!$type = $this->parseContentType($response['headers']['content-type'])) return false;
|
|
|
|
$oembed = array();
|
|
|
|
switch($type){
|
|
case 'xml':
|
|
if(!$xml = simplexml_load_string($response['body'])) return $this->error("Unable to parse XML: {$response['body']}");
|
|
|
|
foreach($xml as $element){
|
|
$oembed[$element->getName()] = (string) $element;
|
|
}
|
|
|
|
break;
|
|
case 'json':
|
|
$oembed = json_decode($response['body']);
|
|
|
|
break;
|
|
default:
|
|
return $this->error("Internal error occured. Found type: {$type}");
|
|
}
|
|
|
|
//if($oembed['version'] != '1.0') return $this->error("Unsupported OEmbed version: {$oembed['version']}");
|
|
return $oembed;
|
|
}
|
|
|
|
/*
|
|
* Parse a content-type string from an HTTP header
|
|
*
|
|
* $header: The content-type string
|
|
*
|
|
* returns: false on error or 'json' for JSON content or 'xml' for XML content
|
|
*/
|
|
function parseContentType($header){
|
|
if(!preg_match('/^\s*(?<type>[^;\s]+)(.*)?/', $header, $matches)){
|
|
return $this->error("Invalid Content-Type header: {$header}");
|
|
}
|
|
|
|
switch($matches['type']){
|
|
case 'text/xml':
|
|
return 'xml';
|
|
case 'application/json':
|
|
return 'json';
|
|
// non-spec content-types, only supported for compatibility
|
|
case 'application/xml':
|
|
return 'xml';
|
|
case 'text/json':
|
|
return 'json';
|
|
case 'text/plain':
|
|
return 'json';
|
|
default:
|
|
return $this->error("Unsupported Content-Type: {$matches['type']}");
|
|
}
|
|
}
|
|
|
|
/***************************************************************************
|
|
* RESOLVE FUNCTIONS
|
|
* Given parsed tag data get OEmbed data
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Given parsed tag information, return OEmbed data
|
|
*
|
|
* $tag: Parsed tag information, as from parseTag()
|
|
*
|
|
* returns: false on error or array of OEmbed data
|
|
* oembed: array of OEmbed data as returned from provider
|
|
* query_url: URL used to get the OEmbed data
|
|
* target_url: URL to which the OEmbed data refers
|
|
*/
|
|
function resolve($tag){
|
|
|
|
// try to resolve using cache
|
|
if($data = $this->resolveCache($tag)) return $data;
|
|
|
|
// try to resolve directly
|
|
if(array_key_exists('direct', $tag['params']['plugin'])){
|
|
if($this->getConf('enable_direct_link')){
|
|
return $this->resolveDirect($tag);
|
|
}
|
|
}
|
|
|
|
if($this->getConf('resolution_priority') == 'link discovery'){
|
|
// try link discovery
|
|
if($this->getConf('enable_link_discovery')){
|
|
if($data = $this->resolveDiscovery($tag)) return $data;
|
|
}
|
|
|
|
// try local provider list
|
|
if($this->getConf('enable_provider_list')){
|
|
if($data = $this->resolveProviderList($tag)) return $data;
|
|
}
|
|
}
|
|
else if($this->getConf('resolution_priority') == 'provider list'){
|
|
// try local provider list
|
|
if($this->getConf('enable_provider_list')){
|
|
if($data = $this->resolveProviderList($tag)) return $data;
|
|
}
|
|
|
|
// try link discovery
|
|
if($this->getConf('enable_link_discovery')){
|
|
if($data = $this->resolveDiscovery($tag)) return $data;
|
|
}
|
|
}
|
|
return $this->error("All resolution methods failed");
|
|
}
|
|
|
|
/*
|
|
* Analogous to resolve(), using the cache for resolution
|
|
*/
|
|
function resolveCache($tag){
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Analogous to resolve(), using a directly entered API endpoint for
|
|
* resolution
|
|
*/
|
|
function resolveDirect($tag){
|
|
$query_url = $this->buildURL($tag['url'], $tag['params']['provider']);
|
|
if(!$response = $this->fetch($query_url)) return false;
|
|
if(!$oembed = $this->parseResponse($response)) return false;
|
|
|
|
return array('oembed' => $oembed,
|
|
'query_url' => $query_url,
|
|
'target_url' => $tag['params']['provider']['url']);
|
|
}
|
|
|
|
/*
|
|
* Analogous to resolve(), using link discovery for resolution
|
|
*/
|
|
function resolveDiscovery($tag){
|
|
|
|
if(!$response = $this->fetch($tag['url'])) return false;
|
|
if(!$link_url = $this->getOEmbedLink($response['body'])) return false;
|
|
|
|
$query_url = $this->buildURL($link_url, $tag['params']['provider']);
|
|
|
|
if(!$response = $this->fetch($query_url)) return false;
|
|
if(!$oembed = $this->parseResponse($response)) return false;
|
|
|
|
|
|
|
|
return array('oembed' => $oembed,
|
|
'query_url' => $query_url,
|
|
'target_url' => $tag['url']);
|
|
}
|
|
|
|
/*
|
|
* Analogous to resolve(), using the local provider list for resolution
|
|
*/
|
|
function resolveProviderList($tag){
|
|
if(!$api = $this->getProviderAPI($tag['url'])) return false;
|
|
|
|
$api = str_replace("{format}", $this->getConf('format_preference'), $api);
|
|
$params = array_merge($tag['params']['provider'], array('url' => $tag['url']));
|
|
$query_url = $this->buildURL($api, $params);
|
|
|
|
if(!$response = $this->fetch($query_url)) return false;
|
|
if(!$oembed = $this->parseResponse($response)) return false;
|
|
|
|
return array('oembed' => $oembed,
|
|
'query_url' => $query_url,
|
|
'target_url' => $tag['url']);
|
|
}
|
|
|
|
/***************************************************************************
|
|
* RENDER FUNCTIONS
|
|
* Convert OEmbed data to a presentable form
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Given OEmbed data as returned by resolve(), produces a valid XHTML
|
|
* representation
|
|
*
|
|
* $data: OEmbed data as returned by resolve()
|
|
*
|
|
* returns: XHTML representation of OEmbed data
|
|
*/
|
|
function renderXHTML($data){
|
|
$content = '';
|
|
|
|
if(!$data['oembed_data']){
|
|
$content .= "OEmbed Error";
|
|
$content .= "<ul>";
|
|
foreach($data['errors'] as $error){
|
|
$content .= "<li>".$error."</li>";
|
|
}
|
|
$content .= "</ul>";
|
|
|
|
return $content;
|
|
}
|
|
|
|
$oembed = $this->sanitizeOEmbed($data['oembed_data']['oembed']);
|
|
|
|
if(array_key_exists('thumbnail', $data['tag']['params']['plugin'])){
|
|
if($oembed['thumbnail_url']){
|
|
$img = '<img src="'.$oembed['thumbnail_url'].'" alt="'.$oembed['title'].'" title="'.$oembed['title'].'" height="'.$oembed['thumbnail_height'].'px" width="'.$oembed['thumbnail_width'].'px"/>';
|
|
$content = '<a href="'.$data['oembed_data']['target_url'].'">'.$img.'</a>';
|
|
}
|
|
else{
|
|
$content = $this->renderXHTMLLink($data);
|
|
}
|
|
}
|
|
else{
|
|
switch($oembed['type']){
|
|
case 'photo':
|
|
if($this->getConf('fullwidth_images')){
|
|
$content = '<img src="'.$oembed['url'].'" alt="'.$oembed['title'].'" title="'.$oembed['title'].'" width=100% />';
|
|
} else {
|
|
$content = '<img src="'.$oembed['url'].'" alt="'.$oembed['title'].'" title="'.$oembed['title'].'" height="'.$oembed['height'].'px" width="'.$oembed['width'].'px"/>';
|
|
}
|
|
break;
|
|
case 'video':
|
|
$content = $oembed['html'];
|
|
break;
|
|
case 'link':
|
|
$content = $this->renderXHTMLLink($data);
|
|
break;
|
|
case 'rich':
|
|
$content = $oembed['html'];
|
|
break;
|
|
default:
|
|
$content = "OEmbed Error <ul><li>Unsupported media type: {$oembed['type']}</li></ul>";
|
|
}
|
|
}
|
|
|
|
return $content;
|
|
}
|
|
|
|
/*
|
|
* Given OEmbed data as returned by resolve(), produces a valid XHTML
|
|
* representation as a simple link
|
|
*
|
|
* $data: OEmbed data as returned by resolve()
|
|
*
|
|
* returns: XHTML representation of OEmbed data as a simple link
|
|
*/
|
|
function renderXHTMLLink($data){
|
|
$text .= ($data['oembed_data']['oembed']['provider_name'] != null) ? $data['oembed_data']['oembed']['provider_name'].': ' : '';
|
|
$text .= $data['oembed_data']['oembed']['title'];
|
|
$text .= ($data['oembed_data']['oembed']['author_name'] != null) ? ' – '.$data['oembed_data']['oembed']['author_name'] : '';
|
|
return '<a class="urlextern" href="'.$data['oembed_data']['target_url'].'">'.$text.'</a>';
|
|
}
|
|
|
|
/***************************************************************************
|
|
* UTILITY FUNCTIONS
|
|
* Provides shared functionality
|
|
**************************************************************************/
|
|
|
|
/*
|
|
* Stores a message in the errors array and returns false
|
|
*
|
|
* $msg: message to store
|
|
*
|
|
* returns: false
|
|
*/
|
|
function error($msg){
|
|
array_push($this->errors, $msg);
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Performs an HTTP GET request on the given URL
|
|
*
|
|
* $url: URL to perform the request on
|
|
*
|
|
* returns: false on error or array representing the HTTP response
|
|
* status: numerical HTTP status code
|
|
* headers: array of HTTP headers
|
|
* name => value
|
|
* body: HTTP response body
|
|
*/
|
|
function fetch($url){
|
|
$client = new DokuHTTPClient();
|
|
if(!$client->sendRequest($url)){
|
|
return $this->error("Error sending request to provider: {$url}");
|
|
}
|
|
|
|
return array('status' => $client->status,
|
|
'headers' => $client->resp_headers,
|
|
'body' => $client->resp_body);
|
|
}
|
|
|
|
/*
|
|
* Given a base URL, create a new URL using the given parameters. Query
|
|
* values are URL encoded.
|
|
*
|
|
* $base: base URL, any existing parameter values should be URL encoded.
|
|
* $params: array of parameters to add to URL
|
|
* name => value
|
|
*
|
|
* returns: the new URL
|
|
*/
|
|
function buildURL($base, $params){
|
|
$url = $base;
|
|
|
|
$first = strpos($base,"?") === false ? true : false;
|
|
foreach($params as $name => $value){
|
|
if($first){ $url .= "?"; $first = false; }
|
|
else { $url .= "&"; }
|
|
|
|
$url .= $name."=".rawurlencode($value);
|
|
}
|
|
|
|
return $url;
|
|
}
|
|
|
|
/*
|
|
* Given raw HTML, tries to extract oembed discovery link
|
|
*
|
|
* Based on code by Keith Devens:
|
|
* http://keithdevens.com/weblog/archive/2002/Jun/03/RSSAuto-DiscoveryPHP
|
|
*
|
|
* Parameters:
|
|
* $html: raw HTML
|
|
*
|
|
* Returns: false on error or no link present or an OEmbed discovery link
|
|
*/
|
|
function getOEmbedLink($html){
|
|
$ret_link = false;
|
|
|
|
if(!$html) return false;
|
|
|
|
// search through the HTML, save all <link> tags
|
|
// and store each link's attributes in an associative array
|
|
preg_match_all('/<link\s+(.*?)\s*\/?>/si', $html, $matches);
|
|
$links = $matches[1];
|
|
$final_links = array();
|
|
$link_count = count($links);
|
|
for($n=0; $n<$link_count; $n++){
|
|
$attributes = preg_split('/\s+/s', $links[$n]);
|
|
foreach($attributes as $attribute){
|
|
$att = preg_split('/\s*=\s*/s', $attribute, 2);
|
|
if(isset($att[1])){
|
|
$att[1] = preg_replace('/([\'"]?)(.*)\1/', '$2', $att[1]);
|
|
$final_link[strtolower($att[0])] = $att[1];
|
|
}
|
|
}
|
|
$final_links[$n] = $final_link;
|
|
}
|
|
|
|
// now figure out which one points to the OEmbed data
|
|
for($n=0; $n<$link_count; $n++){
|
|
if(strtolower($final_links[$n]['rel']) == 'alternate'){
|
|
if(strtolower($final_links[$n]['type']) == 'application/json+oembed'){
|
|
if($this->getConf('format_preference') == 'json'){
|
|
return $final_links[$n]['href'];
|
|
}
|
|
else{
|
|
$ret_link = $final_links[$n]['href'];
|
|
}
|
|
}
|
|
|
|
// application/xml+oembed only exists for compatability not in spec
|
|
if(strtolower($final_links[$n]['type']) == 'text/xml+oembed' or
|
|
strtolower($final_links[$n]['type']) == 'application/xml+oembed'){
|
|
if($this->getConf('format_preference') == 'xml'){
|
|
return $final_links[$n]['href'];
|
|
}
|
|
else{
|
|
$ret_link = $final_links[$n]['href'];
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return $ret_link;
|
|
}
|
|
|
|
/*
|
|
* Given a URL, finds a OEmbed provider API endpoint which can be used with
|
|
* it from the local provider list.
|
|
*
|
|
* $url: URL to search a provider for
|
|
*
|
|
* Returns: false on error or no provider find or the API endpoint of an
|
|
* appropriate provider
|
|
*/
|
|
function getProviderAPI($url){
|
|
$providers_path = OEMBED_BASE.'providers.xml';
|
|
if(!$providers = simplexml_load_file($providers_path)) return false;
|
|
|
|
foreach($providers->provider as $provider){
|
|
foreach($provider->scheme as $scheme){
|
|
$regex = "@^".str_replace("@","\@",$scheme)."$@i";
|
|
if(preg_match($regex, trim($url))){
|
|
$attrs = $provider->attributes();
|
|
if(($api = $attrs['api']) != null){
|
|
return $api;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Runs htmlspecialchars() on values in OEmbed data EXCEPT for html values
|
|
*
|
|
* $oembed: array of OEmbed data from parseResponse()
|
|
*
|
|
* Returns: identical array to $oembed in which all values except for html
|
|
* are run through htmlspecialchars()
|
|
*/
|
|
function sanitizeOEmbed($oembed){
|
|
$retarray = array();
|
|
|
|
foreach($oembed as $key => $value){
|
|
if($key == 'html'){
|
|
$retarray[$key] = $value;
|
|
}
|
|
else{
|
|
$retarray[$key] = htmlspecialchars($value);
|
|
}
|
|
}
|
|
|
|
return $retarray;
|
|
}
|
|
|
|
/***************************************************************************
|
|
* DEBUG FUNCTIONS
|
|
* For testing and devlopment, not regularly used
|
|
**************************************************************************/
|
|
|
|
function _log($msg){
|
|
$fh = fopen(OEMBED_BASE."oembed.log",'a');
|
|
$curtime = date('Y-m-d H:i:s');
|
|
fwrite($fh, "[{$curtime}] {$msg}\n");
|
|
fclose($fh);
|
|
}
|
|
|
|
function _logParsedTag($parsed_tag){
|
|
$this->_log("Parsed Tag");
|
|
$this->_log(" URL: {$parsed_tag['url']}");
|
|
$this->_log(" Provider Params:");
|
|
foreach($parsed_tag['params']['provider'] as $key => $value){
|
|
$this->_log(" {$key} => {$value}");
|
|
}
|
|
$this->_log(" Plugin Params:");
|
|
foreach($parsed_tag['params']['plugin'] as $key => $value){
|
|
$this->_log(" {$key} => {$value}");
|
|
}
|
|
}
|
|
|
|
function _logOEmbedData($oembed){
|
|
$this->_log("OEmbed Data:");
|
|
$this->_log(" target_url: {$oembed['target_url']}");
|
|
$this->_log(" query_url: {$oembed['query_url']}");
|
|
$this->_log(" Response:");
|
|
foreach($oembed['oembed'] as $name => $value){
|
|
$this->_log(" {$name}: {$value}");
|
|
}
|
|
}
|
|
|
|
function _logErrors($errors){
|
|
$this->_log("Errors:");
|
|
foreach($errors as $error){
|
|
$this->_log(" {$error}");
|
|
}
|
|
}
|
|
}
|
|
|