3 * API for fetching the HTML to embed remote content based on a provided URL.
4 * Used internally by the {@link WP_Embed} class, but is designed to be generic.
6 * @link http://codex.wordpress.org/oEmbed oEmbed Codex Article
7 * @link http://oembed.com/ oEmbed Homepage
// Provider map used by get_provider(): URL pattern => array( oEmbed endpoint URL, whether the pattern is a regex ).
// Filled by the constructor with the result of the 'oembed_providers' filter.
21 public $providers = array();
// Requests queued by _add_provider_early() (under 'add') and _remove_provider_early() (under 'remove').
// The constructor applies both lists to the built-in providers and then resets this to an empty array.
22 public static $early_providers = array();
/**
 * Builds the provider map and registers the newline clean-up filter.
 *
 * Starts from the built-in provider list, applies the additions and removals queued in
 * self::$early_providers, clears that queue, and stores the result of the
 * 'oembed_providers' filter in $this->providers.
 */
public function __construct() {
	// URL pattern => array( oEmbed endpoint, true when the pattern is already a regex ).
	$defaults = array(
		'#http://(www\.)?youtube\.com/watch.*#i'              => array( 'http://www.youtube.com/oembed', true ),
		'#https://(www\.)?youtube\.com/watch.*#i'             => array( 'http://www.youtube.com/oembed?scheme=https', true ),
		'#http://(www\.)?youtube\.com/playlist.*#i'           => array( 'http://www.youtube.com/oembed', true ),
		'#https://(www\.)?youtube\.com/playlist.*#i'          => array( 'http://www.youtube.com/oembed?scheme=https', true ),
		'#http://youtu\.be/.*#i'                              => array( 'http://www.youtube.com/oembed', true ),
		'#https://youtu\.be/.*#i'                             => array( 'http://www.youtube.com/oembed?scheme=https', true ),
		'http://blip.tv/*'                                    => array( 'http://blip.tv/oembed/', false ),
		'#https?://(.+\.)?vimeo\.com/.*#i'                    => array( 'http://vimeo.com/api/oembed.{format}', true ),
		'#https?://(www\.)?dailymotion\.com/.*#i'             => array( 'http://www.dailymotion.com/services/oembed', true ),
		'http://dai.ly/*'                                     => array( 'http://www.dailymotion.com/services/oembed', false ),
		'#https?://(www\.)?flickr\.com/.*#i'                  => array( 'https://www.flickr.com/services/oembed/', true ),
		'#https?://flic\.kr/.*#i'                             => array( 'https://www.flickr.com/services/oembed/', true ),
		'#https?://(.+\.)?smugmug\.com/.*#i'                  => array( 'http://api.smugmug.com/services/oembed/', true ),
		'#https?://(www\.)?hulu\.com/watch/.*#i'              => array( 'http://www.hulu.com/api/oembed.{format}', true ),
		'http://revision3.com/*'                              => array( 'http://revision3.com/api/oembed/', false ),
		'http://i*.photobucket.com/albums/*'                  => array( 'http://photobucket.com/oembed', false ),
		'http://gi*.photobucket.com/groups/*'                 => array( 'http://photobucket.com/oembed', false ),
		'#https?://(www\.)?scribd\.com/doc/.*#i'              => array( 'http://www.scribd.com/services/oembed', true ),
		'#https?://wordpress.tv/.*#i'                         => array( 'http://wordpress.tv/oembed/', true ),
		'#https?://(.+\.)?polldaddy\.com/.*#i'                => array( 'https://polldaddy.com/oembed/', true ),
		'#https?://poll\.fm/.*#i'                             => array( 'https://polldaddy.com/oembed/', true ),
		'#https?://(www\.)?funnyordie\.com/videos/.*#i'       => array( 'http://www.funnyordie.com/oembed', true ),
		'#https?://(www\.)?twitter\.com/.+?/status(es)?/.*#i' => array( 'https://api.twitter.com/1/statuses/oembed.{format}', true ),
		'#https?://(www\.)?soundcloud\.com/.*#i'              => array( 'http://soundcloud.com/oembed', true ),
		'#https?://(www\.)?slideshare\.net/.*#i'              => array( 'https://www.slideshare.net/api/oembed/2', true ),
		'#http://instagr(\.am|am\.com)/p/.*#i'                => array( 'http://api.instagram.com/oembed', true ),
		'#https?://(www\.)?rdio\.com/.*#i'                    => array( 'http://www.rdio.com/api/oembed/', true ),
		'#https?://rd\.io/x/.*#i'                             => array( 'http://www.rdio.com/api/oembed/', true ),
		'#https?://(open|play)\.spotify\.com/.*#i'            => array( 'https://embed.spotify.com/oembed/', true ),
		'#https?://(.+\.)?imgur\.com/.*#i'                    => array( 'http://api.imgur.com/oembed', true ),
		'#https?://(www\.)?meetu(\.ps|p\.com)/.*#i'           => array( 'http://api.meetup.com/oembed', true ),
		'#https?://(www\.)?issuu\.com/.+/docs/.+#i'           => array( 'http://issuu.com/oembed_wp', true ),
		'#https?://(www\.)?collegehumor\.com/video/.*#i'      => array( 'http://www.collegehumor.com/oembed.{format}', true ),
		'#https?://(www\.)?mixcloud\.com/.*#i'                => array( 'http://www.mixcloud.com/oembed', true ),
		'#https?://(www\.|embed\.)?ted\.com/talks/.*#i'       => array( 'http://www.ted.com/talks/oembed.{format}', true ),
		'#https?://(www\.)?(animoto|video214)\.com/play/.*#i' => array( 'http://animoto.com/oembeds/create', true ),
	);

	// Providers queued through _add_provider_early() override or extend the built-in list.
	$queued_additions = empty( self::$early_providers['add'] ) ? array() : self::$early_providers['add'];
	foreach ( $queued_additions as $pattern => $definition ) {
		$defaults[ $pattern ] = $definition;
	}

	// Patterns queued through _remove_provider_early() are dropped afterwards.
	$queued_removals = empty( self::$early_providers['remove'] ) ? array() : self::$early_providers['remove'];
	foreach ( $queued_removals as $pattern ) {
		unset( $defaults[ $pattern ] );
	}

	// The queue has been consumed; start over with an empty one.
	self::$early_providers = array();

	/**
	 * Filter the list of oEmbed providers.
	 *
	 * Discovery is disabled for users lacking the unfiltered_html capability.
	 * Only providers in this array will be used for those users.
	 *
	 * Supported providers:
	 *
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Provider     | Flavor               | SSL   | Since     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Blip         | blip.tv              |       | 2.9.0     |
	 * | Dailymotion  | dailymotion.com      | Yes   | 2.9.0     |
	 * | Flickr       | flickr.com           | Yes   | 2.9.0     |
	 * | Hulu         | hulu.com             | Yes   | 2.9.0     |
	 * | Photobucket  | photobucket.com      |       | 2.9.0     |
	 * | Revision3    | revision3.com        |       | 2.9.0     |
	 * | Scribd       | scribd.com           | Yes   | 2.9.0     |
	 * | Vimeo        | vimeo.com            | Yes   | 2.9.0     |
	 * | WordPress.tv | wordpress.tv         | Yes   | 2.9.0     |
	 * | YouTube      | youtube.com/watch    | Yes   | 2.9.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Funny or Die | funnyordie.com       | Yes   | 3.0.0     |
	 * | Polldaddy    | polldaddy.com        | Yes   | 3.0.0     |
	 * | SmugMug      | smugmug.com          | Yes   | 3.0.0     |
	 * | YouTube      | youtu.be             | Yes   | 3.0.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Twitter      | twitter.com          | Yes   | 3.4.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Instagram    | instagram.com        |       | 3.5.0     |
	 * | Instagram    | instagr.am           |       | 3.5.0     |
	 * | Slideshare   | slideshare.net       | Yes   | 3.5.0     |
	 * | SoundCloud   | soundcloud.com       | Yes   | 3.5.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Dailymotion  | dai.ly               |       | 3.6.0     |
	 * | Flickr       | flic.kr              | Yes   | 3.6.0     |
	 * | Rdio         | rdio.com             | Yes   | 3.6.0     |
	 * | Rdio         | rd.io                | Yes   | 3.6.0     |
	 * | Spotify      | spotify.com          | Yes   | 3.6.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Imgur        | imgur.com            | Yes   | 3.9.0     |
	 * | Meetup.com   | meetup.com           | Yes   | 3.9.0     |
	 * | Meetup.com   | meetu.ps             | Yes   | 3.9.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 * | Animoto      | animoto.com          | Yes   | 4.0.0     |
	 * | Animoto      | video214.com         | Yes   | 4.0.0     |
	 * | CollegeHumor | collegehumor.com     | Yes   | 4.0.0     |
	 * | Issuu        | issuu.com            | Yes   | 4.0.0     |
	 * | Mixcloud     | mixcloud.com         | Yes   | 4.0.0     |
	 * | Polldaddy    | poll.fm              | Yes   | 4.0.0     |
	 * | TED          | ted.com              | Yes   | 4.0.0     |
	 * | YouTube      | youtube.com/playlist | Yes   | 4.0.0     |
	 * | ------------ | -------------------- | ----- | --------- |
	 *
	 * No longer supported providers:
	 *
	 * | ------------ | -------------------- | ----- | --------- | --------- |
	 * | Provider     | Flavor               | SSL   | Since     | Removed   |
	 * | ------------ | -------------------- | ----- | --------- | --------- |
	 * | Qik          | qik.com              | Yes   | 2.9.0     | 3.9.0     |
	 * | ------------ | -------------------- | ----- | --------- | --------- |
	 * | Viddler      | viddler.com          | Yes   | 2.9.0     | 4.0.0     |
	 * | ------------ | -------------------- | ----- | --------- | --------- |
	 *
	 * @see wp_oembed_add_provider()
	 *
	 * @param array $providers An array of popular oEmbed providers.
	 */
	$this->providers = apply_filters( 'oembed_providers', $defaults );

	// Fix any embeds that contain new lines in the middle of the HTML which breaks wpautop().
	add_filter( 'oembed_dataparse', array( $this, '_strip_newlines' ), 10, 3 );
}
160 * Make private/protected methods readable for backwards compatibility.
165 * @param string $name Name of the method to call.
166 * @param array $arguments Arguments to pass when calling.
167 * @return mixed|bool Return value of the callback, false otherwise.
/**
 * Make private/protected methods readable for backwards compatibility.
 *
 * The call is only forwarded when a method of that name exists on this object.
 * Forwarding an unknown name would make call_user_func_array() resolve the
 * callback through this very method again and recurse without end.
 *
 * @param string $name      Name of the method to call.
 * @param array  $arguments Arguments to pass when calling.
 * @return mixed|bool Return value of the method, false when no such method exists.
 */
public function __call( $name, $arguments ) {
	if ( ! method_exists( $this, $name ) ) {
		return false;
	}

	return call_user_func_array( array( $this, $name ), $arguments );
}
174 * Takes a URL and returns the corresponding oEmbed provider's URL, if there is one.
179 * @see WP_oEmbed::discover()
181 * @param string $url The URL to the content.
182 * @param string|array $args Optional provider arguments.
183 * @return bool|string False on failure, otherwise the oEmbed provider URL.
/**
 * Takes a URL and returns the corresponding oEmbed provider's URL, if there is one.
 *
 * The URL is matched against every pattern in $this->providers; the first match wins
 * and its '{format}' placeholder is replaced with 'json'. When nothing matches and
 * the 'discover' argument is truthy (the default), discover() is tried.
 *
 * @see WP_oEmbed::discover()
 *
 * @param string       $url  The URL to the content.
 * @param string|array $args Optional provider arguments.
 * @return bool|string False on failure, otherwise the oEmbed provider URL.
 */
public function get_provider( $url, $args = '' ) {
	// Normalise to an array first: the default '' (or a query string) cannot take
	// the array-style write to $args['discover'] below.
	$args = wp_parse_args( $args );

	if ( ! isset( $args['discover'] ) ) {
		$args['discover'] = true;
	}

	$provider = false;

	foreach ( $this->providers as $matchmask => $data ) {
		list( $providerurl, $regex ) = $data;

		// Turn the asterisk-type provider URLs into regex
		if ( ! $regex ) {
			$matchmask = '#' . str_replace( '___wildcard___', '(.+)', preg_quote( str_replace( '*', '___wildcard___', $matchmask ), '#' ) ) . '#i';
			// Let a wildcard pattern written for http:// match https:// as well.
			$matchmask = preg_replace( '|^#http\\\://|', '#https?\://', $matchmask );
		}

		if ( preg_match( $matchmask, $url ) ) {
			$provider = str_replace( '{format}', 'json', $providerurl ); // JSON is easier to deal with than XML
			break;
		}
	}

	if ( ! $provider && $args['discover'] ) {
		$provider = $this->discover( $url );
	}

	return $provider;
}
214 * Add an oEmbed provider just-in-time when wp_oembed_add_provider() is called
215 * before the 'plugins_loaded' hook.
217 * The just-in-time addition is for the benefit of the 'oembed_providers' filter.
223 * @see wp_oembed_add_provider()
225 * @param string $format Format of URL that this provider can handle. You can use
226 * asterisks as wildcards.
227 * @param string $provider The URL to the oEmbed provider.
228 * @param bool $regex Optional. Whether the $format parameter is in a regex format.
/**
 * Queues an oEmbed provider so the constructor can add it to the provider list.
 *
 * The entry is stored in self::$early_providers['add'], keyed by $format.
 *
 * @see wp_oembed_add_provider()
 *
 * @param string $format   Format of URL that this provider can handle. You can use
 *                         asterisks as wildcards.
 * @param string $provider The URL to the oEmbed provider.
 * @param bool   $regex    Optional. Whether the $format parameter is in a regex format.
 */
public static function _add_provider_early( $format, $provider, $regex = false ) {
	// Start from the existing queue, or from an empty one when nothing is queued yet.
	$queued = empty( self::$early_providers['add'] ) ? array() : self::$early_providers['add'];

	$queued[ $format ] = array( $provider, $regex );

	self::$early_providers['add'] = $queued;
}
240 * Remove an oEmbed provider just-in-time when wp_oembed_remove_provider() is called
241 * before the 'plugins_loaded' hook.
243 * The just-in-time removal is for the benefit of the 'oembed_providers' filter.
249 * @see wp_oembed_remove_provider()
251 * @param string $format The format of URL that this provider can handle. You can use
252 * asterisks as wildcards.
/**
 * Queues an oEmbed provider pattern so the constructor can remove it from the provider list.
 *
 * The pattern is appended to self::$early_providers['remove'].
 *
 * @see wp_oembed_remove_provider()
 *
 * @param string $format The format of URL that this provider can handle. You can use
 *                       asterisks as wildcards.
 */
public static function _remove_provider_early( $format ) {
	// Start from the existing queue, or from an empty one when nothing is queued yet.
	$queued = empty( self::$early_providers['remove'] ) ? array() : self::$early_providers['remove'];

	$queued[] = $format;

	self::$early_providers['remove'] = $queued;
}
263 * The do-it-all function that takes a URL and attempts to return the HTML.
265 * @see WP_oEmbed::fetch()
266 * @see WP_oEmbed::data2html()
268 * @param string $url The URL to the content that should be attempted to be embedded.
269 * @param array $args Optional arguments. Usually passed from a shortcode.
270 * @return bool|string False on failure, otherwise the UNSANITIZED (and potentially unsafe) HTML that should be used to embed.
/**
 * The do-it-all function that takes a URL and attempts to return the HTML.
 *
 * Resolves the provider with get_provider(), retrieves the data with fetch(),
 * converts it with data2html() and passes the result through the
 * 'oembed_result' filter.
 *
 * @see WP_oEmbed::fetch()
 * @see WP_oEmbed::data2html()
 *
 * @param string $url  The URL to the content that should be attempted to be embedded.
 * @param array  $args Optional arguments. Usually passed from a shortcode.
 * @return bool|string False on failure, otherwise the UNSANITIZED (and potentially unsafe) HTML that should be used to embed.
 */
public function get_html( $url, $args = '' ) {
	$provider = $this->get_provider( $url, $args );
	if ( ! $provider ) {
		return false;
	}

	$data = $this->fetch( $provider, $url, $args );
	if ( false === $data ) {
		return false;
	}

	/**
	 * Filter the HTML returned by the oEmbed provider.
	 *
	 * @param string $data The returned oEmbed HTML.
	 * @param string $url  URL of the content to be embedded.
	 * @param array  $args Optional arguments, usually passed from a shortcode.
	 */
	return apply_filters( 'oembed_result', $this->data2html( $data, $url ), $url, $args );
}
291 * Attempts to find oEmbed provider discovery <link> tags at the given URL.
293 * @param string $url The URL that should be inspected for discovery <link> tags.
294 * @return bool|string False on failure, otherwise the oEmbed provider URL.
/**
 * Attempts to find oEmbed provider discovery <link> tags at the given URL.
 *
 * Fetches the document, looks at its <head> for <link> tags whose type is one of
 * the known oEmbed link types, and returns the referenced provider URL.
 *
 * @param string $url The URL that should be inspected for discovery <link> tags.
 * @return bool|string False on failure, otherwise the oEmbed provider URL.
 */
public function discover( $url ) {
	$providers = array();

	/**
	 * Filter oEmbed remote get arguments.
	 *
	 * @see WP_Http::request()
	 *
	 * @param array  $args oEmbed remote get arguments.
	 * @param string $url  URL to be inspected.
	 */
	$args = apply_filters( 'oembed_remote_get_args', array(), $url );

	// Fetch URL content
	$request = wp_safe_remote_get( $url, $args );
	$html    = wp_remote_retrieve_body( $request );

	if ( $html ) {
		/**
		 * Filter the link types that contain oEmbed provider URLs.
		 *
		 * @param array $format Array of oEmbed link types. Accepts 'application/json+oembed',
		 *                      'text/xml+oembed', and 'application/xml+oembed' (incorrect,
		 *                      used by at least Vimeo).
		 */
		$linktypes = apply_filters( 'oembed_linktypes', array(
			'application/json+oembed' => 'json',
			'text/xml+oembed'         => 'xml',
			'application/xml+oembed'  => 'xml',
		) );

		// Strip everything from </head> on. When the document has no closing head tag,
		// keep it whole: cutting at a "false" offset would empty it and make discovery
		// fail for every such page.
		$head_end = stripos( $html, '</head>' );
		if ( false !== $head_end ) {
			$html = substr( $html, 0, $head_end );
		}

		// Do a quick check: skip the regex pass when no known link type is mentioned at all.
		$tagfound = false;
		foreach ( $linktypes as $linktype => $format ) {
			if ( stripos( $html, $linktype ) ) {
				$tagfound = true;
				break;
			}
		}

		if ( $tagfound && preg_match_all( '/<link([^<>]+)>/i', $html, $links ) ) {
			foreach ( $links[1] as $link ) {
				$atts = shortcode_parse_atts( $link );

				if ( ! empty( $atts['type'] ) && ! empty( $linktypes[ $atts['type'] ] ) && ! empty( $atts['href'] ) ) {
					// Attribute values are HTML-encoded in the markup; decode so that "&amp;"
					// separators in the provider URL become real "&" before the URL is requested.
					$providers[ $linktypes[ $atts['type'] ] ] = htmlspecialchars_decode( $atts['href'] );

					// Stop here if it's JSON (that's all we need)
					if ( 'json' == $linktypes[ $atts['type'] ] ) {
						break;
					}
				}
			}
		}
	}

	// JSON is preferred to XML
	if ( ! empty( $providers['json'] ) ) {
		return $providers['json'];
	}

	if ( ! empty( $providers['xml'] ) ) {
		return $providers['xml'];
	}

	return false;
}
367 * Connects to an oEmbed provider and returns the result.
369 * @param string $provider The URL to the oEmbed provider.
370 * @param string $url The URL to the content that is desired to be embedded.
371 * @param array $args Optional arguments. Usually passed from a shortcode.
372 * @return bool|object False on failure, otherwise the result in the form of an object.
/**
 * Connects to an oEmbed provider and returns the result.
 *
 * Adds the 'maxwidth', 'maxheight' and 'url' query arguments to the provider URL,
 * passes it through the 'oembed_fetch_url' filter, then requests JSON and, only if
 * the provider reports that format as not implemented, XML.
 *
 * @param string $provider The URL to the oEmbed provider.
 * @param string $url      The URL to the content that is desired to be embedded.
 * @param array  $args     Optional arguments. Usually passed from a shortcode.
 * @return bool|object False on failure, otherwise the result in the form of an object.
 */
public function fetch( $provider, $url, $args = '' ) {
	$args = wp_parse_args( $args, wp_embed_defaults( $url ) );

	$endpoint = add_query_arg( 'maxwidth', (int) $args['width'], $provider );
	$endpoint = add_query_arg( 'maxheight', (int) $args['height'], $endpoint );
	$endpoint = add_query_arg( 'url', urlencode( $url ), $endpoint );

	/**
	 * Filter the oEmbed URL to be fetched.
	 *
	 * @param string $provider URL of the oEmbed provider.
	 * @param string $url      URL of the content to be embedded.
	 * @param array  $args     Optional arguments, usually passed from a shortcode.
	 */
	$endpoint = apply_filters( 'oembed_fetch_url', $endpoint, $url, $args );

	$formats = array( 'json', 'xml' );
	foreach ( $formats as $format ) {
		$result = $this->_fetch_with_format( $endpoint, $format );

		// Only a "not implemented" answer moves on to the next format;
		// anything else is final for this request.
		$not_implemented = is_wp_error( $result ) && 'not-implemented' == $result->get_error_code();
		if ( ! $not_implemented ) {
			if ( ! $result || is_wp_error( $result ) ) {
				return false;
			}

			return $result;
		}
	}

	return false;
}
402 * Fetches result from an oEmbed provider for a specific format and complete provider URL
406 * @param string $provider_url_with_args URL to the provider with full arguments list (url, maxheight, etc.)
407 * @param string $format Format to use
408 * @return bool|object False on failure, otherwise the result in the form of an object.
/**
 * Fetches result from an oEmbed provider for a specific format and complete provider URL.
 *
 * A 501 response code yields a WP_Error with the code 'not-implemented'; an empty
 * body yields false; otherwise the body is handed to the matching _parse_{format}() method.
 *
 * @param string $provider_url_with_args URL to the provider with full arguments list (url, maxheight, etc.)
 * @param string $format                 Format to use
 * @return bool|object False on failure, otherwise the result in the form of an object.
 */
private function _fetch_with_format( $provider_url_with_args, $format ) {
	$request_url = add_query_arg( 'format', $format, $provider_url_with_args );

	/** This filter is documented in wp-includes/class-oembed.php */
	$request_args = apply_filters( 'oembed_remote_get_args', array(), $request_url );

	$response = wp_safe_remote_get( $request_url, $request_args );

	if ( 501 == wp_remote_retrieve_response_code( $response ) ) {
		return new WP_Error( 'not-implemented' );
	}

	$body = wp_remote_retrieve_body( $response );
	if ( ! $body ) {
		return false;
	}

	// Dispatch to _parse_json() or _parse_xml() depending on the requested format.
	$parser = "_parse_$format";

	return $this->$parser( $body );
}
426 * Parses a json response body.
/**
 * Parses a JSON response body.
 *
 * @param string $response_body Raw body returned by the provider.
 * @return object|bool The decoded object, or false when the trimmed body does not decode to an object.
 */
private function _parse_json( $response_body ) {
	$decoded = json_decode( trim( $response_body ) );

	if ( $decoded && is_object( $decoded ) ) {
		return $decoded;
	}

	return false;
}
436 * Parses an XML response body.
/**
 * Parses an XML response body.
 *
 * Wraps _parse_xml_body() with libxml settings that suppress parser warnings and,
 * on PHP versions before 8.0, disable the external entity loader for the duration
 * of the parse. Both settings are restored afterwards.
 *
 * @param string $response_body Raw body returned by the provider.
 * @return object|bool The parsed object, or false on failure or when libxml is unavailable.
 */
private function _parse_xml( $response_body ) {
	if ( ! function_exists( 'libxml_disable_entity_loader' ) ) {
		return false;
	}

	// libxml_disable_entity_loader() is deprecated as of PHP 8.0, where external entity
	// loading is already disabled by default, so only toggle it on older versions.
	$toggle_entity_loader = version_compare( PHP_VERSION, '8.0.0', '<' );

	if ( $toggle_entity_loader ) {
		$loader = libxml_disable_entity_loader( true );
	}
	$errors = libxml_use_internal_errors( true );

	$return = $this->_parse_xml_body( $response_body );

	// Restore the previous libxml state.
	libxml_use_internal_errors( $errors );
	if ( $toggle_entity_loader ) {
		libxml_disable_entity_loader( $loader );
	}

	return $return;
}
457 * Helper function for parsing an XML response body.
/**
 * Helper function for parsing an XML response body.
 *
 * Rejects bodies that fail to load or that carry a document type declaration,
 * then copies every child element of the root into a plain object as a string.
 *
 * @param string $response_body Raw XML returned by the provider.
 * @return object|bool stdClass with one string property per root child element, false on failure.
 */
private function _parse_xml_body( $response_body ) {
	if ( ! ( function_exists( 'simplexml_import_dom' ) && class_exists( 'DOMDocument' ) ) ) {
		return false;
	}

	$document = new DOMDocument();
	if ( ! $document->loadXML( $response_body ) ) {
		return false;
	}

	// Refuse any document that declares a doctype.
	if ( isset( $document->doctype ) ) {
		return false;
	}

	foreach ( $document->childNodes as $node ) {
		if ( XML_DOCUMENT_TYPE_NODE === $node->nodeType ) {
			return false;
		}
	}

	$elements = simplexml_import_dom( $document );
	if ( ! $elements ) {
		return false;
	}

	$parsed = new stdClass();
	foreach ( $elements as $name => $element ) {
		$parsed->$name = (string) $element;
	}

	return $parsed;
}
492 * Converts a data object from {@link WP_oEmbed::fetch()} and returns the HTML.
494 * @param object $data A data object result from an oEmbed provider.
495 * @param string $url The URL to the content that is desired to be embedded.
496 * @return bool|string False on error, otherwise the HTML needed to embed.
/**
 * Converts a data object from {@link WP_oEmbed::fetch()} and returns the HTML.
 *
 * A photo becomes a linked <img>, video and rich responses return the provider's
 * own HTML, and a link becomes an anchor labelled with the title. The result is
 * passed through the 'oembed_dataparse' filter.
 *
 * @param object $data A data object result from an oEmbed provider.
 * @param string $url  The URL to the content that is desired to be embedded.
 * @return bool|string False on error, otherwise the HTML needed to embed.
 */
public function data2html( $data, $url ) {
	if ( ! is_object( $data ) || empty( $data->type ) ) {
		return false;
	}

	$return = false;

	switch ( $data->type ) {
		case 'photo':
			$has_fields = ! empty( $data->url ) && ! empty( $data->width ) && ! empty( $data->height );
			if ( ! $has_fields ) {
				break;
			}

			$well_typed = is_string( $data->url ) && is_numeric( $data->width ) && is_numeric( $data->height );
			if ( ! $well_typed ) {
				break;
			}

			$title = '';
			if ( ! empty( $data->title ) && is_string( $data->title ) ) {
				$title = $data->title;
			}

			$href   = esc_url( $url );
			$src    = esc_url( $data->url );
			$alt    = esc_attr( $title );
			$width  = esc_attr( $data->width );
			$height = esc_attr( $data->height );

			$return = '<a href="' . $href . '"><img src="' . $src . '" alt="' . $alt . '" width="' . $width . '" height="' . $height . '" /></a>';
			break;

		case 'video':
		case 'rich':
			// The provider's markup is used as-is.
			if ( ! empty( $data->html ) && is_string( $data->html ) ) {
				$return = $data->html;
			}
			break;

		case 'link':
			if ( ! empty( $data->title ) && is_string( $data->title ) ) {
				$return = '<a href="' . esc_url( $url ) . '">' . esc_html( $data->title ) . '</a>';
			}
			break;

		default:
			$return = false;
	}

	/**
	 * Filter the returned oEmbed HTML.
	 *
	 * Use this filter to add support for custom data types, or to filter the result.
	 *
	 * @param string $return The returned oEmbed HTML.
	 * @param object $data   A data object result from an oEmbed provider.
	 * @param string $url    The URL of the content to be embedded.
	 */
	return apply_filters( 'oembed_dataparse', $return, $data, $url );
}
545 * Strip any new lines from the HTML.
548 * @param string $html Existing HTML.
549 * @param object $data Data object from WP_oEmbed::data2html()
550 * @param string $url The original URL passed to oEmbed.
551 * @return string Possibly modified $html
/**
 * Strip any new lines from the HTML.
 *
 * Registered by the constructor on the 'oembed_dataparse' filter.
 *
 * @param string $html Existing HTML.
 * @param object $data Data object from WP_oEmbed::data2html()
 * @param string $url  The original URL passed to oEmbed.
 * @return string Possibly modified $html
 */
private function _strip_newlines( $html, $data, $url ) {
	// Nothing to strip: hand the value back untouched.
	if ( false === strpos( $html, "\n" ) ) {
		return $html;
	}

	return str_replace( array( "\r\n", "\n" ), '', $html );
}
562 * Returns the initialized {@link WP_oEmbed} object
570 * @return WP_oEmbed object.
/**
 * Returns the initialized {@link WP_oEmbed} object.
 *
 * The object is created on the first call and the same one is handed back afterwards.
 *
 * @return WP_oEmbed object.
 */
function _wp_oembed_get_object() {
	static $instance = null;

	if ( null === $instance ) {
		$instance = new WP_oEmbed();
	}

	return $instance;
}