2011-08-24 22:16:44 +02:00
|
|
|
<?php
|
|
|
|
|
|
|
|
function getURLMetadata($url) {
|
|
|
|
//allow only http(s) and (s)ftp
|
|
|
|
$protocols = '/^[hs]{0,1}[tf]{0,1}tp[s]{0,1}\:\/\//i';
|
|
|
|
//if not (allowed) protocol is given, assume http
|
|
|
|
if(preg_match($protocols, $url) == 0) {
|
|
|
|
$url = 'http://' . $url;
|
|
|
|
}
|
2011-08-25 13:23:52 +02:00
|
|
|
$metadata['url'] = $url;
|
2011-08-24 22:16:44 +02:00
|
|
|
|
2011-09-23 12:49:14 +02:00
|
|
|
$ch = curl_init();
|
|
|
|
curl_setopt($ch, CURLOPT_URL, $url);
|
|
|
|
curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
|
|
|
|
$page = curl_exec($ch);
|
|
|
|
curl_close($ch);
|
|
|
|
|
2011-08-24 22:16:44 +02:00
|
|
|
@preg_match( "/<title>(.*)<\/title>/si", $page, $match );
|
2011-08-25 13:51:48 +02:00
|
|
|
$metadata['title'] = htmlspecialchars_decode(@$match[1]);
|
2011-08-24 22:16:44 +02:00
|
|
|
|
|
|
|
$meta = get_meta_tags($url);
|
|
|
|
|
|
|
|
if(array_key_exists('description', $meta)) {
|
|
|
|
$metadata['description'] = $meta['description'];
|
|
|
|
}
|
|
|
|
|
|
|
|
return $metadata;
|
|
|
|
}
|