3 require_once('library/HTML5/Parser.php');
4 require_once('library/HTMLPurifier.auto.php');
6 function parse_url_content(&$a) {
8 logger('parse_url: ' . $_GET['url']);
10 $url = trim(hex2bin($_GET['url']));
12 logger('parse_url: ' . $url);
16 $template = "<a href=\"%s\" >%s</a>\n%s";
19 $arr = array('url' => $url, 'text' => '');
21 call_hooks('parse_link', $arr);
23 if(strlen($arr['text'])) {
35 logger('parse_url: data: ' . $s, LOGGER_DATA);
38 echo sprintf($template,$url,$url,'');
42 $config = HTMLPurifier_Config::createDefault();
43 $config->set('Cache.DefinitionImpl', null);
45 $purifier = new HTMLPurifier($config);
46 $s = $purifier->purify($s);
48 $dom = @HTML5_Parser::parse($s);
51 echo sprintf($template,$url,$url,'');
55 $items = $dom->getElementsByTagName('title');
58 foreach($items as $item) {
59 $title = trim($item->textContent);
64 $divs = $dom->getElementsByTagName('div');
66 foreach($divs as $div) {
67 $class = $div->getAttribute('class');
68 if($class && stristr($class,'article')) {
69 $items = $div->getElementsByTagName('p');
71 foreach($items as $item) {
72 if($item->getElementsByTagName('script'))
74 $text = $item->textContent;
75 $text = strip_tags($text);
76 if(strlen($text) < 100)
78 $text = substr($text,0,250) . '...' ;
87 $items = $dom->getElementsByTagName('p');
89 foreach($items as $item) {
90 if($item->getElementsByTagName('script'))
92 $text = $item->textContent;
93 $text = strip_tags($text);
94 if(strlen($text) < 100)
96 $text = substr($text,0,250) . '...' ;
103 $text = '<br />' . $text;
106 echo sprintf($template,$url,($title) ? $title : $url,$text);