]> git.wh0rd.org - tt-rss.git/blame - plugins/af_unburn/init.php
remove $link
[tt-rss.git] / plugins / af_unburn / init.php
CommitLineData
9b725068
AD
1<?php
2class Af_Unburn extends Plugin {
9b725068
AD
3 private $host;
4
5 function about() {
6 return array(1.0,
6368785e 7 "Resolves feedburner and similar feed redirector URLs (requires CURL)",
9b725068
AD
8 "fox");
9 }
10
11 function init($host) {
9b725068
AD
12 $this->host = $host;
13
14 $host->add_hook($host::HOOK_ARTICLE_FILTER, $this);
15 }
16
17 function hook_article_filter($article) {
18 $owner_uid = $article["owner_uid"];
19
20 if (!function_exists("curl_init"))
21 return $article;
22
eb161344 23 if ((strpos($article["link"], "feedproxy.google.com") !== FALSE ||
a90952ec 24 strpos($article["link"], "/~r/") !== FALSE ||
e02555c1 25 strpos($article["link"], "feedsportal.com") !== FALSE)) {
9b725068 26
e02555c1 27 if (strpos($article["plugin_data"], "unburn,$owner_uid:") === FALSE) {
9b725068 28
438a3ecb 29 if (ini_get("safe_mode") || ini_get("open_basedir")) {
81153e6b
AD
30 $ch = curl_init(geturl($article["link"]));
31 } else {
32 $ch = curl_init($article["link"]);
33 }
34
e02555c1
AD
35 curl_setopt($ch, CURLOPT_TIMEOUT, 5);
36 curl_setopt($ch, CURLOPT_RETURNTRANSFER, true);
37 curl_setopt($ch, CURLOPT_HEADER, true);
438a3ecb 38 curl_setopt($ch, CURLOPT_FOLLOWLOCATION, !ini_get("safe_mode") && !ini_get("open_basedir"));
e02555c1 39 curl_setopt($ch, CURLOPT_USERAGENT, SELF_USER_AGENT);
9b725068 40
e02555c1 41 $contents = @curl_exec($ch);
9b725068 42
e02555c1 43 $real_url = curl_getinfo($ch, CURLINFO_EFFECTIVE_URL);
8c685908 44
e02555c1 45 curl_close($ch);
8c685908 46
e02555c1
AD
47 if ($real_url) {
48 /* remove the rest of it */
8c685908 49
e02555c1 50 $query = parse_url($real_url, PHP_URL_QUERY);
8c685908 51
e02555c1
AD
52 if ($query && strpos($query, "utm_source") !== FALSE) {
53 $args = array();
54 parse_str($query, $args);
55
56 foreach (array("utm_source", "utm_medium", "utm_campaign") as $param) {
57 if (isset($args[$param])) unset($args[$param]);
58 }
8c685908 59
e02555c1 60 $new_query = http_build_query($args);
8c685908 61
e02555c1
AD
62 if ($new_query != $query) {
63 $real_url = str_replace("?$query", "?$new_query", $real_url);
64 }
8c685908 65 }
8c685908 66
e02555c1 67 $real_url = preg_replace("/\?$/", "", $real_url);
1e6463fd 68
e02555c1
AD
69 $article["plugin_data"] = "unburn,$owner_uid:" . $article["plugin_data"];
70 $article["link"] = $real_url;
71 }
72 } else if (isset($article["stored"]["link"])) {
73 $article["link"] = $article["stored"]["link"];
9b725068
AD
74 }
75 }
76
77 return $article;
78 }
81153e6b 79
e2b0054b
AD
80 function geturl($url){
81
82 (function_exists('curl_init')) ? '' : die('cURL Must be installed for geturl function to work. Ask your host to enable it or uncomment extension=php_curl.dll in php.ini');
83
84 $curl = curl_init();
85 $header[0] = "Accept: text/xml,application/xml,application/xhtml+xml,";
86 $header[0] .= "text/html;q=0.9,text/plain;q=0.8,image/png,*/*;q=0.5";
87 $header[] = "Cache-Control: max-age=0";
88 $header[] = "Connection: keep-alive";
89 $header[] = "Keep-Alive: 300";
90 $header[] = "Accept-Charset: ISO-8859-1,utf-8;q=0.7,*;q=0.7";
91 $header[] = "Accept-Language: en-us,en;q=0.5";
92 $header[] = "Pragma: ";
93
94 curl_setopt($curl, CURLOPT_URL, $url);
95 curl_setopt($curl, CURLOPT_USERAGENT, 'Mozilla/5.0 (Windows NT 5.1; rv:5.0) Gecko/20100101 Firefox/5.0 Firefox/5.0');
96 curl_setopt($curl, CURLOPT_HTTPHEADER, $header);
97 curl_setopt($curl, CURLOPT_HEADER, true);
98 curl_setopt($curl, CURLOPT_REFERER, $url);
99 curl_setopt($curl, CURLOPT_ENCODING, 'gzip,deflate');
100 curl_setopt($curl, CURLOPT_AUTOREFERER, true);
101 curl_setopt($curl, CURLOPT_RETURNTRANSFER, true);
102 //curl_setopt($curl, CURLOPT_FOLLOWLOCATION, true); //CURLOPT_FOLLOWLOCATION Disabled...
103 curl_setopt($curl, CURLOPT_TIMEOUT, 60);
104
105 $html = curl_exec($curl);
106
107 $status = curl_getinfo($curl);
108 curl_close($curl);
109
110 if($status['http_code']!=200){
111 if($status['http_code'] == 301 || $status['http_code'] == 302) {
112 list($header) = explode("\r\n\r\n", $html, 2);
113 $matches = array();
114 preg_match("/(Location:|URI:)[^(\n)]*/", $header, $matches);
115 $url = trim(str_replace($matches[1],"",$matches[0]));
116 $url_parsed = parse_url($url);
117 return (isset($url_parsed))? geturl($url, $referer):'';
118 }
119 $oline='';
120 foreach($status as $key=>$eline){$oline.='['.$key.']'.$eline.' ';}
121 $line =$oline." \r\n ".$url."\r\n-----------------\r\n";
122 $handle = @fopen('./curl.error.log', 'a');
123 fwrite($handle, $line);
124 return FALSE;
125 }
126 return $url;
127 }
9b725068
AD
128}
129?>