]> git.wh0rd.org - tt-rss.git/blob - plugins/af_pennyarcade/init.php
always mangle guid in af_ plugins
[tt-rss.git] / plugins / af_pennyarcade / init.php
1 <?php
2 class Af_PennyArcade extends Plugin {
3
4 private $link;
5 private $host;
6
7 function about() {
8 return array(1.0,
9 "Strip unnecessary stuff from PA feeds",
10 "fox");
11 }
12
13 function init($host) {
14 $this->link = $host->get_link();
15 $this->host = $host;
16
17 $host->add_hook($host::HOOK_ARTICLE_FILTER, $this);
18 }
19
20 function hook_article_filter($article) {
21 $owner_uid = $article["owner_uid"];
22
23 if (strpos($article["link"], "penny-arcade.com") !== FALSE && strpos($article["title"], "Comic:") !== FALSE &&
24 strpos($article["guid"], "pennyarcade,$owner_uid:") === FALSE) {
25
26 $doc = new DOMDocument();
27 @$doc->loadHTML(fetch_file_contents($article["link"]));
28
29 $basenode = false;
30
31 if ($doc) {
32 $xpath = new DOMXPath($doc);
33 $entries = $xpath->query('(//img[@src])'); // we might also check for img[@class='strip'] I guess...
34
35 $matches = array();
36
37 foreach ($entries as $entry) {
38
39 if (preg_match("/(http:\/\/art.penny-arcade.com\/.*)/i", $entry->getAttribute("src"), $matches)) {
40
41 $basenode = $entry;
42 break;
43 }
44 }
45
46 if ($basenode) {
47 $article["content"] = $doc->saveXML($basenode, LIBXML_NOEMPTYTAG);
48 }
49 }
50
51 $article["guid"] = "pennyarcade,$owner_uid:" . $article["guid"];
52 }
53
54 return $article;
55 }
56 }
57 ?>