]> git.wh0rd.org - tt-rss.git/blame - classes/feeditem/rss.php
parser: properly support tag subtrees instead of text content for article content
[tt-rss.git] / classes / feeditem / rss.php
CommitLineData
04d2f9c8 1<?php
b4d16900 2class FeedItem_RSS extends FeedItem_Common {
04d2f9c8 3 function get_id() {
b09a4cdc
AD
4 $id = $this->elem->getElementsByTagName("guid")->item(0);
5
6 if ($id) {
7 return $id->nodeValue;
8 } else {
9 return $this->get_link();
10 }
04d2f9c8
AD
11 }
12
13 function get_date() {
14 $pubDate = $this->elem->getElementsByTagName("pubDate")->item(0);
15
16 if ($pubDate) {
17 return strtotime($pubDate->nodeValue);
18 }
ce5d234d
AD
19
20 $date = $this->xpath->query("dc:date", $this->elem)->item(0);
21
22 if ($date) {
23 return strtotime($date->nodeValue);
24 }
04d2f9c8
AD
25 }
26
27 function get_link() {
df2655e0 28 $links = $this->xpath->query("atom:link", $this->elem);
04d2f9c8 29
df2655e0
AD
30 foreach ($links as $link) {
31 if ($link && $link->hasAttribute("href") &&
32 (!$link->hasAttribute("rel")
33 || $link->getAttribute("rel") == "alternate"
34 || $link->getAttribute("rel") == "standout")) {
35
31bd6f76 36 return trim($link->getAttribute("href"));
df2655e0 37 }
04d2f9c8 38 }
f7d64d03 39
042003d5
AD
40 $link = $this->elem->getElementsByTagName("guid")->item(0);
41
42 if ($link && $link->hasAttributes() && $link->getAttribute("isPermaLink") == "true") {
31bd6f76 43 return trim($link->nodeValue);
042003d5
AD
44 }
45
2f6b75d5 46 $link = $this->elem->getElementsByTagName("link")->item(0);
f7d64d03
AD
47
48 if ($link) {
31bd6f76 49 return trim($link->nodeValue);
f7d64d03 50 }
04d2f9c8
AD
51 }
52
53 function get_title() {
2b4853f5 54 $title = $this->xpath->query("title", $this->elem)->item(0);
04d2f9c8 55
2b4853f5 56 if ($title) {
57 return trim($title->nodeValue);
04d2f9c8 58 }
206326c2
AD
59
60 // if the document has a default namespace then querying for
61 // title would fail because of reasons so let's try the old way
62 $title = $this->elem->getElementsByTagName("title")->item(0);
63
64 if ($title) {
65 return trim($title->nodeValue);
66 }
04d2f9c8
AD
67 }
68
69 function get_content() {
f6c61b2d
AD
70 $contentA = $this->xpath->query("content:encoded", $this->elem)->item(0);
71 $contentB = $this->elem->getElementsByTagName("description")->item(0);
04d2f9c8 72
f6c61b2d 73 if ($contentA && !$contentB) {
7d1e15c3 74 return $this->subtree_or_text($contentA);
04d2f9c8 75 }
8a95d630 76
d2bb392b 77
f6c61b2d 78 if ($contentB && !$contentA) {
7d1e15c3 79 return $this->subtree_or_text($contentB);
f6c61b2d
AD
80 }
81
82 if ($contentA && $contentB) {
7d1e15c3
AD
83 $resultA = $this->subtree_or_text($contentA);
84 $resultB = $this->subtree_or_text($contentB);
85
86 return mb_strlen($resultA) > mb_strlen($resultB) ? $resultA : $resultB;
8a95d630 87 }
04d2f9c8
AD
88 }
89
90 function get_description() {
91 $summary = $this->elem->getElementsByTagName("description")->item(0);
92
93 if ($summary) {
d2bb392b 94 return $summary->nodeValue;
04d2f9c8
AD
95 }
96 }
97
04d2f9c8
AD
98 function get_categories() {
99 $categories = $this->elem->getElementsByTagName("category");
100 $cats = array();
101
102 foreach ($categories as $cat) {
31bd6f76 103 array_push($cats, trim($cat->nodeValue));
04d2f9c8
AD
104 }
105
d4992d6b
AD
106 $categories = $this->xpath->query("dc:subject", $this->elem);
107
108 foreach ($categories as $cat) {
31bd6f76 109 array_push($cats, trim($cat->nodeValue));
d4992d6b
AD
110 }
111
04d2f9c8
AD
112 return $cats;
113 }
114
115 function get_enclosures() {
116 $enclosures = $this->elem->getElementsByTagName("enclosure");
117
118 $encs = array();
119
120 foreach ($enclosures as $enclosure) {
121 $enc = new FeedEnclosure();
122
123 $enc->type = $enclosure->getAttribute("type");
124 $enc->link = $enclosure->getAttribute("url");
125 $enc->length = $enclosure->getAttribute("length");
523bd90b
FE
126 $enc->height = $enclosure->getAttribute("height");
127 $enc->width = $enclosure->getAttribute("width");
04d2f9c8
AD
128
129 array_push($encs, $enc);
130 }
131
ed449a9a 132 $enclosures = $this->xpath->query("media:content", $this->elem);
4289b68f
AD
133
134 foreach ($enclosures as $enclosure) {
135 $enc = new FeedEnclosure();
136
137 $enc->type = $enclosure->getAttribute("type");
138 $enc->link = $enclosure->getAttribute("url");
139 $enc->length = $enclosure->getAttribute("length");
523bd90b
FE
140 $enc->height = $enclosure->getAttribute("height");
141 $enc->width = $enclosure->getAttribute("width");
4289b68f 142
5c54e683
AD
143 $desc = $this->xpath->query("media:description", $enclosure)->item(0);
144 if ($desc) $enc->title = strip_tags($desc->nodeValue);
145
4289b68f
AD
146 array_push($encs, $enc);
147 }
148
ed449a9a
JT
149
150 $enclosures = $this->xpath->query("media:group", $this->elem);
151
152 foreach ($enclosures as $enclosure) {
153 $enc = new FeedEnclosure();
154
155 $content = $this->xpath->query("media:content", $enclosure)->item(0);
156
2ab7ccb6
AD
157 if ($content) {
158 $enc->type = $content->getAttribute("type");
159 $enc->link = $content->getAttribute("url");
160 $enc->length = $content->getAttribute("length");
523bd90b
FE
161 $enc->height = $content->getAttribute("height");
162 $enc->width = $content->getAttribute("width");
2ab7ccb6
AD
163
164 $desc = $this->xpath->query("media:description", $content)->item(0);
165 if ($desc) {
166 $enc->title = strip_tags($desc->nodeValue);
167 } else {
168 $desc = $this->xpath->query("media:description", $enclosure)->item(0);
169 if ($desc) $enc->title = strip_tags($desc->nodeValue);
170 }
171
172 array_push($encs, $enc);
ed449a9a 173 }
ed449a9a
JT
174 }
175
e23aedd4
AD
176 $enclosures = $this->xpath->query("media:thumbnail", $this->elem);
177
178 foreach ($enclosures as $enclosure) {
179 $enc = new FeedEnclosure();
180
181 $enc->type = "image/generic";
182 $enc->link = $enclosure->getAttribute("url");
523bd90b
FE
183 $enc->height = $enclosure->getAttribute("height");
184 $enc->width = $enclosure->getAttribute("width");
e23aedd4
AD
185
186 array_push($encs, $enc);
187 }
188
04d2f9c8
AD
189 return $encs;
190 }
191
04d2f9c8
AD
192}
193?>