| |
48 |
48 |
} { |
| |
49 |
49 |
set items [$doc_node selectNodes {//*[local-name()='item' or local-name()='entry']}] |
| |
50 |
50 |
return $items |
| |
51 |
51 |
} |
| |
52 |
52 |
|
| |
53 |
53 |
ad_proc -private feed_parser::item_parse { |
| |
54 |
54 |
{-item_node:required} |
| |
55 |
55 |
} { |
| |
56 |
56 |
Takes a tDOM node which is supposed to represent an RSS item, |
| |
57 |
57 |
and returns a list with the RSS/RDF elements of that node. |
| |
58 |
58 |
|
| |
59 |
59 |
@author Simon Carstensen |
| |
60 |
60 |
@author Guan Yang (guan@unicast.org) |
| |
61 |
61 |
} { |
| |
62 |
62 |
set title "" |
| |
63 |
63 |
set link "" |
| |
64 |
64 |
set guid "" |
| |
65 |
65 |
set permalink_p false |
| |
66 |
66 |
set description "" |
| |
67 |
67 |
set content_encoded "" |
| |
|
68 |
set comments "" |
| |
|
69 |
set author "" |
| |
68 |
70 |
|
| |
69 |
71 |
feed_parser::dom::set_child_text -node $item_node -child title |
| |
70 |
72 |
feed_parser::dom::set_child_text -node $item_node -child link |
| |
71 |
73 |
feed_parser::dom::set_child_text -node $item_node -child guid |
| |
72 |
74 |
feed_parser::dom::set_child_text -node $item_node -child description |
| |
|
75 |
feed_parser::dom::set_child_text -node $item_node -child comments |
| |
|
76 |
feed_parser::dom::set_child_text -node $item_node -child author |
| |
|
77 |
feed_parser::dom::set_child_text -node $item_node -child pubDate |
| |
73 |
78 |
|
| |
|
79 |
set pub_date_rfc822 $pubDate |
| |
|
80 |
feed_parser::dom::set_child_text -node $item_node -child pubDate |
| |
|
81 |
if { $pub_date_rfc822 eq "" || |
| |
|
82 |
[catch {set pub_date [clock scan $pub_date_rfc822]}] } { |
| |
|
83 |
set pub_date {} |
| |
|
84 |
} |
| |
|
85 |
|
| |
74 |
86 |
set maybe_atom_p 0 |
| |
75 |
87 |
|
| |
76 |
88 |
# Try to handle Atom link |
| |
77 |
89 |
if { [string equal $link ""] } { |
| |
78 |
90 |
set link_attr [$item_node selectNodes {*[local-name()='link']/@href}] |
| |
79 |
91 |
if { [llength $link_attr] == 1 } { |
| |
80 |
92 |
set link [lindex [lindex $link_attr 0] 1] |
| |
81 |
93 |
set maybe_atom_p 1 |
| |
82 |
94 |
} |
| |
83 |
95 |
} |
| |
84 |
96 |
|
| |
85 |
97 |
set encoded_nodes [$item_node selectNodes {*[local-name()='encoded' and namespace-uri()='http://purl.org/rss/1.0/modules/content/']}] |
| |
86 |
98 |
if { [llength $encoded_nodes] == 1 } { |
| |
87 |
99 |
set encoded_node [lindex $encoded_nodes 0] |
| |
88 |
100 |
set content_encoded [$encoded_node text] |
| |
89 |
101 |
} |
| |
90 |
102 |
|
| |
91 |
103 |
if { [llength [$item_node selectNodes "*\[local-name()='guid'\]"]] } { |
| |
92 |
104 |
# If guid exists, we assume that it's a permalink |
| |
93 |
105 |
set permalink_p true |
|
| |
125 |
137 |
} |
| |
126 |
138 |
} |
| |
127 |
139 |
} |
| |
128 |
140 |
|
| |
129 |
141 |
# For Atom, description is summary, content is content_encoded |
| |
130 |
142 |
if { $maybe_atom_p } { |
| |
131 |
143 |
feed_parser::dom::set_child_text -node $item_node -child summary |
| |
132 |
144 |
if { [info exists summary] } { |
| |
133 |
145 |
set description $summary |
| |
134 |
146 |
} |
| |
135 |
147 |
|
| |
136 |
148 |
feed_parser::dom::set_child_text -node $item_node -child content |
| |
137 |
149 |
if { [info exists content] } { |
| |
138 |
150 |
set content_encoded $content |
| |
139 |
151 |
} |
| |
140 |
152 |
} |
| |
141 |
153 |
|
| |
142 |
154 |
#remove unsafe html |
| |
143 |
155 |
set description [feed_parser::remove_unsafe_html -html $description] |
| |
144 |
156 |
|
| |
145 |
|
return [list title $title link $link guid $guid permalink_p $permalink_p description $description content_encoded $content_encoded] |
| |
|
157 |
return [list title $title link $link guid $guid permalink_p $permalink_p description $description content_encoded $content_encoded author $author comments $comments pub_date $pub_date] |
| |
146 |
158 |
} |
| |
147 |
159 |
|
| |
148 |
160 |
ad_proc -private feed_parser::channel_parse { |
| |
149 |
161 |
{-channel_node:required} |
| |
150 |
162 |
} { |
| |
151 |
163 |
Takes a tDOM node which is supposed to represent an RSS |
| |
152 |
164 |
channel, and returns a list with the RSS/RDF elements |
| |
153 |
165 |
of that node. This proc should later be extended to |
| |
154 |
166 |
support Dublin Core elements and other funk. |
| |
155 |
167 |
|
| |
156 |
168 |
@author Guan Yang (guan@unicast.org) |
| |
157 |
169 |
@creation-date 2003-07-03 |
| |
158 |
170 |
} { |
| |
159 |
171 |
set properties [list title link description language copyright lastBuildDate docs generator managingEditor webMaster] |
| |
160 |
172 |
|
| |
161 |
173 |
foreach property $properties { |
| |
162 |
174 |
set $property "" |
| |
163 |
175 |
feed_parser::dom::set_child_text -node $channel_node -child $property |
| |
164 |
176 |
set channel($property) [set $property] |
| |
165 |
177 |
} |