gyang
committed
on 30 May 04
Use ns_encodingforcharset to find Tcl encoding name in feed_parser::parse_feed.
openacs-4/.../tcl/feed-parser-procs.tcl (+14 -2)
48 48 } {
49 49     set items [$doc_node selectNodes {//*[local-name()='item' or local-name()='entry']}]
50 50     return $items
51 51 }
52 52
53 53 ad_proc -private feed_parser::item_parse {
54 54     {-item_node:required}
55 55 } {
56 56     Takes a tDOM node which is supposed to represent an RSS item,
57 57     and returns a list with the RSS/RDF elements of that node.
58 58
59 59     @author Simon Carstensen
60 60     @author Guan Yang (guan@unicast.org)
61 61 } {
62 62     set title ""
63 63     set link ""
64 64     set guid ""
65 65     set permalink_p false
66 66     set description ""
67 67     set content_encoded ""
  68     set comments ""
  69     set author ""
68 70
69 71     feed_parser::dom::set_child_text -node $item_node -child title
70 72     feed_parser::dom::set_child_text -node $item_node -child link
71 73     feed_parser::dom::set_child_text -node $item_node -child guid
72 74     feed_parser::dom::set_child_text -node $item_node -child description
  75     feed_parser::dom::set_child_text -node $item_node -child comments
  76     feed_parser::dom::set_child_text -node $item_node -child author
  77     feed_parser::dom::set_child_text -node $item_node -child pubDate
73 78    
  79     set pub_date_rfc822 $pubDate
  80     feed_parser::dom::set_child_text -node $item_node -child pubDate
  81     if { $pub_date_rfc822 eq "" ||
  82          [catch {set pub_date [clock scan $pub_date_rfc822]}] } {
  83         set pub_date {}
  84     }
  85        
74 86     set maybe_atom_p 0
75 87    
76 88     # Try to handle Atom link
77 89     if { [string equal $link ""] } {
78 90         set link_attr [$item_node selectNodes {*[local-name()='link']/@href}]
79 91         if { [llength $link_attr] == 1 } {
80 92             set link [lindex [lindex $link_attr 0] 1]
81 93             set maybe_atom_p 1
82 94         }
83 95     }
84 96
85 97     set encoded_nodes [$item_node selectNodes {*[local-name()='encoded' and namespace-uri()='http://purl.org/rss/1.0/modules/content/']}]
86 98     if { [llength $encoded_nodes] == 1 } {
87 99         set encoded_node [lindex $encoded_nodes 0]
88 100             set content_encoded [$encoded_node text]
89 101     }
90 102
91 103     if { [llength [$item_node selectNodes "*\[local-name()='guid'\]"]] } {
92 104         # If guid exists, we assume that it's a permalink
93 105         set permalink_p true
 
125 137             }
126 138         }
127 139     }
128 140    
129 141     # For Atom, description is summary, content is content_encoded
130 142     if { $maybe_atom_p } {
131 143         feed_parser::dom::set_child_text -node $item_node -child summary
132 144         if { [info exists summary] } {
133 145             set description $summary
134 146         }
135 147        
136 148         feed_parser::dom::set_child_text -node $item_node -child content
137 149         if { [info exists content] } {
138 150             set content_encoded $content
139 151         }
140 152     }
141 153
142 154     #remove unsafe html
143 155     set description [feed_parser::remove_unsafe_html -html $description]
144 156
145       return [list title $title link $link guid $guid permalink_p $permalink_p description $description content_encoded $content_encoded]
  157     return [list title $title link $link guid $guid permalink_p $permalink_p description $description content_encoded $content_encoded author $author comments $comments pub_date $pub_date]
146 158 }
147 159
148 160 ad_proc -private feed_parser::channel_parse {
149 161     {-channel_node:required}
150 162 } {
151 163     Takes a tDOM node which is supposed to represent an RSS
152 164     channel, and returns a list with the RSS/RDF elements
153 165     of that node. This proc should later be extended to
154 166     support Dublin Core elements and other funk.
155 167
156 168     @author Guan Yang (guan@unicast.org)
157 169     @creation-date 2003-07-03
158 170 } {
159 171     set properties [list title link description language copyright lastBuildDate docs generator managingEditor webMaster]
160 172
161 173     foreach property $properties {
162 174         set $property ""
163 175             feed_parser::dom::set_child_text -node $channel_node -child $property
164 176         set channel($property) [set $property]
165 177     }