22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
|
# File 'lib/ape/feed.rb', line 22
def Feed.read(uri, name, reporter, report = true)
Feed.reporter = reporter
entries = []
uris = []
next_page = uri
page_num = 1
while (next_page) && (page_num < 10) do
label = "Page #{page_num} of #{name}"
uris << next_page
page = check_resource(next_page, label, Names::AtomMediaType, report)
break unless page
Validator.instance(:schema, reporter).validate(:schema => Samples.atom_RNC,
:title => label, :doc => page) if report
error = "not well-formed"
feed = nil
begin
feed = REXML::Document.new(page.body, { :raw => nil })
rescue Exception
error = $!.to_s
feed = nil
end
if feed == nil
reporter.error(self, "Can't parse #{label} at #{next_page}, Parser said: #{$!}") if report
break
end
feed = feed.root
if feed == nil
reporter.warning(self, "#{label} is empty.")
break
end
page_entries = REXML::XPath.match(feed, "./atom:entry", Names::XmlNamespaces)
if page_entries.empty? && report
reporter.info(self, "#{label} has no entries.")
end
entries += page_entries.map { |e| Entry.new(:xml => e, :uri => next_page)}
next_link = REXML::XPath.first(feed, "./atom:link[@rel=\"next\"]", Names::XmlNamespaces)
if next_link
next_link = next_link.attributes['href']
base = AtomURI.new(next_page)
next_link = base.absolutize(next_link, feed)
if uris.index(next_link)
reporter.error(self, "Collection contains circular 'next' linkage: #{next_link}") if report
break
end
page_num += 1
end
next_page = next_link
end
if report && next_page
reporter.warning(self, "Stopped reading collection after #{page_num} pages.")
end
return entries unless report
last_date = nil
with_app_date = 0
clean = true
entries.each do |e|
datestr = e.child_content("edited", Names::AppNamespace)
error = nil
if datestr
if datestr =~ /\d\d\d\d-\d\d-\d\dT\d\d:\d\d:\d\d(\.\d+)?(Z|([-+]\d\d:\d\d))/
begin
date = Time.parse(datestr)
with_app_date += 1
if last_date && (date > last_date)
error = "app:edited values out of order, d #{date} ld #{last_date}"
end
last_date = date
rescue ArgumentError
error = "invalid app:edited value: #{datestr}"
end
else
error = "invalid app:edited child: #{datestr}"
end
if error
title = e.child_content "title"
reporter.error(self, "In entry with title '#{title}', #{error}.")
clean = false
end
end
end
if with_app_date < entries.size
reporter.error(self, "#{entries.size - with_app_date} of #{entries.size} entries in #{name} lack app:edited elements.")
clean = false
end
reporter.success(self, "#{name} has correct app:edited value order.") if clean
entries
end
|