blob: 990974d8f548f38efadf27a9359c50308cf9e6f9 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
|
#!/usr/bin/env ruby
require "nkf"
class String
# From tdiary.rb
def shorten( len = 120 )
lines = NKF::nkf( "-t -m0 -f#{len}", self.gsub( /\n/, ' ' ) ).split( /\n/ )
lines[0].concat( '...' ) if lines[0] and lines[1]
lines[0]
end
end
require "rss"
channels = {}
verbose = false
def error(exception)
mark = "=" * 20
mark = "#{mark} error #{mark}"
puts mark
puts exception.class
puts exception.message
puts exception.backtrace
puts mark
end
before_time = Time.now
ARGV.each do |fname|
if fname == '-v'
verbose = true
next
end
rss = nil
f = File.new(fname).read
begin
## do validate parse
rss = RSS::Parser.parse(f)
rescue RSS::InvalidRSSError
error($!) if verbose
## do non validate parse for invalid RSS 1.0
begin
rss = RSS::Parser.parse(f, false)
rescue RSS::Error
## invalid RSS.
error($!) if verbose
end
rescue RSS::Error
error($!) if verbose
end
if rss.nil?
puts "#{fname} does not include RSS 1.0 or 0.9x/2.0"
else
begin
rss.output_encoding = "utf-8"
rescue RSS::UnknownConversionMethodError
error($!) if verbose
end
rss = rss.to_rss("1.0") do |maker|
maker.channel.about ||= maker.channel.link
maker.channel.description ||= "No description"
maker.items.each do |item|
item.title ||= "No title"
item.link ||= "UNKNOWN"
end
end
next if rss.nil?
rss.items.each do |item|
channels[rss.channel.title] ||= []
channels[rss.channel.title] << item if item.description
end
end
end
processing_time = Time.now - before_time
channels.sort do |x, y|
x[0] <=> y[0]
end[0..20].each do |title, items|
puts "Channel: #{title}" unless items.empty?
items.sort do |x, y|
x.title <=> y.title
end[0..10].each do |item|
puts " Item: #{item.title.shorten(50)}"
puts " Description: #{item.description.shorten(50)}"
end
end
puts "Used XML parser: #{RSS::Parser.default_parser}"
puts "Processing time: #{processing_time}s"
|