summaryrefslogtreecommitdiff
path: root/sample/rss/list_description.rb
blob: edb9ba07a44c22cb27c0cb444b32b85e0efbf6bb (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
#!/usr/bin/env ruby

require "nkf"
class String
	# From tdiary.rb
	def shorten( len = 120 )
		lines = NKF::nkf( "-e -m0 -f#{len}", self.gsub( /\n/, ' ' ) ).split( /\n/ )
		lines[0].concat( '...' ) if lines[0] and lines[1]
		lines[0]
	end
end

require "rss/parser"
require "rss/1.0"
require "rss/2.0"
require "rss/dublincore"

channels = {}
verbose = false

def error(exception)
	mark = "=" * 20
	mark = "#{mark} error #{mark}"
	puts mark
	puts exception.class
	puts exception.message
	puts exception.backtrace
	puts mark
end

before_time = Time.now
ARGV.each do |fname|
	if fname == '-v'
		verbose = true
		next
	end
	rss = nil
	f = File.new(fname).read
	begin
		## do validate parse
		rss = RSS::Parser.parse(f)
	rescue RSS::InvalidRSSError
		error($!) if verbose
		## do non validate parse for invalid RSS 1.0
		begin
			rss = RSS::Parser.parse(f, false)
		rescue RSS::Error
			## invalid RSS.
			error($!) if verbose
		end
	rescue RSS::Error
		error($!) if verbose
	end
	if rss.nil?
		puts "#{fname} does not include RSS 1.0 or 0.9x/2.0"
	else
		begin
			rss.output_encoding = "euc-jp"
		rescue RSS::UnknownConversionMethodError
			error($!) if verbose
		end
		rss.channel.title ||= "Unknown"
		rss.items.each do |item|
			item.title ||= "Unknown"
			channels[rss.channel.title] ||= []
			channels[rss.channel.title] << item if item.description
		end
	end
end
processing_time = Time.now - before_time

channels.sort do |x, y|
	x[0] <=> y[0]
end[0..20].each do |title, items|
	puts "Channel : #{title}" unless items.empty?
	items.sort do |x, y|
		x.title <=> y.title
	end[0..10].each do |item|
		puts "  Item : #{item.title.shorten(50)}"
		puts "    Description : #{item.description.shorten(50)}"
	end
end

puts "Processing Time : #{processing_time}s"