ruby--ruby/sample/rss/tdiary_plugin/rss-recent.rb

214 lines
4.7 KiB
Ruby
Raw Normal View History

# rss-recent.rb: RSS recent plugin
#
# rss_recnet: show recnet list from RSS
# parameters (default):
# url: URL of RSS
# max: max of list itmes(5)
# cache_time: cache time(second) of RSS(60*60)
#
#
# Copyright (c) 2003-2004 Kouhei Sutou <kou@cozmixng.org>
# Distributed under the GPL
#
require "rss/rss"
RSS_RECENT_FIELD_SEPARATOR = "\0"
RSS_RECENT_ENTRY_SEPARATOR = "\1"
RSS_RECENT_VERSION = "0.0.5"
RSS_RECENT_HTTP_HEADER = {
"User-Agent" => "tDiary RSS recent plugin version #{RSS_RECENT_VERSION}. " <<
"Using RSS parser version is #{::RSS::VERSION}.",
}
def rss_recent(url, max=5, cache_time=3600)
url.untaint
cache_file = "#{@cache_path}/rss-recent.#{CGI.escape(url)}"
rss_recent_cache_rss(url, cache_file, cache_time.to_i)
return '' unless test(?r, cache_file)
rv = "<ul>\n"
i = 0
rss_recent_read_from_cache(cache_file).each do |title, url, time|
break if i >= max
next if title.nil?
rv << '<li>'
rv << %Q[<span class="#{rss_recent_modified_class(time)}">]
unless url.nil?
rv << %Q[<a href="#{CGI.escapeHTML(url)}" title="#{CGI.escapeHTML(title)}]
rv << %Q[ (#{CGI.escapeHTML(time.localtime.to_s)})] unless time.nil?
rv << %Q[">]
end
rv << CGI::escapeHTML(title)
rv << '</a>' unless url.nil?
rv << "(#{rss_recent_modified(time)})"
rv << %Q[</span>]
rv << "</li>\n"
i += 1
end
rv << "</ul>\n"
rv
end
class InvalidResourceError < StandardError; end
def rss_recent_cache_rss(url, cache_file, cache_time)
cached_time = nil
cached_time = File.mtime(cache_file) if File.exist?(cache_file)
if cached_time.nil? or Time.now > cached_time + cache_time
require 'time'
require 'open-uri'
require 'net/http'
require 'uri/generic'
require 'rss/parser'
require 'rss/1.0'
require 'rss/2.0'
require 'rss/dublincore'
begin
uri = URI.parse(url)
raise URI::InvalidURIError if uri.scheme != "http"
rss_source = rss_recent_fetch_rss(uri, cached_time)
raise InvalidResourceError if rss_source.nil?
# parse RSS
rss = ::RSS::Parser.parse(rss_source, false)
raise ::RSS::Error if rss.nil?
# pre processing
begin
rss.output_encoding = @conf.charset || charset
rescue ::RSS::UnknownConversionMethodError
end
rss_infos = rss.items.collect do |item|
rss_recent_pubDate_to_dc_date(item)
[item.title, item.link, item.dc_date]
end
rss_recent_write_to_cache(cache_file, rss_infos)
rescue URI::InvalidURIError
rss_recent_write_to_cache(cache_file, [['Invalid URI', url]])
rescue InvalidResourceError, ::RSS::Error
rss_recent_write_to_cache(cache_file, [['Invalid Resource', url]])
end
end
end
def rss_recent_fetch_rss(uri, cache_time)
rss = nil
begin
uri.open(rss_recent_http_header(cache_time)) do |f|
case f.status.first
when "200"
rss = f.read
# STDERR.puts "Got RSS of #{uri}"
when "304"
# not modified
# STDERR.puts "#{uri} does not modified"
else
raise InvalidResourceError
end
end
rescue TimeoutError, SocketError, StandardError,
SecurityError # occured in redirect
raise InvalidResourceError
end
rss
end
def rss_recent_http_header(cache_time)
header = RSS_RECENT_HTTP_HEADER.dup
if cache_time.respond_to?(:rfc2822)
header["If-Modified-Since"] = cache_time.rfc2822
end
header
end
def rss_recent_write_to_cache(cache_file, rss_infos)
File.open(cache_file, 'w') do |f|
f.flock(File::LOCK_EX)
rss_infos.each do |info|
f << info.join(RSS_RECENT_FIELD_SEPARATOR)
f << RSS_RECENT_ENTRY_SEPARATOR
end
f.flock(File::LOCK_UN)
end
end
def rss_recent_read_from_cache(cache_file)
require 'time'
infos = []
File.open(cache_file) do |f|
while info = f.gets(RSS_RECENT_ENTRY_SEPARATOR)
info = info.chomp(RSS_RECENT_ENTRY_SEPARATOR)
infos << info.split(RSS_RECENT_FIELD_SEPARATOR)
end
end
infos.collect do |title, url, time|
[
rss_recent_convert(title),
rss_recent_convert(url),
rss_recent_convert(time) {|time| Time.parse(time)},
]
end
end
def rss_recent_convert(str)
if str.nil? or str.empty?
nil
else
if block_given?
yield str
else
str
end
end
end
# from RWiki
def rss_recent_modified(t)
return '-' unless t
dif = (Time.now - t).to_i
dif = dif / 60
return "#{dif}m" if dif <= 60
dif = dif / 60
return "#{dif}h" if dif <= 24
dif = dif / 24
return "#{dif}d"
end
# from RWiki
def rss_recent_modified_class(t)
return 'dangling' unless t
dif = (Time.now - t).to_i
dif = dif / 60
return "modified-hour" if dif <= 60
dif = dif / 60
return "modified-today" if dif <= 24
dif = dif / 24
return "modified-month" if dif <= 30
return "modified-year" if dif <= 365
return "modified-old"
end
def rss_recent_pubDate_to_dc_date(target)
if target.respond_to?(:pubDate)
class << target
alias_method(:dc_date, :pubDate)
end
end
end