OSDN Git Service

added sn_uploader
[tdcgexplorer/nimono-crawlers.git] / bin / mmdacc2-idx.rb
1 #!/usr/bin/ruby
2 # download from mikumikudance
3 # http://www9.atpages.jp/~mmdaccessory/uploader2/index.html
4
5 $LOAD_PATH.unshift File.expand_path(File.dirname(__FILE__) + '/../lib')
6 require 'sn_uploader'
7
# Yields the name of every uploaded file linked from the uploader index page.
#
# Each href="..." attribute in +text+ is checked against the uploader's
# per-file page URL (<src dir>/<name>.html); for every match, <name>
# (the part between the src directory and the trailing ".html") is yielded.
#
# The URL pattern is deliberately left unanchored and greedy, so an href that
# merely contains the file URL still matches and the name extends up to the
# last ".html" in the href.
#
# @param text [String] HTML source to scan for links
# @yieldparam filename [String] file name without the ".html" suffix
# @return [Enumerator] when called without a block; otherwise whatever
#   String#scan returns for the block form
def each_filename(text)
  # Without a block there is nothing to yield to; hand back an Enumerator
  # instead of raising LocalJumpError on the first matching link.
  return enum_for(:each_filename, text) unless block_given?

  file_href = 'http://www9.atpages.jp/~mmdaccessory/uploader2/src/'
  file_re = Regexp.new(Regexp.escape(file_href) + '(.+)\.html')
  # scan yields one array of capture groups per match; unpack the only group.
  text.scan(/href="(.+?)"/) do |(href)|
    md = file_re.match(href)
    yield md[1] if md
  end
end
17
# Configure the uploader client for the mmdaccessory "uploader2" site and
# mirror its files into ../arc/mmdacc2 (relative to this script).
uploader = SnUploader.new
uploader.host      = "www9.atpages.jp"
uploader.root_path = "/~mmdaccessory/uploader2"
uploader.local_dir = "#{File.dirname(__FILE__)}/../arc/mmdacc2"
uploader.base_html = "index.html"

# Fetch the index page, then report every linked file and download the ones
# that are not yet present locally.
index_html = uploader.get_base
each_filename(index_html) do |name|
  already_have = uploader.local_file_exist?(name)
  status = already_have ? 'exist' : 'download'
  puts "#{name}\t#{status}"
  next if already_have

  uploader.download_file_through_counter(name)
end