cosmere-books/oathbringer-reread.rb

74 lines
2.6 KiB
Ruby

require 'date'
require 'fileutils'
require 'nokogiri'
require_relative './methods'
FileUtils.mkdir_p('oathbringer-reread')
BASE = 'https://www.tor.com'.freeze
links = [
"/2018/01/25/introducing-the-oathbringer-reread/",
"/2018/02/01/oathbringer-reread-prologue/",
"/2018/02/08/oathbringer-reread-chapter-one/",
"/2018/02/15/oathbringer-reread-chapter-two/",
"/2018/02/22/oathbringer-reread-chapter-three/",
"/2018/03/01/oathbringer-reread-chapter-four/",
"/2018/03/08/oathbringer-reread-chapters-five-and-six/",
"/2018/03/15/oathbringer-reread-chapter-seven/",
"/2018/03/22/oathbringer-reread-chapters-eight-and-nine/",
"/2018/03/29/oathbringer-reread-chapter-ten/",
"/2018/04/05/oathbringer-reread-chapter-eleven/",
"/2018/04/12/oathbringer-reread-chapter-12/",
"/2018/04/19/oathbringer-reread-chapter-thirteen/",
"/2018/04/26/oathbringer-reread-chapters-fourteen-and-fifteen/",
"/2018/05/03/oathbringer-reread-chapter-16/",
"/2018/05/10/oathbringer-reread-chapter-seventeen/",
"/2018/05/17/oathbringer-reread-chapter-eighteen/",
"/2018/05/24/oathbringer-reread-chapters-19-and-20-brandon-sanderson/",
"/2018/05/31/oathbringer-reread-chapters-twenty-one-and-twenty-two/",
"/2018/06/07/oathbringer-reread-chapters-twenty-three-and-twenty-four/",
"/2018/06/14/oathbringer-reread-chapter-twenty-five/",
"/2018/06/21/oathbringer-reread-chapters-twenty-six-and-twenty-seven/",
"/2018/06/28/oathbringer-reread-chapter-twenty-eight/",
"/2018/07/05/oathbringer-reread-chapters-twenty-nine-and-thirty/",
"/2018/07/12/oathbringer-reread-chapters-thirty-one-and-thirty-two/",
"/2018/07/19/oathbringer-reread-interludes-one-two-and-three/",
"/2018/07/26/oathbringer-reread-chapter-thirty-three/"
]
episode = 1
links.each do |link|
url = BASE + link
puts "Download #{url}"
unless File.exist? "wor/#{episode}.html"
`wget --no-clobber "#{url}" --output-document "oathbringer-reread/#{episode}.html" -o /dev/null`
end
episode += 1
end
# Now we have all the files
html = ''
for i in 1..(links.length)
complete_html = Nokogiri::HTML(open("oathbringer-reread/#{i}.html"))
page = complete_html.css('.entry-content')
title = complete_html.css('.entry-title>a').inner_html
ending = false
page.children.each do |e|
ending = true if e.class?('squib') || e.class?('post-end-spacer')
e.remove if ending
end
html += "<h1>#{title}</h1>"
html += page.inner_html
url = BASE + links[i - 1]
html += "<p>Visit <a href='#{url}'>tor.com</a> for discussion.</p>"
end
File.open('books/oathbringer-reread.html', 'w') { |file| file.write(html) }
puts '[html] Generated HTML file'
generate('oathbringer-reread', :all)