diff --git a/.gitignore b/.gitignore index 9f74db7..48d36d8 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,5 @@ /wok/*.html /wor/*.html /oathbringer/*.html +/edgedancer/*.html /books/* diff --git a/covers/edgedancer-reread.jpg b/covers/edgedancer-reread.jpg new file mode 100644 index 0000000..bfde8e9 Binary files /dev/null and b/covers/edgedancer-reread.jpg differ diff --git a/covers/edgedancer-reread.pdf b/covers/edgedancer-reread.pdf new file mode 100644 index 0000000..c3eaf56 Binary files /dev/null and b/covers/edgedancer-reread.pdf differ diff --git a/edgedancer-reread.rb b/edgedancer-reread.rb new file mode 100644 index 0000000..043df6e --- /dev/null +++ b/edgedancer-reread.rb @@ -0,0 +1,50 @@ +require 'date' +require 'fileutils' +require 'nokogiri' +require_relative './methods' + +FileUtils.mkdir_p('edgedancer') + +BASE = 'https://www.tor.com/'.freeze + +links = [ + "2017/08/24/edgedancer-reread-chapter-1/", + "2017/08/31/edgedancer-reread-chapter-2/", + "2017/09/07/edgedancer-reread-chapters-3-and-4/", + "2017/09/14/edgedancer-reread-chapters-5-and-6/" +] + +episode = 1 + +links.each do |link| + url = BASE + link + puts "Download #{url}" + unless File.exist? "edgedancer/#{episode}.html" + `wget --no-clobber "#{url}" --output-document "edgedancer/#{episode}.html" -o /dev/null` + end + episode += 1 +end + +# Now we have all the files +html = '' +for i in 1..(links.length) + complete_html = Nokogiri::HTML(open("edgedancer/#{i}.html")) + page = complete_html.css('.entry-content') + title = complete_html.css('.entry-title>a').inner_html + ending = false + page.children.each do |e| + ending = true if e.class? 'squib' + e.remove if ending + end + html += "

#{title}

" + html += page.inner_html + + url = BASE + links[i - 1] + + html += "

Visit tor.com for discussion.

" +end + +File.open('books/edgedancer-reread.html', 'w') { |file| file.write(html) } +puts '[html] Generated HTML file' + +generate('edgedancer-reread', :all) diff --git a/metadata/edgedancer-reread.xml b/metadata/edgedancer-reread.xml new file mode 100644 index 0000000..0953eab --- /dev/null +++ b/metadata/edgedancer-reread.xml @@ -0,0 +1,5 @@ +Edgedancer Reread +2017-09-14 +en-US +Alice Arneson +Lyndsey Luther diff --git a/wok-reread.rb b/wok-reread.rb index d9a4903..6cafc30 100644 --- a/wok-reread.rb +++ b/wok-reread.rb @@ -94,7 +94,7 @@ for i in 1..(links.length) html += "

#{title}

" html += page.inner_html - url = links[i - 1] + url = BASE + links[i - 1] html += "

Visit tor.com for discussion.

" end diff --git a/wor-reread.rb b/wor-reread.rb index f872644..e224047 100644 --- a/wor-reread.rb +++ b/wor-reread.rb @@ -140,7 +140,7 @@ for i in 1..(links.length) html += "

#{title}

" html += page.inner_html - url = links[i - 1] + url = BASE + links[i - 1] html += "

Visit tor.com for discussion.

" end