-
Notifications
You must be signed in to change notification settings - Fork 0
/
therealist.rb
50 lines (35 loc) · 1.75 KB
/
therealist.rb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
require 'rubygems'
require 'open-uri'
#downloads a "The Realist" issue you choose to your disk
DATA_DIR = "the_realist"
Dir.mkdir(DATA_DIR) unless File.exists?(DATA_DIR)
BASE_realist_URL = "http://www.ep.tc/realist/" #this is the site where the issues are
puts "issue"
issue = gets.chomp
puts "total pages"
total_pages = gets.chomp #I have to set the number of pages of the issue, since it varies from one to the other.
page = BASE_realist_URL + issue + "/" #"page" is the webpage where the specified issue is. (ex: issue one is in
#http://www.ep.tc/realist/01)
ISSUE_DIR = DATA_DIR + "/" + issue
Dir.mkdir(ISSUE_DIR) unless File.exists?(ISSUE_DIR) #creates folder to store the issue on the DATA_DIR and gives it the
#name of the issue
puts "Creating #{ISSUE_DIR} folder"
for number in 1..9 # this loop downloads the first 9 pages of the issue
pagina = page + "0" + number.to_s + ".jpg" # this defines a specific page of the magazine, starting with 1,
#it directs to the url where the .jpg file with the scan can be found. the format of the first 9 pages
#of each issue is "00", so, when I'm converting it to string (with ".to_s", I need to add a zero)
puts "Downloading page #{number}"
open(pagina) {|f|
File.open("#{ISSUE_DIR}/#{number}.jpg","wb") do |file|
file.puts f.read #creates a file with the page number and writes the image there
end }
end
for number in 10..total_pages.to_i #to_i turns the number I set before from a string to an integer.
pagina = page + number.to_s + ".jpg" #we don't need to add the "0" anymore, since all page number have two digits now.
puts "Downloading page #{number}"
open(pagina) {|f|
File.open("#{ISSUE_DIR}/#{number}.jpg","wb") do |file|
file.puts f.read
end }
end
puts "done"