Get snapshot result page per page index

This commit is contained in:
hartator
2016-09-24 10:04:57 -07:00
parent ec6aa17a07
commit 7eedc1a183

View File

@@ -1,20 +1,20 @@
module ArchiveAPI module ArchiveAPI
def get_raw_list_from_api url def get_raw_list_from_api url, page_index
request_url = "http://web.archive.org/cdx/search/xd?url=" request_url = "http://web.archive.org/cdx/search/xd?url="
request_url += url request_url += url
request_url += parameters_for_api request_url += parameters_for_api page_index
request_uri = URI.parse request_url request_uri = URI.parse request_url
response = Net::HTTP.get_response request_uri response = Net::HTTP.get_response request_uri
response.body response.body
end end
def parameters_for_api def parameters_for_api page_index
parameters = "&fl=timestamp,original&gzip=false" parameters = "&fl=timestamp,original&collapse=digest&gzip=false"
if @all if @all
parameters += "&collapse=digest" parameters += ""
else else
parameters += "&filter=statuscode:200&collapse=original" parameters += "&filter=statuscode:200"
end end
if @from_timestamp and @from_timestamp != 0 if @from_timestamp and @from_timestamp != 0
parameters += "&from=" + @from_timestamp.to_s parameters += "&from=" + @from_timestamp.to_s
@@ -22,6 +22,9 @@ module ArchiveAPI
if @to_timestamp and @to_timestamp != 0 if @to_timestamp and @to_timestamp != 0
parameters += "&to=" + @to_timestamp.to_s parameters += "&to=" + @to_timestamp.to_s
end end
if page_index
parameters += "&page=#{page_index}"
end
parameters parameters
end end