webgalen/lib/webgalien/actors/screenshot_actor.rb

106 lines
2.8 KiB
Ruby

# User-Agent string (desktop Safari 9.1.2 on OS X 10.11.6) handed to the
# browser through its --user-agent switch.
USER_AGENT = [
  'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6)',
  'AppleWebKit/601.7.7 (KHTML, like Gecko) Version/9.1.2 Safari/601.7.7'
].join(' ').freeze
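# The driver is configured to run in headless mode in
# ScreenshotActor#initialize_selenium_driver.
# Selenium's log verbosity can be adjusted here if needed, e.g.:
# Selenium::WebDriver.logger.level = :info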
module Webgalien
  # Celluloid actor that opens a URL in headless Chrome, grows the browser
  # window to the height of the page's <body> and saves a PNG screenshot.
  class ScreenshotActor
    include Celluloid

    # Window width (px) used for every capture.
    WINDOW_WIDTH = 1440
    # Window height (px) used for the first load, before the body height is known.
    INITIAL_WINDOW_HEIGHT = 900
    # The DOM counts as stable once MORE than this many consecutive polls
    # returned an unchanged body innerHTML.
    DOM_STABLE_POLLS = 15
    # Upper bound (seconds) for a single DOM-stability wait.
    DOM_STABILITY_TIMEOUT = 120
    # Read/open timeout (seconds) of the HTTP client talking to the driver.
    HTTP_TIMEOUT = 120

    # @param output_path [String] directory the screenshots are written to;
    #   it is created on demand before each capture.
    def initialize(output_path)
      @output_path = output_path
    end

    # Takes a screenshot of the page named by the work item's `input[:url]`.
    #
    # The browser is always shut down, including when the future, the page
    # load or a stability wait raises, so failed jobs do not leave driver
    # processes behind.
    #
    # @param future_work [#value] future resolving to a work item that
    #   responds to `shift!`, `id`, `input` and `output=`
    # @return [Object] the same work item, with `output` set to
    #   `{ bbox: {w:, h:, x:, y:}, path: <png path> }`
    def perform(future_work)
      # The driver is started before the future is resolved, as in the
      # original flow; the ensure below covers everything after that.
      driver = initialize_selenium_driver
      begin
        work = future_work.value
        # NOTE(review): presumably advances the work item to its next
        # stage; shift! is defined outside this file, so confirm.
        work.shift!
        capture_page(driver, work)
        work
      ensure
        driver.quit
      end
    end

    private

    # Loads the page, resizes the window to the body height, saves the
    # screenshot and stores the result on the work item.
    def capture_page(driver, work)
      url = work.input[:url]

      driver.manage.window.resize_to(WINDOW_WIDTH, INITIAL_WINDOW_HEIGHT)
      report(work, "loading page #{url}")
      driver.navigate.to url
      report(work, 'waiting DOM stability')
      wait_dom_stability(driver)

      # One extra pixel is added to the measured body height.
      # NOTE(review): presumably guards against rounding; confirm.
      height = driver.find_element(:css, 'body').size.height.to_i + 1
      report(work, "resizing to #{WINDOW_WIDTH}x#{height}")
      driver.manage.window.resize_to(WINDOW_WIDTH, height)
      report(work, 'waiting DOM stability')
      wait_dom_stability(driver)

      report(work, 'getting page dimensions')
      bbox = body_bbox(driver)

      tmp_path = File.join(@output_path, "capture-#{work.id}.png")
      report(work, "saving page to #{tmp_path}")
      FileUtils.mkdir_p(@output_path)
      driver.save_screenshot tmp_path

      work.output = {
        bbox: bbox,
        path: tmp_path
      }
    end

    # Returns the bounding box of the <body> element as integers.
    # `y` is deliberately pinned to 0 rather than the element's reported y.
    def body_bbox(driver)
      body = driver.find_element(:css, 'body')
      location = body.location
      size = body.size
      {
        w: size.width.to_i,
        h: size.height.to_i,
        x: location.x.to_i,
        y: 0 # location.y.to_i
      }
    end

    # Prints a progress line prefixed with the work item's id.
    def report(work, message)
      puts "(#{work.id}) #{message}"
    end

    # Builds a headless Chrome driver with the custom user agent and
    # extended HTTP client timeouts.
    def initialize_selenium_driver
      client = Selenium::WebDriver::Remote::Http::Default.new
      client.read_timeout = HTTP_TIMEOUT
      client.open_timeout = HTTP_TIMEOUT

      options = Selenium::WebDriver::Chrome::Options.new
      options.add_argument('--headless')
      options.add_argument('--disable-gpu')
      options.add_argument('--dns-prefetch-disable')
      options.add_argument("--user-agent=#{USER_AGENT}")

      Selenium::WebDriver.for(
        :chrome,
        options: options,
        http_client: client
      )
    end

    # Blocks until the body's innerHTML has been identical for more than
    # DOM_STABLE_POLLS consecutive polls. Any change resets the counter.
    # The wait itself is bounded by DOM_STABILITY_TIMEOUT seconds.
    def wait_dom_stability(driver)
      previous_dom = nil
      stable_polls = 0
      poller = Selenium::WebDriver::Wait.new(timeout: DOM_STABILITY_TIMEOUT)
      poller.until do
        current_dom = driver.find_element(:css, 'body').attribute('innerHTML')
        stable_polls = current_dom == previous_dom ? stable_polls + 1 : 0
        previous_dom = current_dom
        stable_polls > DOM_STABLE_POLLS
      end
    end
  end
end