clemfromspace/scrapy-puppeteer

View on GitHub
scrapy_puppeteer/http.py

Summary

Maintainability
A
50 mins
Test Coverage
F
0%
"""This module contains the ``SeleniumRequest`` class"""

from scrapy import Request


class PuppeteerRequest(Request):
    """Scrapy ``Request`` subclass providing additional arguments"""

    def __init__(self, url, callback=None, screenshot=False, wait_until=None, wait_for=None, *args, **kwargs):
        """Initialize a new Puppeteer request

        Parameters
        ----------
        wait_until: basestring
            One of "load", "domcontentloaded", "networkidle0", "networkidle2".
            See https://miyakogi.github.io/pyppeteer/reference.html#pyppeteer.page.Page.goto
        screenshot: bool
            If True, a screenshot of the page will be taken and the data of the screenshot
            will be returned in the response "meta" attribute.

        """

        self.wait_until = wait_until or 'domcontentloaded'
        self.wait_for = wait_for
        self.screenshot = screenshot

        super().__init__(url, callback, *args, **kwargs)