t
Size: a a a
OS
OS
t
OS
OS
A
class MyParser(scrapy.Spider):
    """Scrapy spider that owns a Firefox browser session for its lifetime.

    The browser is created in ``__init__`` and shut down in ``closed``.
    The ``seleniumwire_options`` keyword passed to ``webdriver.Firefox``
    suggests ``webdriver`` is Selenium Wire's drop-in module
    (``from seleniumwire import webdriver``) -- confirm against the file's
    imports.
    """

    name = "myparser"
    start_urls = ['https://site.net/', 'https://site1.net/', 'https://site2.net/']

    def __init__(self, *args, **kwargs):
        """Initialise the spider and start the Firefox driver.

        Args:
            *args: Forwarded unchanged to ``scrapy.Spider.__init__``.
            **kwargs: Forwarded unchanged to ``scrapy.Spider.__init__``
                (this is how ``-a key=value`` spider arguments arrive).
        """
        # Scrapy builds spiders via ``cls(*args, **kwargs)``; without
        # forwarding these the base class never runs its own setup.
        super().__init__(*args, **kwargs)

        self.profile = webdriver.FirefoxProfile()
        self.profile.set_preference("intl.accept_languages", "ua_RU")
        # False here leaves Firefox's "block popups during load" switched off.
        self.profile.set_preference("dom.disable_open_during_load", False)
        #self.profile.set_preference("general.useragent.override", "[Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Safari/537.36]")

        # NOTE(review): these options are created but never handed to the
        # driver below; pass ``options=self.fireFoxOptions`` if they are
        # meant to take effect (e.g. for headless mode).
        self.fireFoxOptions = webdriver.FirefoxOptions()
        # self.fireFoxOptions.set_headless()

        # Previously ``self.options`` was read without ever being assigned,
        # which raised AttributeError. An empty dict is the neutral value for
        # Selenium Wire options; add proxy/capture settings here as needed.
        self.options = {}

        self.driver = webdriver.Firefox(
            firefox_profile=self.profile,
            seleniumwire_options=self.options,
        )

    def closed(self, reason):
        """Quit the browser when Scrapy closes the spider.

        Args:
            reason: Close reason supplied by Scrapy (unused).
        """
        # Without this the Firefox process outlives the crawl.
        self.driver.quit()

    def parse(self, response):
        """Handle a downloaded response; intentionally a no-op for now."""
        pass
OS
class MyParser(scrapy.Spider):
    """Scrapy spider that owns a Firefox browser session for its lifetime.

    The browser is created in ``__init__`` and shut down in ``closed``.
    The ``seleniumwire_options`` keyword passed to ``webdriver.Firefox``
    suggests ``webdriver`` is Selenium Wire's drop-in module
    (``from seleniumwire import webdriver``) -- confirm against the file's
    imports.
    """

    name = "myparser"
    start_urls = ['https://site.net/', 'https://site1.net/', 'https://site2.net/']

    def __init__(self, *args, **kwargs):
        """Initialise the spider and start the Firefox driver.

        Args:
            *args: Forwarded unchanged to ``scrapy.Spider.__init__``.
            **kwargs: Forwarded unchanged to ``scrapy.Spider.__init__``
                (this is how ``-a key=value`` spider arguments arrive).
        """
        # Scrapy builds spiders via ``cls(*args, **kwargs)``; without
        # forwarding these the base class never runs its own setup.
        super().__init__(*args, **kwargs)

        self.profile = webdriver.FirefoxProfile()
        self.profile.set_preference("intl.accept_languages", "ua_RU")
        # False here leaves Firefox's "block popups during load" switched off.
        self.profile.set_preference("dom.disable_open_during_load", False)
        #self.profile.set_preference("general.useragent.override", "[Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Safari/537.36]")

        # NOTE(review): these options are created but never handed to the
        # driver below; pass ``options=self.fireFoxOptions`` if they are
        # meant to take effect (e.g. for headless mode).
        self.fireFoxOptions = webdriver.FirefoxOptions()
        # self.fireFoxOptions.set_headless()

        # Previously ``self.options`` was read without ever being assigned,
        # which raised AttributeError. An empty dict is the neutral value for
        # Selenium Wire options; add proxy/capture settings here as needed.
        self.options = {}

        self.driver = webdriver.Firefox(
            firefox_profile=self.profile,
            seleniumwire_options=self.options,
        )

    def closed(self, reason):
        """Quit the browser when Scrapy closes the spider.

        Args:
            reason: Close reason supplied by Scrapy (unused).
        """
        # Without this the Firefox process outlives the crawl.
        self.driver.quit()

    def parse(self, response):
        """Handle a downloaded response; intentionally a no-op for now."""
        pass
AR
A
# Scrapy throttling settings for this project.

# Upper bound on requests the downloader performs at the same time, across
# all sites.
CONCURRENT_REQUESTS = 5
# Configure a delay for requests for the same website (default: 0)
# See https://docs.scrapy.org/en/latest/topics/settings.html#download-delay
# See also autothrottle settings and docs
# Value is in seconds, per the Scrapy settings reference linked above.
DOWNLOAD_DELAY = 3
# The download delay setting will honor only one of:
# NOTE(review): both limits are set here. Per the Scrapy settings reference,
# a non-zero CONCURRENT_REQUESTS_PER_IP takes precedence and the per-domain
# value is ignored -- confirm which limit is actually intended and drop the
# other.
CONCURRENT_REQUESTS_PER_DOMAIN = 3
CONCURRENT_REQUESTS_PER_IP = 1
A
AR
AR