mirror of
https://github.com/quatalog/quatalog.git
synced 2024-11-15 19:42:44 +00:00
Fix issue where only 1 page per school would get scraped properly
This commit is contained in:
parent
5ea6816c90
commit
baa74b8ee6
|
@@ -126,6 +126,10 @@ def main():
|
||||||
|
|
||||||
user_agent = UserAgent().random
|
user_agent = UserAgent().random
|
||||||
options.set_preference("general.useragent.override", user_agent)
|
options.set_preference("general.useragent.override", user_agent)
|
||||||
|
# options.set_preference("network.proxy.socks", )
|
||||||
|
# options.set_preference("network.proxy.socks_port", )
|
||||||
|
# options.set_preference("network.proxy.socks_remote_dns", True)
|
||||||
|
# options.set_preference("network.proxy.type", 1)
|
||||||
print(f"Using randomized user agent {user_agent}", file=sys.stderr)
|
print(f"Using randomized user agent {user_agent}", file=sys.stderr)
|
||||||
|
|
||||||
driver = webdriver.Firefox(options=options)
|
driver = webdriver.Firefox(options=options)
|
||||||
|
@@ -211,7 +215,7 @@ def main():
|
||||||
try:
|
try:
|
||||||
course_pages_len = int(
|
course_pages_len = int(
|
||||||
driver.find_element(
|
driver.find_element(
|
||||||
"id", "lblInstWithEQPaginationInfo"
|
"id", "lblCourseEQPaginationInfo"
|
||||||
).text.split()[-1]
|
).text.split()[-1]
|
||||||
)
|
)
|
||||||
except NoSuchElementException:
|
except NoSuchElementException:
|
||||||
|
|
Loading…
Reference in a new issue