-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdriver_instance.py
66 lines (57 loc) · 1.9 KB
/
driver_instance.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
import time

from selenium import webdriver
from selenium.webdriver import ChromeOptions
from selenium.webdriver.common.by import By
class DriverInstance:
    """Own a Selenium Chrome driver and expose helpers to scrape web pages.

    Args:
        logger: Logger-like object; its ``info`` and ``error`` methods are
            called with a single message string.
        is_headless: Run Chrome in headless mode.
        debug: When true, additionally log every loaded link and print the
            values scraped by ``get_topics`` / ``get_stats``.
    """

    # Seconds ``get_topics`` sleeps before querying the DOM. This is a fixed
    # delay, not a readiness check; override on a subclass/instance to tune.
    PAGE_LOAD_WAIT = 2

    # CSS class of the elements whose innerHTML ``get_topics`` collects.
    TOPIC_CLASS_NAME = "tag__2PqS"

    # Absolute XPath of the container holding the two vote buttons. It is tied
    # to the exact page layout, so any markup change on the site breaks it.
    _VOTE_BUTTONS_XPATH = (
        '//*[@id="app"]/div/div[2]/div[1]/div/div[1]/div/div[1]'
        '/div[1]/div/div[2]/div/div[1]/div[2]'
    )
    UPVOTE_XPATH = _VOTE_BUTTONS_XPATH + '/button[1]/span'
    DOWNVOTE_XPATH = _VOTE_BUTTONS_XPATH + '/button[2]/span'

    def __init__(
        self,
        logger,
        is_headless=True,
        debug=False,
    ):
        self.logger = logger
        self.is_headless = is_headless
        self.debug = debug
        # 1-based ordinal of the next page load; only used in log output.
        self.count = 1
        self.logger.info('Creating a DriverInstance...')
        self.create_driver()

    def create_driver(self):
        """Create the Chrome driver and store it on ``self.driver``."""
        chrome_options = ChromeOptions()
        if self.is_headless:
            chrome_options.add_argument('--headless')  # headless mode
        # ``options=`` is the supported keyword; the older ``chrome_options=``
        # spelling is deprecated and rejected by recent Selenium releases.
        self.driver = webdriver.Chrome(options=chrome_options)

    def load_site(self, link):
        """Navigate the driver to ``link`` and bump the page counter.

        Args:
            link: URL passed unchanged to ``driver.get``.
        """
        out = 'Loading page #{}'.format(self.count)
        self.logger.info(out)
        if self.debug:
            self.logger.info(link)
        self.driver.get(link)
        self.count += 1

    def close_window(self):
        """Call ``close()`` on the underlying driver."""
        self.driver.close()

    def get_topics(self):
        """Collect the innerHTML of every ``TOPIC_CLASS_NAME`` element.

        Best effort: if the lookup fails, the error is logged and whatever was
        collected so far (possibly an empty list) is returned instead of
        raising.

        Returns:
            list: innerHTML strings, in document order.
        """
        topics = []
        try:
            time.sleep(self.PAGE_LOAD_WAIT)  # wait for page to load
            elements = self.driver.find_elements(
                By.CLASS_NAME, self.TOPIC_CLASS_NAME
            )
            # Append one at a time so a failure midway keeps earlier results.
            for element in elements:
                topics.append(element.get_attribute("innerHTML"))
        except Exception:
            # Deliberately not a bare ``except``: Ctrl-C / SystemExit during
            # the sleep must still be able to stop the program.
            self.logger.error('An error occured while looking for topics')
        if self.debug:
            print(topics)
        return topics

    def _inner_html(self, xpath):
        """Return the innerHTML of the single element located by ``xpath``."""
        return self.driver.find_element(By.XPATH, xpath).get_attribute(
            "innerHTML"
        )

    def get_stats(self):
        """Read the upvote and downvote counters from the current page.

        Returns:
            tuple: ``(upvote, downvote)`` as the raw innerHTML strings.

        Raises:
            Whatever the driver raises when either element cannot be located;
            unlike ``get_topics`` this method does not swallow errors.
        """
        upvote = self._inner_html(self.UPVOTE_XPATH)
        downvote = self._inner_html(self.DOWNVOTE_XPATH)
        if self.debug:
            print(upvote, downvote)
        return upvote, downvote

    def run_automation(self, link=None):
        """Log the start of a run and load ``link``.

        NOTE(review): the original body was unfinished -- it called
        ``load_site()`` without its required argument and ended in a dangling
        ``self.load`` expression. Only the page load is implemented here; any
        further steps still need to be written.

        Args:
            link: URL to load. Optional only so that existing zero-argument
                callers keep getting the ``TypeError`` they got before.

        Raises:
            TypeError: If no ``link`` is supplied.
        """
        self.logger.info("Running automation...")
        if link is None:
            raise TypeError(
                "run_automation() requires a 'link' to load"
            )
        self.load_site(link)