-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbrowser_class.py
40 lines (30 loc) · 1.05 KB
/
browser_class.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
import mechanicalsoup
from selenium import webdriver
from selenium.webdriver.chrome.options import Options
import validators
class Browser(object):
"""docstring for Browser"""
def __init__(self):
self.browser = mechanicalsoup.StatefulBrowser()
self.current_url = None
self._BASE_URL = 'https://bbc.co.uk'
def get_page(self, url):
self.browser.open(url)
self.current_url = url
return self.browser.get_current_page()
def get_url(self):
return self.current_url
class JSBrowser(object):
def __init__(self):
options = Options()
options.add_argument('--headless')
options.add_argument('--no-sandbox')
options.add_argument("--disable-setuid-sandbox")
self.driver = webdriver.Chrome(options=options)
def get_page(self, url):
if validators.url(url):
self.driver.get(url)
html = self.driver.execute_script("return document.body.innerHTML")
return html
def get_curr_url(self):
return self.driver.current_url