1
|
|
|
from __future__ import annotations |
|
|
|
|
2
|
|
|
from dataclasses import dataclass |
3
|
|
|
from typing import Sequence |
4
|
|
|
|
5
|
|
|
from pocketutils.core.query_utils import QueryExecutor |
|
|
|
|
6
|
|
|
|
7
|
|
|
from mandos.model.settings import MANDOS_SETTINGS |
8
|
|
|
|
9
|
|
|
from mandos import logger |
10
|
|
|
|
11
|
|
|
# Selenium is treated as optional: if importing it fails for any reason, every
# Selenium name used by this module falls back to None so the module itself
# can still be imported.
# noinspection PyBroadException
try:
    from selenium import webdriver
    from selenium.webdriver.common.by import By
    from selenium.webdriver.remote.webdriver import WebDriver
    from selenium.webdriver.remote.webelement import WebElement
except Exception:
    webdriver = None
    WebDriver = None
    WebElement = None
    By = None


# Always bind driver_fn, so that code checking ``driver_fn is None`` works
# (instead of hitting a NameError) when Selenium could not be imported.
driver_fn = None
if webdriver is not None:
    try:
        # The setting names an attribute of selenium.webdriver to use as the driver factory.
        driver_fn = getattr(webdriver, MANDOS_SETTINGS.selenium_driver)
    except AttributeError:
        logger.warning(f"Selenium driver {MANDOS_SETTINGS.selenium_driver} not found")
29
|
|
|
|
30
|
|
|
|
31
|
|
|
@dataclass(frozen=True)
class Scraper:
    """
    Thin convenience wrapper around a Selenium web driver.

    Attributes:
        driver: The Selenium driver used to load pages and locate elements.
        executor: A query executor stored alongside the driver; none of the
            methods defined in this class use it.
    """

    driver: WebDriver
    executor: QueryExecutor

    @classmethod
    def create(cls, executor: QueryExecutor) -> Scraper:
        """
        Build a scraper with a freshly started driver.

        Args:
            executor: The query executor to store on the new instance.

        Returns:
            A new instance wrapping the driver returned by ``driver_fn()``.

        Raises:
            ValueError: If no driver factory is available (``driver_fn`` is None).
        """
        if driver_fn is None:
            raise ValueError(f"Selenium driver {MANDOS_SETTINGS.selenium_driver} not found")
        # Use cls rather than the hard-coded class so subclasses get their own type.
        return cls(driver_fn(), executor)

    @staticmethod
    def _locator(by: str) -> str:
        """
        Translate a strategy name into the locator string Selenium expects.

        Accepts either a ``By`` attribute name in any case (``"xpath"``,
        ``"css_selector"``) or a ``By`` value (``"css selector"``).

        Raises:
            ValueError: If ``by`` does not name a string attribute of ``By``.
        """
        # By attribute names are upper-case with underscores, e.g. CSS_SELECTOR.
        key = by.strip().upper().replace(" ", "_")
        strategy = getattr(By, key, None)
        if not isinstance(strategy, str):
            raise ValueError(f"Unknown locator strategy '{by}'")
        return strategy

    def go(self, url: str) -> Scraper:
        """
        Load ``url`` in the driver.

        Returns:
            This instance, so that calls can be chained.
        """
        self.driver.get(url)
        return self

    def find_element(self, thing: str, by: str) -> WebElement:
        """
        Find a single element.

        Args:
            thing: The locator value (for example an XPath expression).
            by: The name of the locator strategy; see ``_locator``.

        Returns:
            Whatever the driver's ``find_element`` returns.
        """
        # Selenium's signature is find_element(by, value): strategy first.
        return self.driver.find_element(self._locator(by), thing)

    def find_elements(self, thing: str, by: str) -> Sequence[WebElement]:
        """
        Find all matching elements.

        Args:
            thing: The locator value (for example a CSS selector).
            by: The name of the locator strategy; see ``_locator``.

        Returns:
            Whatever the driver's ``find_elements`` returns.
        """
        return self.driver.find_elements(self._locator(by), thing)

    def click_element(self, thing: str, by: str) -> None:
        """
        Find a single element and click it.

        Args:
            thing: The locator value.
            by: The name of the locator strategy; see ``_locator``.
        """
        self.find_element(thing, by).click()
59
|
|
|
|
60
|
|
|
|
61
|
|
|
# Names exported by ``from <this module> import *``.
__all__ = [
    "Scraper",
    "By",
]
62
|
|
|
|