1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
|
import logging
import datetime
from contextlib import contextmanager
import re
from selenium import webdriver
from selenium.webdriver.firefox.options import Options
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.by import By
from serenitas.utils.env import DAILY_DIR
from serenitas.analytics.dates import prev_business_day
logger = logging.getLogger(__name__)
def download_report(account_username, password, report_dir, workdate):
    """Log in to the webmail and click the attachment of the message dated *workdate*.

    Args:
        account_username: Login name typed into the webmail login form.
        password: Password typed into the webmail login form.
        report_dir: Directory handed to ``create_driver`` as the browser's
            download directory.
        workdate: Date of the inbox message to open.

    Returns:
        The first whitespace-separated token of the attachment link's text.
    """
    with create_driver(report_dir) as browser:
        login(browser, account_username, password)
        navigate_to_msg(browser, workdate)
        link = get_attachment_element(browser)
        # NOTE(review): implicitly_wait only configures the element-lookup
        # timeout; it does not pause until the download has finished. Confirm
        # the file is fully written before the driver is shut down.
        browser.implicitly_wait(3)
        link.click()
        # The link text is read after the click, while the browser is still open.
        return link.text.split()[0]
def login(driver, account_username, password):
    """Open the webmail home page and submit the login form.

    Args:
        driver: Selenium WebDriver used to drive the browser.
        account_username: Value typed into the element with id ``username``.
        password: Value typed into the element with id ``passwordid``.
    """
    driver.get("https://web1.mail.scotiabank.com/webmail/do/Home")
    waiter = WebDriverWait(driver, 10)

    # Fill the fields in order, each as soon as it is present in the DOM.
    form_values = (("username", account_username), ("passwordid", password))
    for field_id, value in form_values:
        field = waiter.until(EC.presence_of_element_located((By.ID, field_id)))
        field.send_keys(value)

    driver.find_element(By.ID, "loginbutton").click()
def navigate_to_msg(driver, workdate):
    """Open the inbox and click the first message whose date equals *workdate*.

    Args:
        driver: Selenium WebDriver with an authenticated webmail session.
        workdate: ``datetime.date`` compared against the date found in each
            message row's text.

    Raises:
        ValueError: If no message row carries a date equal to *workdate*.
    """
    driver.get(
        "https://web1.mail.scotiabank.com/webmail/do/FolderDisplay?paths=INBOX&path=INBOX"
    )
    wait = WebDriverWait(driver, 10)
    wait.until(EC.presence_of_element_located((By.CLASS_NAME, "zfolder-msg")))
    for msg in driver.find_elements(By.CLASS_NAME, "zfolder-msg"):
        match = re.search(r"\d{4}-\d{2}-\d{2}|\d{1,2}/\d{1,2}/\d{4}", msg.text)
        if match is None:
            # Row shows no recognizable date; it cannot be the one we want.
            continue
        try:
            msg_date = datetime.datetime.strptime(match.group(), "%Y-%m-%d").date()
        except ValueError:
            # The pattern also matches slash-separated dates, which this format
            # cannot parse. Skip the row instead of aborting the whole scan.
            # NOTE(review): the day/month order of slash dates is not known
            # here, so they are deliberately not guessed at - confirm and add
            # the matching format if such rows must be supported.
            continue
        if msg_date == workdate:
            msg.click()
            return
    raise ValueError(f"Could not find a file for this date {workdate}")
def get_attachment_element(driver):
    """Return the attachment link element of the currently opened message.

    Waits up to 10 seconds for an element with class
    ``zmessage-attachment-link`` to be present.

    Args:
        driver: Selenium WebDriver showing the opened message.

    Returns:
        The element located by the wait.
    """
    wait = WebDriverWait(driver, 10)
    # wait.until() returns the located element, so no second lookup is needed.
    return wait.until(
        EC.presence_of_element_located((By.CLASS_NAME, "zmessage-attachment-link"))
    )
@contextmanager
def create_driver(download_dir):
    """Yield a headless Firefox driver that saves downloads into *download_dir*.

    The driver is always shut down when the ``with`` block exits, including
    when the block raises.

    Args:
        download_dir: Directory set as the browser's download location
            (converted with ``str``).

    Yields:
        The configured ``webdriver.Firefox`` instance.
    """
    options = Options()
    options.add_argument("--headless")

    profile = webdriver.FirefoxProfile()
    profile.set_preference("browser.download.dir", str(download_dir))
    # folderList=2 tells Firefox to use the custom directory set above.
    profile.set_preference("browser.download.folderList", 2)
    # Save this MIME type straight to disk without showing a download dialog.
    profile.set_preference(
        "browser.helperApps.neverAsk.saveToDisk", "application/octet-stream"
    )

    # NOTE(review): the firefox_profile and service_log_path keyword arguments
    # appear to be deprecated in Selenium 4 - confirm against the pinned version.
    driver = webdriver.Firefox(
        firefox_profile=profile,
        options=options,
        service_log_path="/home/serenitas/CorpCDOs/logs/selenium_scotia.log",
    )
    try:
        yield driver
    finally:
        # Without the finally, an exception in the with-body would skip quit()
        # and leave the browser process running.
        driver.quit()
def download_scotia_report(workdate):
    """Make sure the Scotia report for *workdate* is in the report directory.

    Looks in ``DAILY_DIR / "Selene" / "Scotia_reports"`` for a file whose name
    carries the previous business day of *workdate*. If none is found, the
    report is fetched with ``download_report``.

    Args:
        workdate: Date passed to ``prev_business_day`` for the file-name check
            and to ``download_report`` for the message lookup.
    """
    # NOTE(review): credentials are hard-coded in source; consider loading them
    # from a secret store or the environment instead.
    credentials = ("selene-ops@lmcg.com", "oeujG*UF!53o")
    REPORT_DIR = DAILY_DIR / "Selene" / "Scotia_reports"
    pattern = f"IsoSelene_{prev_business_day(workdate):%d-%b-%Y}_*_xlsx.JOAAPKO3.JOAAPKO1"
    try:
        fname = next(REPORT_DIR.glob(pattern))
    except StopIteration:
        # No matching file on disk yet: download it.
        fname = download_report(*credentials, REPORT_DIR, workdate)
        logger.info(f"Downloaded Scotia Report for {workdate}: {fname}")
    else:
        logger.info(f"{fname} already exists in {REPORT_DIR}")
|