Files
btgo-playwright/btgo_scraper.py
Marius Mutu 0fff07c55b Rescrie complet fluxul de descarcare tranzactii pentru noul UI BT George
Modificari principale:
- Noul flux download: expand -> tranzactii -> CSV -> Genereaza -> download
- Detectie inteligenta buton Tranzactii (evita butonul Delete)
- Verificare daca primul cont e deja expandat inainte de click
- Selectie conturi cu 6 strategii fallback + debug logging
- Handler pentru cookie consent "Accept toate" si "Am inteles"
- Screenshot automat la erori de selectie cont

Documentatie:
- README: sectiuni noi pentru inregistrare Playwright si testare manuala
- CLAUDE.md: selectori actualizati pentru noul UI

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2025-12-09 15:18:44 +02:00

1072 lines
43 KiB
Python

"""
BTGO Scraper - Automatizare citire solduri conturi bancare
Folosește Playwright pentru automatizare browser
"""
from playwright.sync_api import sync_playwright, TimeoutError as PlaywrightTimeout
import logging
import csv
import json
import time
import os
from datetime import datetime
from pathlib import Path
from config import Config
class BTGoScraper:
"""Scraper pentru extragerea soldurilor de pe btgo.ro"""
def __init__(self):
"""Initializare scraper cu logging si configurare"""
self.config = Config()
Config.validate()
self._setup_logging()
self._ensure_directories()
self.page = None
self.login_page = None # Pagina de login (popup)
# Setup pentru progress updates prin Telegram (optional)
self.telegram_chat_id = os.getenv('TELEGRAM_CHAT_ID')
self.telegram_message_id = os.getenv('TELEGRAM_MESSAGE_ID')
self.progress_notifier = None
logging.info(f"Environment: TELEGRAM_CHAT_ID={self.telegram_chat_id}, TELEGRAM_MESSAGE_ID={self.telegram_message_id}")
# Inițializează notifier pentru progress updates dacă avem chat_id
if self.telegram_chat_id and self.telegram_message_id:
try:
from notifications import TelegramNotifier
self.progress_notifier = TelegramNotifier(self.config)
logging.info(f"Progress updates activate pentru chat_id={self.telegram_chat_id}, message_id={self.telegram_message_id}")
except Exception as e:
logging.warning(f"Nu am putut inițializa progress notifier: {e}")
else:
logging.warning("Progress updates dezactivate - lipsesc TELEGRAM_CHAT_ID sau TELEGRAM_MESSAGE_ID")
def _setup_logging(self):
"""Configurare logging in consola si fisier zilnic"""
# Creaza director logs daca nu exista
Path(self.config.LOG_DIR).mkdir(exist_ok=True)
# Nume fisier cu data curenta
log_file = Path(self.config.LOG_DIR) / f"scraper_{datetime.now().strftime('%Y-%m-%d')}.log"
# Format log
log_format = '[%(asctime)s] [%(levelname)s] %(message)s'
date_format = '%Y-%m-%d %H:%M:%S'
# Configurare logging
logging.basicConfig(
level=getattr(logging, self.config.LOG_LEVEL),
format=log_format,
datefmt=date_format,
handlers=[
logging.StreamHandler(), # Console
logging.FileHandler(log_file, encoding='utf-8') # Fisier
]
)
logging.info(f"Logging initializat: {log_file}")
def _ensure_directories(self):
"""Creaza directoarele data/ si logs/ daca nu exista"""
Path(self.config.OUTPUT_DIR).mkdir(exist_ok=True)
Path(self.config.LOG_DIR).mkdir(exist_ok=True)
logging.info(f"Directoare verificate: {self.config.OUTPUT_DIR}, {self.config.LOG_DIR}")
def _update_progress(self, message: str):
"""
Trimite update de progres către Telegram (editează mesajul inițial)
Args:
message: Mesajul de progres
"""
if self.progress_notifier and self.telegram_chat_id and self.telegram_message_id:
full_message = f"*{message}*"
self.progress_notifier._edit_message(
self.telegram_chat_id,
self.telegram_message_id,
full_message
)
logging.info(f"Progress update: {message}")
def _dismiss_gdpr_cookies(self, page):
"""
Inchide GDPR cookie banner daca este vizibil
Args:
page: Pagina Playwright pe care sa verifice
"""
try:
# Strategii pentru cookie consent (in ordinea probabilitatii)
cookie_strategies = [
# 1. Noul buton BT (2024+)
("role", "button", "Accept toate"),
("role", "button", "Accepta toate"),
# 2. Vechiul GDPR wrapper
("css", ".gdprcookie-wrapper button:has-text('Accept')"),
("css", ".gdprcookie-wrapper button:has-text('Sunt de acord')"),
("css", ".gdprcookie-wrapper button"),
# 3. Fallback generic
("role", "button", "Accept"),
("role", "button", "Accepta"),
("role", "button", "OK"),
]
for strategy in cookie_strategies:
try:
if strategy[0] == "role":
btn = page.get_by_role(strategy[1], name=strategy[2])
else:
btn = page.locator(strategy[2]).first
if btn.is_visible(timeout=2000):
btn.click()
logging.info(f" [OK] Cookies acceptate ({strategy})")
time.sleep(1)
return True
except:
continue
logging.info(" Nu exista cookie banner (sau deja acceptat)")
return False
except:
logging.info(" Nu exista cookie banner (sau deja acceptat)")
return False
def _dismiss_one_time_consent(self, page):
"""
Inchide dialoguri one-time (ex: 'Am inteles') daca apar
Args:
page: Pagina Playwright pe care sa verifice
"""
consent_buttons = [
("text", "Am înțeles"),
("text", "Am inteles"),
("role", "button", "Am înțeles"),
("role", "button", "OK"),
("role", "button", "Continua"),
]
for strategy in consent_buttons:
try:
if strategy[0] == "text":
btn = page.get_by_text(strategy[1], exact=True)
elif strategy[0] == "role":
btn = page.get_by_role(strategy[1], name=strategy[2])
if btn.is_visible(timeout=2000):
btn.click()
logging.info(f" [OK] Consent inchis ({strategy})")
time.sleep(1)
return True
except:
continue
return False
def _find_username_field(self, page):
"""
Detecteaza inteligent campul de username folosind multiple strategii.
Ordinea: selectori specifici -> selectori generici -> detectie structurala
Returns:
Locator daca gasit, None altfel
"""
strategies = [
# 1. Selectori specifici BT (pot sa se schimbe)
("placeholder_exact", "ID logare"),
("placeholder_exact", "ID de logare"),
("id", "user"),
("name", "user"),
# 2. Selectori generici (mai stabili)
("placeholder_contains", "logare"),
("placeholder_contains", "user"),
("placeholder_contains", "utilizator"),
("name_contains", "user"),
("name_contains", "login"),
("id_contains", "user"),
("id_contains", "login"),
# 3. Selectori structurali (foarte stabili)
("css", "form input[type='text']:not([type='hidden'])"),
("css", "form input:not([type='password']):not([type='hidden']):not([type='submit'])"),
("css", "input[type='text']"),
("css", ".form-control[type='text']"),
# 4. Fallback - primul input vizibil care nu e password/submit
("first_text_input", None),
]
for strategy_type, value in strategies:
try:
field = self._try_field_strategy(page, strategy_type, value)
if field and field.is_visible(timeout=1000):
logging.info(f" [USERNAME] Gasit cu strategia: {strategy_type}='{value}'")
return field
except Exception:
continue
logging.error(" [USERNAME] Nu am gasit campul cu nicio strategie!")
return None
def _find_password_field(self, page):
"""
Detecteaza inteligent campul de parola.
Campul password e foarte stabil - type='password' e standard HTML.
Returns:
Locator daca gasit, None altfel
"""
strategies = [
# 1. Cel mai stabil - type='password' (standard HTML)
("css", "input[type='password']"),
# 2. Selectori specifici BT
("id", "password"),
("name", "password"),
("name", "pass"),
("placeholder_exact", "Parola"),
("placeholder_exact", "Password"),
# 3. Selectori generici
("placeholder_contains", "parola"),
("placeholder_contains", "password"),
("name_contains", "pass"),
("id_contains", "pass"),
# 4. Fallback structural
("css", "form input[type='password']"),
("css", ".form-control[type='password']"),
]
for strategy_type, value in strategies:
try:
field = self._try_field_strategy(page, strategy_type, value)
if field and field.is_visible(timeout=1000):
logging.info(f" [PASSWORD] Gasit cu strategia: {strategy_type}='{value}'")
return field
except Exception:
continue
logging.error(" [PASSWORD] Nu am gasit campul cu nicio strategie!")
return None
def _find_submit_button(self, page):
"""
Detecteaza inteligent butonul de submit.
Returns:
Locator daca gasit, None altfel
"""
strategies = [
# 1. Selectori specifici BT
("css", "input[value='Autentifică-te']"),
("css", "button:has-text('Autentifică-te')"),
("css", "input[value*='Autentific']"),
# 2. Selectori generici pentru login buttons
("css", "input[type='submit']"),
("css", "button[type='submit']"),
("css", "form button.btn-primary"),
("css", "form input.btn-primary"),
# 3. Text-based (mai putin stabil dar functional)
("text_contains", "Login"),
("text_contains", "Conectare"),
("text_contains", "Autentificare"),
("text_contains", "Intra"),
("text_contains", "Submit"),
# 4. Fallback - orice buton din form
("css", "form button"),
("css", "form input[type='button']"),
("css", ".btn-primary"),
]
for strategy_type, value in strategies:
try:
button = self._try_button_strategy(page, strategy_type, value)
if button and button.is_visible(timeout=1000):
logging.info(f" [SUBMIT] Gasit cu strategia: {strategy_type}='{value}'")
return button
except Exception:
continue
logging.error(" [SUBMIT] Nu am gasit butonul cu nicio strategie!")
return None
def _try_field_strategy(self, page, strategy_type, value):
"""Helper pentru a incerca o strategie de gasire a unui camp"""
if strategy_type == "placeholder_exact":
return page.get_by_placeholder(value, exact=True)
elif strategy_type == "placeholder_contains":
return page.locator(f"input[placeholder*='{value}' i]").first
elif strategy_type == "id":
return page.locator(f"#{value}")
elif strategy_type == "id_contains":
return page.locator(f"input[id*='{value}' i]").first
elif strategy_type == "name":
return page.locator(f"input[name='{value}']")
elif strategy_type == "name_contains":
return page.locator(f"input[name*='{value}' i]").first
elif strategy_type == "css":
return page.locator(value).first
elif strategy_type == "label":
return page.get_by_label(value)
elif strategy_type == "first_text_input":
# Gaseste primul input care nu e password, hidden sau submit
inputs = page.locator("input:visible").all()
for inp in inputs:
try:
inp_type = inp.get_attribute("type", timeout=500) or "text"
if inp_type.lower() not in ["password", "hidden", "submit", "button", "checkbox", "radio"]:
return inp
except:
continue
return None
def _try_button_strategy(self, page, strategy_type, value):
"""Helper pentru a incerca o strategie de gasire a butonului"""
if strategy_type == "css":
return page.locator(value).first
elif strategy_type == "text_contains":
return page.locator(f"button:has-text('{value}'), input[value*='{value}' i]").first
elif strategy_type == "role":
return page.get_by_role("button", name=value)
return None
def run(self):
"""Entry point principal - orchestreaza tot flow-ul"""
try:
# Check dacă rulăm în mod balances_only
balances_only = os.getenv('BALANCES_ONLY', 'false').lower() == 'true'
logging.info("=" * 60)
if balances_only:
logging.info("Start BTGO Scraper (DOAR SOLDURI)")
else:
logging.info("Start BTGO Scraper")
logging.info("=" * 60)
with sync_playwright() as p:
# Lansare browser
browser = p.chromium.launch(
headless=self.config.HEADLESS,
slow_mo=100 if not self.config.HEADLESS else 0 # Slow motion pentru debugging
)
# Creaza pagina cu viewport standard
self.page = browser.new_page(viewport={'width': 1920, 'height': 1080})
logging.info(f"Browser lansat (headless={self.config.HEADLESS})")
# Flow complet
self.login()
self.handle_2fa_wait()
self._update_progress("2FA aprobat! Incarc conturi...")
accounts = self.read_accounts()
csv_path, json_path = self.save_results(accounts)
# Descarcă tranzacții pentru toate conturile (doar dacă nu e balances_only)
downloaded_files = []
if balances_only:
logging.info("Mod DOAR SOLDURI - skip download tranzactii")
elif self.config.DOWNLOAD_TRANSACTIONS:
downloaded_files = self.download_transactions(accounts)
else:
logging.info("Download tranzacții dezactivat (DOWNLOAD_TRANSACTIONS=false)")
# Screenshot final de confirmare
screenshot_path = Path(self.config.OUTPUT_DIR) / f"dashboard_{datetime.now().strftime('%Y-%m-%d_%H-%M-%S')}.png"
self.page.screenshot(path=str(screenshot_path))
logging.info(f"Screenshot final salvat: {screenshot_path}")
# Trimite notificări (email, Discord)
if self.config.ENABLE_NOTIFICATIONS:
self.send_notifications(csv_path, downloaded_files, accounts)
# Afișează rezumat final
logging.info("=" * 60)
logging.info("REZUMAT FINAL")
logging.info("=" * 60)
logging.info(f"Conturi citite: {len(accounts)}")
if self.config.DOWNLOAD_TRANSACTIONS:
logging.info(f"Tranzacții descărcate: {len(downloaded_files)}")
for df in downloaded_files:
logging.info(f" - {df['cont']}: {df['fisier']}")
logging.info("=" * 60)
browser.close()
# Nu mai trimitem update progress aici - mesajul final cu soldurile a fost deja editat de notifications.py
logging.info("=" * 60)
logging.info("✓ Scraper finalizat cu succes!")
logging.info("=" * 60)
return True
except Exception as e:
self._handle_error(e)
return False
def login(self):
"""Autentificare cu username si password"""
self._update_progress("Deschid pagina de login...")
logging.info("Navigare catre https://go.bancatransilvania.ro/")
self.page.goto('https://go.bancatransilvania.ro/', wait_until='networkidle')
logging.info("Pagina incarcata")
try:
# Cookie consent - asteapta si accepta (GDPR wrapper)
logging.info("Verificare GDPR cookie banner...")
self._dismiss_gdpr_cookies(self.page)
# Click pe butonul LOGIN - deschide popup
logging.info("Click pe butonul LOGIN...")
with self.page.expect_popup() as popup_info:
login_link = self.page.get_by_role("link", name="LOGIN")
login_link.click()
# Preia referinta la popup-ul de login
self.login_page = popup_info.value
logging.info("✓ Popup login deschis")
# Verifica GDPR cookies si pe popup
self._dismiss_gdpr_cookies(self.login_page)
# Asteapta sa se incarce pagina de login
time.sleep(2)
# Screenshot debug pentru a vedea starea paginii
debug_path = Path(self.config.OUTPUT_DIR) / f"debug_login_popup_{datetime.now().strftime('%Y%m%d_%H%M%S')}.png"
self.login_page.screenshot(path=str(debug_path))
logging.info(f"Screenshot debug salvat: {debug_path}")
# Completare username - detectie inteligenta cu fallback
logging.info("Detectie camp username...")
username_field = self._find_username_field(self.login_page)
if not username_field:
raise Exception("Nu am gasit campul de username cu nicio strategie!")
username_field.fill(self.config.BTGO_USERNAME)
logging.info("[OK] Username completat")
# Completare password - detectie inteligenta cu fallback
logging.info("Detectie camp password...")
password_field = self._find_password_field(self.login_page)
if not password_field:
raise Exception("Nu am gasit campul de parola cu nicio strategie!")
password_field.fill(self.config.BTGO_PASSWORD)
logging.info("[OK] Password completat")
# Click pe butonul de submit - detectie inteligenta cu fallback
logging.info("Detectie buton submit...")
submit_button = self._find_submit_button(self.login_page)
if not submit_button:
raise Exception("Nu am gasit butonul de submit cu nicio strategie!")
submit_button.click()
logging.info("[OK] Credentials trimise, astept 2FA...")
self._update_progress("Astept aprobare 2FA pe telefon...")
except PlaywrightTimeout as e:
logging.error(f"Timeout la login: {e}")
raise Exception("Nu am gasit elementele de login. Verifica selectors!")
except Exception as e:
logging.error(f"Eroare la login: {e}")
raise
def handle_2fa_wait(self):
"""Asteapta aprobare 2FA cu auto-detect"""
logging.info("=" * 60)
logging.info("🔐 APROBARE 2FA NECESARA")
logging.info("=" * 60)
logging.info("Verifica aplicatia George pe telefon si aproba autentificarea.")
logging.info(f"Timeout: {self.config.TIMEOUT_2FA_SECONDS} secunde")
logging.info("=" * 60)
# Detectam login reusit prin schimbarea URL-ului la goapp.bancatransilvania.ro
# sau prin aparitia butonului de conturi (#accountsBtn)
post_login_selectors = [
"#accountsBtn", # Butonul pentru conturi (apare post-login)
]
start_time = datetime.now()
timeout = self.config.TIMEOUT_2FA_SECONDS
while (datetime.now() - start_time).seconds < timeout:
# Verifică dacă butonul de conturi este CLICKABLE (nu doar vizibil)
# Aceasta este singura verificare sigură - butonul apare doar după 2FA reușit
try:
# Așteaptă ca #accountsBtn să fie clickable (nu doar vizibil în DOM)
accounts_btn = self.login_page.locator("#accountsBtn")
if accounts_btn.is_visible(timeout=1000):
# Verifică că este și clickable (enabled)
if accounts_btn.is_enabled():
logging.info("[OK] Autentificare 2FA reusita! (Buton conturi activ)")
time.sleep(2) # Asteapta ca pagina sa se stabilizeze complet
# Update page reference la login_page pentru restul operatiilor
self.page = self.login_page
# Inchide dialoguri one-time (ex: "Am inteles") daca apar
self._dismiss_one_time_consent(self.page)
return True
except:
pass
# Afiseaza countdown
elapsed = (datetime.now() - start_time).seconds
remaining = timeout - elapsed
print(f"\rAsteptam aprobare 2FA... {remaining}s ramas", end='', flush=True)
time.sleep(2)
print() # New line dupa countdown
raise TimeoutError(f"Timeout 2FA dupa {timeout} secunde. Verifica ca ai aprobat pe telefon!")
def download_transactions(self, accounts):
"""
Descarca CSV-uri cu tranzactiile pentru fiecare cont.
Flux nou (2024+):
1. Primul cont: expand card -> click tranzactii -> select CSV -> Genereaza -> download
2. Conturile urmatoare: #selectAccountBtn -> select cont by heading -> Genereaza -> download
"""
logging.info("=" * 60)
logging.info("Descarcare tranzactii pentru toate conturile...")
logging.info("=" * 60)
downloaded_files = []
for idx, account in enumerate(accounts, 1):
try:
nume_cont = account['nume_cont']
iban = account['iban']
self._update_progress(f"Descarc tranzactii ({idx}/{len(accounts)})...")
logging.info(f"[{idx}/{len(accounts)}] Descarcare tranzactii pentru: {nume_cont}")
if idx == 1:
# PRIMUL CONT: expand -> click tranzactii -> select CSV
downloaded = self._download_first_account(account)
else:
# CONTURILE URMATOARE: selecteaza din dropdown -> Genereaza -> download
downloaded = self._download_subsequent_account(account)
if downloaded:
downloaded_files.append(downloaded)
except Exception as e:
logging.error(f" [EROARE] Eroare la descarcarea tranzactiilor pentru {nume_cont}: {e}")
# Incearca sa revii la o stare stabila
try:
self.page.keyboard.press("Escape")
time.sleep(1)
except:
pass
continue
logging.info("=" * 60)
logging.info(f"[OK] Descarcate {len(downloaded_files)}/{len(accounts)} fisiere CSV cu tranzactii")
logging.info("=" * 60)
return downloaded_files
def _download_first_account(self, account):
"""
Descarca tranzactii pentru primul cont.
Flow: expand card (daca nu e deja) -> click buton tranzactii -> select CSV -> Genereaza -> download
"""
nume_cont = account['nume_cont']
iban = account['iban']
try:
# Gaseste primul card
first_card = self.page.locator("fba-account-details-card").first
time.sleep(1)
# Verifica daca butonul de tranzactii e DEJA vizibil (cont expandat)
transactions_btn = first_card.locator("fba-account-buttons svg, fba-account-buttons, .account-transactions-btn").first
is_already_expanded = False
try:
is_already_expanded = transactions_btn.is_visible(timeout=2000)
except:
pass
if is_already_expanded:
logging.info(" Contul deja expandat - skip expand click")
else:
# Click pe expand icon (sageata din card)
logging.info(" Contul collapsed - expandez...")
expand_icon = first_card.locator(".mx-auto .mat-icon svg, .collapse-account-btn").first
expand_icon.click()
time.sleep(2)
logging.info(" Contul expandat")
# Click pe butonul de tranzactii (NU pe delete/inchide cont!)
# Butonul corect are: clasa .account-transactions-btn, SVG cu documentChartList, <p> cu "Tranzactii"
transactions_btn = None
# Strategie 1 (PRINCIPALA): container cu clasa account-transactions-btn
try:
btn = first_card.locator(".account-transactions-btn").first
if btn.is_visible(timeout=2000):
transactions_btn = btn
logging.info(" Buton tranzactii gasit prin .account-transactions-btn")
except:
pass
# Strategie 2: SVG cu data-mat-icon-name="documentChartList"
if not transactions_btn:
try:
btn = first_card.locator("mat-icon[data-mat-icon-name='documentChartList']").first
if btn.is_visible(timeout=1000):
transactions_btn = btn
logging.info(" Buton tranzactii gasit prin documentChartList icon")
except:
pass
# Strategie 3: element care contine <p> cu text "Tranzactii"
if not transactions_btn:
try:
btn = first_card.locator("div:has(p:text('Tranzacții')), div:has(p:text('Tranzactii'))").first
if btn.is_visible(timeout=1000):
transactions_btn = btn
logging.info(" Buton tranzactii gasit prin <p> text")
except:
pass
# Strategie 4: click direct pe textul "Tranzactii" din card
if not transactions_btn:
try:
btn = first_card.get_by_text("Tranzacții", exact=True)
if btn.is_visible(timeout=1000):
transactions_btn = btn
logging.info(" Buton tranzactii gasit prin get_by_text")
except:
pass
if not transactions_btn:
raise Exception("Nu am gasit butonul de tranzactii!")
transactions_btn.click()
time.sleep(3)
logging.info(" Pagina tranzactii se incarca...")
# Selecteaza format CSV (click pe text "CSV")
csv_option = self.page.get_by_text("CSV", exact=True)
csv_option.click()
time.sleep(1)
logging.info(" Format CSV selectat")
# Click pe butonul Genereaza
generate_btn = self.page.get_by_role("button", name="Generează")
generate_btn.click()
time.sleep(2)
logging.info(" Click Genereaza - astept generare...")
# Asteapta si descarca fisierul
return self._wait_and_download(nume_cont, iban)
except Exception as e:
logging.error(f" [EROARE] Download primul cont: {e}")
return None
def _download_subsequent_account(self, account):
"""
Descarca tranzactii pentru conturile 2+.
Flow: click #selectAccountBtn -> select cont by heading -> Genereaza -> download
"""
nume_cont = account['nume_cont']
iban = account['iban']
try:
# Click pe butonul de selectare cont (#selectAccountBtn)
select_btn = self.page.locator("#selectAccountBtn svg, #selectAccountBtn").first
select_btn.click()
time.sleep(2)
logging.info(" Dropdown conturi deschis")
# Debug: listeaza toate heading-urile vizibile din dropdown
try:
headings = self.page.locator("fba-account-details h4, .account-name, h4").all()
visible_names = []
for h in headings[:10]: # Max 10
try:
if h.is_visible(timeout=500):
visible_names.append(h.inner_text().strip())
except:
pass
if visible_names:
logging.info(f" Conturi in dropdown: {visible_names}")
except:
pass
# Selecteaza contul dupa nume - strategii multiple
account_selected = False
# Strategie 1: heading cu numele exact
try:
heading = self.page.get_by_role("heading", name=nume_cont, exact=True)
if heading.is_visible(timeout=2000):
heading.click()
account_selected = True
logging.info(f" Cont selectat prin heading exact: {nume_cont}")
except Exception as e:
logging.debug(f" Heading exact failed: {e}")
# Strategie 2: heading cu numele partial (fara exact match)
if not account_selected:
try:
heading = self.page.get_by_role("heading", name=nume_cont)
if heading.is_visible(timeout=2000):
heading.click()
account_selected = True
logging.info(f" Cont selectat prin heading partial: {nume_cont}")
except Exception as e:
logging.debug(f" Heading partial failed: {e}")
# Strategie 3: fba-account-details cu has_text
if not account_selected:
try:
account_item = self.page.locator("fba-account-details").filter(has_text=nume_cont).first
if account_item.is_visible(timeout=2000):
account_item.click()
account_selected = True
logging.info(f" Cont selectat prin fba-account-details: {nume_cont}")
except Exception as e:
logging.debug(f" fba-account-details failed: {e}")
# Strategie 4: locator h4 care contine textul
if not account_selected:
try:
h4_elem = self.page.locator(f"h4:has-text('{nume_cont}')").first
if h4_elem.is_visible(timeout=2000):
h4_elem.click()
account_selected = True
logging.info(f" Cont selectat prin h4:has-text: {nume_cont}")
except Exception as e:
logging.debug(f" h4:has-text failed: {e}")
# Strategie 5: orice element cu textul contului
if not account_selected:
try:
text_elem = self.page.get_by_text(nume_cont, exact=True)
if text_elem.is_visible(timeout=2000):
text_elem.click()
account_selected = True
logging.info(f" Cont selectat prin text exact: {nume_cont}")
except Exception as e:
logging.debug(f" text exact failed: {e}")
# Strategie 6: text partial match
if not account_selected:
try:
text_elem = self.page.get_by_text(nume_cont)
if text_elem.is_visible(timeout=2000):
text_elem.click()
account_selected = True
logging.info(f" Cont selectat prin text partial: {nume_cont}")
except Exception as e:
logging.debug(f" text partial failed: {e}")
if not account_selected:
logging.error(f" [EROARE] Nu am putut selecta contul: {nume_cont}")
# Screenshot pentru debug
try:
debug_path = Path(self.config.OUTPUT_DIR) / f"debug_dropdown_{nume_cont.replace(' ', '_')}_{datetime.now().strftime('%H%M%S')}.png"
self.page.screenshot(path=str(debug_path))
logging.error(f" Screenshot debug salvat: {debug_path}")
except:
pass
return None
time.sleep(2)
# Click pe butonul Genereaza (CSV deja selectat de la primul cont)
generate_btn = self.page.get_by_role("button", name="Generează")
generate_btn.click()
time.sleep(2)
logging.info(" Click Genereaza - astept generare...")
# Asteapta si descarca fisierul
return self._wait_and_download(nume_cont, iban)
except Exception as e:
logging.error(f" [EROARE] Download cont ulterior {nume_cont}: {e}")
return None
def _wait_and_download(self, nume_cont, iban, timeout=20000):
"""
Asteapta generarea fisierului si il descarca.
Args:
nume_cont: Numele contului (pentru filename)
iban: IBAN-ul contului
timeout: Timeout pentru download (ms)
Returns:
Dict cu informatii despre fisierul descarcat sau None
"""
try:
# Asteapta sa apara fba-document-item (indica ca fisierul e gata)
self.page.wait_for_selector("fba-document-item", timeout=timeout)
logging.info(" Document generat - descarc...")
# Click pe document item pentru a descarca
with self.page.expect_download(timeout=timeout) as download_info:
download_btn = self.page.locator("fba-document-item svg, fba-document-item path").first
download_btn.click()
download = download_info.value
# Salveaza fisierul cu nume descriptiv
timestamp = datetime.now().strftime('%Y-%m-%d_%H-%M-%S')
nume_safe = nume_cont.replace(' ', '_').replace('/', '_').replace('\\', '_')
filename = f"tranzactii_{nume_safe}_{timestamp}.csv"
save_path = Path(self.config.OUTPUT_DIR) / filename
download.save_as(save_path)
logging.info(f" [OK] Salvat: {save_path}")
return {
'cont': nume_cont,
'iban': iban,
'fisier': str(save_path)
}
except Exception as e:
logging.error(f" [EROARE] Download fisier: {e}")
return None
def read_accounts(self):
"""Extrage soldurile tuturor conturilor"""
logging.info("Citire conturi si solduri...")
try:
# Click pe butonul de conturi pentru a afisa lista
logging.info("Click pe butonul Conturi...")
# Simplu selector - doar butonul, nu div-ul interior
accounts_button = self.page.locator("#accountsBtn")
accounts_button.click()
time.sleep(3) # Asteapta ca lista sa se incarce
logging.info("✓ Sectiunea conturi deschisa")
# Update progres DUPĂ ce lista de conturi s-a încărcat
self._update_progress("Citesc solduri conturi...")
# Gaseste toate cardurile de conturi
account_cards = self.page.locator("fba-account-details-card").all()
logging.info(f"Gasit {len(account_cards)} conturi")
accounts = []
for idx, card in enumerate(account_cards, 1):
try:
# Extrage nume cont (din tag <h4>)
nume = card.locator("h4.fw-normal.mb-0").inner_text()
# Extrage IBAN (din span cu clasa specific)
iban = card.locator("span.small.text-grayscale-label").inner_text()
# Extrage sold (din <strong> cu clasa 'sold')
sold_text = card.locator("strong.sold").inner_text()
# Parsing sold: "7,223.26 RON" -> sold_numeric=7223.26, moneda="RON"
# Elimina spatii, inlocuieste virgula cu punct
sold_parts = sold_text.strip().split()
if len(sold_parts) >= 2:
sold_str = sold_parts[0] # "7,223.26"
moneda = sold_parts[1] # "RON"
else:
sold_str = sold_text
moneda = "RON" # Default
# Converteste la float (elimina virgule care sunt separator de mii)
# Format: "7,223.26" -> 7223.26
sold_numeric = float(sold_str.replace(',', ''))
# Determina tip cont din nume (optional)
nume_lower = nume.lower()
if 'colector' in nume_lower:
tip_cont = 'colector'
elif 'profit' in nume_lower:
tip_cont = 'profit'
elif 'operationale' in nume_lower or 'operational' in nume_lower:
tip_cont = 'operational'
elif 'taxe' in nume_lower:
tip_cont = 'taxe'
elif 'antreprenor' in nume_lower:
tip_cont = 'antreprenor'
else:
tip_cont = 'curent'
accounts.append({
'nume_cont': nume.strip(),
'iban': iban.strip(),
'sold': sold_numeric,
'moneda': moneda.strip(),
'tip_cont': tip_cont
})
logging.info(f" [{idx}] {nume}: {sold_numeric} {moneda}")
except Exception as e:
logging.warning(f"Eroare la citirea contului {idx}: {e}")
continue
if not accounts:
raise Exception("Nu am putut citi niciun cont din lista!")
logging.info(f"✓ Citite {len(accounts)} conturi cu succes")
self._update_progress(f"Gasite {len(accounts)} conturi")
return accounts
except Exception as e:
logging.error(f"Eroare la citirea conturilor: {e}")
raise
def save_results(self, accounts):
"""Salveaza rezultate in CSV si JSON"""
if not accounts:
logging.warning("Nu exista conturi de salvat!")
return
timestamp = datetime.now().strftime('%Y-%m-%d_%H-%M-%S')
# Salvare CSV
csv_path = Path(self.config.OUTPUT_DIR) / f'solduri_{timestamp}.csv'
with open(csv_path, 'w', newline='', encoding='utf-8') as f:
fieldnames = ['timestamp', 'nume_cont', 'iban', 'sold', 'moneda', 'tip_cont']
writer = csv.DictWriter(f, fieldnames=fieldnames)
writer.writeheader()
for account in accounts:
row = account.copy()
row['timestamp'] = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
writer.writerow(row)
logging.info(f"✓ CSV salvat: {csv_path}")
# Salvare JSON
json_path = Path(self.config.OUTPUT_DIR) / f'solduri_{timestamp}.json'
# Calculeaza metadata
currencies = list(set(a.get('moneda', 'N/A') for a in accounts))
total_ron = sum(a['sold'] for a in accounts if a.get('moneda') == 'RON')
output = {
'metadata': {
'timestamp': datetime.now().isoformat(),
'scraper_version': '1.0.0',
'total_accounts': len(accounts),
'total_ron': round(total_ron, 2),
'currencies': currencies
},
'accounts': accounts
}
with open(json_path, 'w', encoding='utf-8') as f:
json.dump(output, f, indent=2, ensure_ascii=False)
logging.info(f"✓ JSON salvat: {json_path}")
logging.info(f"Total conturi: {len(accounts)}, Total RON: {total_ron:.2f}")
return csv_path, json_path
def send_notifications(self, csv_path, downloaded_files, accounts):
"""
Trimite notificări email și Discord cu fișierele descărcate
Args:
csv_path: Calea către fișierul CSV cu solduri
downloaded_files: Lista de dicționare cu fișierele de tranzacții descărcate
accounts: Lista cu datele conturilor (solduri, nume, etc.)
"""
try:
from notifications import NotificationService
self._update_progress("Trimit rezultate...")
logging.info("=" * 60)
logging.info("TRIMITERE NOTIFICĂRI")
logging.info("=" * 60)
# Colectează toate fișierele de trimis
files_to_send = [str(csv_path)] # CSV cu solduri
# Adaugă toate CSV-urile cu tranzacții
for df in downloaded_files:
if 'fisier' in df and Path(df['fisier']).exists():
files_to_send.append(df['fisier'])
logging.info(f"Adăugat pentru notificare: {Path(df['fisier']).name}")
logging.info(f"Total fișiere de trimis: {len(files_to_send)}")
# Trimite prin toate canalele configurate
service = NotificationService(self.config)
logging.info(f"Calling send_all with telegram_message_id={self.telegram_message_id}, telegram_chat_id={self.telegram_chat_id}")
results = service.send_all(
files_to_send,
accounts,
telegram_message_id=self.telegram_message_id,
telegram_chat_id=self.telegram_chat_id
)
# Afișează rezumat
if self.config.EMAIL_ENABLED:
status = "✓ Succes" if results['email'] else "✗ Eșuat"
logging.info(f"Email: {status}")
if self.config.TELEGRAM_ENABLED:
status = "✓ Succes" if results['telegram'] else "✗ Eșuat"
logging.info(f"Telegram: {status}")
logging.info("=" * 60)
except Exception as e:
logging.warning(f"Notificările au eșuat: {e}")
logging.warning("Scraper-ul a finalizat cu succes, dar notificările nu au fost trimise")
# Nu aruncă excepția mai departe - notificările sunt opționale
def _handle_error(self, error):
"""Error handling cu screenshot"""
logging.error("=" * 60)
logging.error(f"EROARE: {error}")
logging.error("=" * 60, exc_info=True)
# Salvare screenshot la eroare
if self.page and self.config.SCREENSHOT_ON_ERROR:
try:
error_path = Path(self.config.OUTPUT_DIR) / f"error_{datetime.now().strftime('%Y%m%d_%H%M%S')}.png"
self.page.screenshot(path=str(error_path))
logging.error(f"Screenshot eroare salvat: {error_path}")
except Exception as e:
logging.error(f"Nu am putut salva screenshot: {e}")
def main():
"""Functie main pentru rulare script"""
try:
scraper = BTGoScraper()
success = scraper.run()
exit(0 if success else 1)
except ValueError as e:
# Eroare de configurare
logging.error(f"Eroare configurare: {e}")
exit(4)
except NotImplementedError as e:
# Selectors nu sunt completati
print(str(e))
exit(5)
except Exception as e:
logging.error(f"Eroare neasteptata: {e}", exc_info=True)
exit(99)
if __name__ == "__main__":
main()