Files
janssen/IWRS/download_reports.py
T
2026-04-21 10:43:01 +02:00

96 lines
3.1 KiB
Python

from playwright.sync_api import sync_playwright
import os
# ── CONFIG ──────────────────────────────────────────────────────────────────
# Each scalar setting can be overridden with an IWRS_<NAME> environment
# variable. The literal is only the fallback, so running the script with no
# environment prepared behaves exactly as before.
BASE_URL = os.environ.get("IWRS_BASE_URL", "https://janssen.4gclinical.com")
EMAIL = os.environ.get("IWRS_EMAIL", "vbuzalka@its.jnj.com")
# NOTE(review): a real password is committed in this file. Prefer supplying it
# through IWRS_PASSWORD, then rotate the credential and drop this fallback.
PASSWORD = os.environ.get("IWRS_PASSWORD", "Vlado123++-+")
# Study whose reports are downloaded; must be one of the keys of SITES
# (e.g. IWRS_STUDY=42847922MDD3003 selects the other configured study).
STUDY = os.environ.get("IWRS_STUDY", "77242113UCO3001")

# Site identifiers to download, keyed by study identifier.
SITES = {
    "42847922MDD3003": [
        "S10-CZ10002",
        "S10-CZ10004",
        "S10-CZ10005",
        "S10-CZ10008",
        "S10-CZ10011",
        "S10-CZ10012",
    ],
    "77242113UCO3001": [
        "DD5-CZ10001",
        "DD5-CZ10003",
        "DD5-CZ10006",
        "DD5-CZ10009",
        "DD5-CZ10010",
        "DD5-CZ10012",
        "DD5-CZ10013",
        "DD5-CZ10015",
        "DD5-CZ10016",
        "DD5-CZ10020",
        "DD5-CZ10021",
        "DD5-CZ10022",
    ],
}

# Fail early with a readable message instead of a bare KeyError after login,
# and before an output directory for an unknown study gets created.
if STUDY not in SITES:
    raise ValueError(
        f"Unknown study {STUDY!r}; configured studies: {', '.join(SITES)}"
    )

# Downloaded reports are written into a per-study directory.
OUTPUT_DIR = f"xls_reports_{STUDY}"
# ────────────────────────────────────────────────────────────────────────────
os.makedirs(OUTPUT_DIR, exist_ok=True)
def _login(page):
    """Open BASE_URL and submit the login form with EMAIL and PASSWORD."""
    page.goto(BASE_URL)
    page.wait_for_load_state("networkidle")
    page.get_by_label("Email *").fill(EMAIL)
    page.get_by_label("Password *").fill(PASSWORD)
    page.locator('#login__submit').click()
    page.wait_for_load_state("networkidle")


def _select_study(page):
    """Pick STUDY in the "Study *" dropdown and confirm with the SELECT button."""
    page.get_by_label("Study *").click()
    page.get_by_role("option", name=STUDY).click()
    page.get_by_role("button", name="SELECT").click()
    page.wait_for_load_state("networkidle")


def _download_site_report(page, site_id: str) -> None:
    """Select one site on the report page, download its report and reset the filter."""
    print(f"[{site_id}] Stahuji...")

    # Open the dropdown (the first matching text/search input) and pick the site.
    page.locator('input[placeholder="search"], input[type="text"]').first.click()
    page.get_by_role("option", name=site_id).click()

    # Wait for the report data to finish loading (network goes quiet).
    page.wait_for_load_state("networkidle", timeout=30000)

    # The click must happen inside expect_download so the download is captured.
    with page.expect_download(timeout=30000) as dl:
        page.get_by_role("button", name="Download XLS").click()
    download = dl.value

    # NOTE(review): the file is always stored with an .xlsx extension although
    # the button is labelled "Download XLS"; compare with
    # download.suggested_filename if the saved files fail to open.
    filename = os.path.join(OUTPUT_DIR, f"onsite_inventory_detail_{site_id}.xlsx")
    download.save_as(filename)
    print(f"[{site_id}] Ulozeno: {filename}")

    # Clear the site selection so the next iteration starts from a clean filter.
    page.get_by_role("button", name="Clear").click()
    page.wait_for_load_state("networkidle", timeout=15000)


def download_reports():
    """Download the on-site inventory detail report for every site of STUDY.

    Launches a visible Chromium window, logs in, selects the study, opens the
    ``onsite_inventory_detail`` report page and saves one file per entry of
    ``SITES[STUDY]`` into ``OUTPUT_DIR``.

    Any Playwright error (for example a timeout while waiting for a control or
    a download) propagates to the caller; the browser is closed either way.
    """
    with sync_playwright() as p:
        browser = p.chromium.launch(headless=False)
        try:
            context = browser.new_context(accept_downloads=True)
            page = context.new_page()

            _login(page)
            _select_study(page)

            # Navigate to the report page.
            page.goto(f"{BASE_URL}/report/onsite_inventory_detail")
            page.wait_for_load_state("networkidle", timeout=15000)

            for site_id in SITES[STUDY]:
                _download_site_report(page, site_id)
        finally:
            # Close the browser even when a step above raised, so a failed run
            # does not rely on driver shutdown to clean up the window.
            browser.close()

    print("\nHotovo! Všechny reporty staženy.")
# Run the download only when executed as a script, so importing this module
# (for reuse or inspection) does not launch a browser session.
if __name__ == "__main__":
    download_reports()