z230

Merge remote-tracking branch 'origin/master'
2026-02-03 18:01:23 +01:00 · 2026-02-03 13:26:11 +01:00 · 2026-02-02 09:22:02 +01:00 · 2026-02-02 09:19:11 +01:00 · 2026-02-01 13:49:23 +01:00 · 2026-01-24 08:41:48 +01:00
13 changed files with 2135 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1,2 @@
+.venv/
+.idea/
--- a/Library/10
+++ b/Library/10
@@ -0,0 +1,200 @@
+import os
+import sys
+import pymysql
+import pymysql.cursors
+
+# ================= CONFIGURATION =================
+
+# --- SAFETY SWITCH ---
+# True  = LIST ONLY (nothing is deleted, the database is not changed)
+# False = LIVE MODE (deletes files and DB records!)
+DRY_MODE = True
+
+# 1. MySQL access
+# NOTE(review): root credentials are hard-coded here; consider loading them
+# from the environment or a config file kept out of version control.
+DB_CONFIG = {
+    'host': '192.168.1.76',
+    'port': 3307,
+    'user': 'root',
+    'password': 'Vlado9674+',
+    'db': 'torrents',
+    'charset': 'utf8mb4',
+    'autocommit': True
+}
+
+# Name of the table that is queried and modified.
+TABULKA = "file_md5_index"
+
+# 2. Path mapping
+# Prefix of the paths as they are stored in the database (server side).
+SERVER_PREFIX = "/mnt/user/Library"
+# Raw string so the backslashes of the UNC path are taken literally.
+LOCAL_PREFIX = r"\\tower1\#library"
+
+
+# ===============================================
+
+def get_connection():
+    return pymysql.connect(
+        cursorclass=pymysql.cursors.DictCursor,
+        **DB_CONFIG
+    )
+
+
+def convert_path(db_path):
+    """Převede cestu z Linux serveru na lokální cestu Windows."""
+    if db_path.startswith(SERVER_PREFIX):
+        relative_path = db_path[len(SERVER_PREFIX):]
+        # Ořízneme počáteční lomítka z relativní cesty, aby fungoval join
+        relative_path = relative_path.lstrip("/").lstrip("\\")
+        # Spojí cesty a opraví lomítka
+        local_path = os.path.join(LOCAL_PREFIX, relative_path)
+        return os.path.normpath(local_path)
+    return None
+
+
+def step_1_mark_duplicates():
+    print(f"\n--- KROK 1: Hledání duplicit v DB (DRY_MODE={DRY_MODE}) ---")
+
+    try:
+        conn = get_connection()
+        with conn.cursor() as cursor:
+            if DRY_MODE:
+                # V DRY_MODE jen počítáme, co bychom označili (neprovádíme UPDATE)
+                sql = f"""
+                SELECT COUNT(*) as pocet
+                FROM {TABULKA} t1
+                JOIN {TABULKA} t2 ON t1.blake3 = t2.blake3
+                WHERE t1.host_name = 'TOWER1' 
+                  AND t2.host_name = 'SYNOLOGY'
+                  AND (t1.to_delete IS NULL OR t1.to_delete = 0);
+                """
+                cursor.execute(sql)
+                result = cursor.fetchone()
+                affected = result['pocet']
+                print(f"[DRY-RUN] Našel jsem {affected} shodných záznamů (DB nebude změněna).")
+            else:
+                # V OSTRÉM režimu provádíme UPDATE
+                sql = f"""
+                UPDATE {TABULKA} t1
+                JOIN {TABULKA} t2 ON t1.blake3 = t2.blake3
+                SET t1.to_delete = 1
+                WHERE t1.host_name = 'TOWER' 
+                  AND t2.host_name = 'SYNOLOGY'
+                  AND (t1.to_delete IS NULL OR t1.to_delete = 0);
+                """
+                print("Provádím UPDATE záznamů v databázi...")
+                cursor.execute(sql)
+                affected = cursor.rowcount
+                conn.commit()
+                print(f"Hotovo. Označeno {affected} záznamů ke smazání.")
+
+        conn.close()
+        return affected
+
+    except pymysql.MySQLError as e:
+        print(f"Chyba MySQL při označování: {e}")
+        sys.exit(1)
+
+
+def step_2_delete_files():
+    print(f"\n--- KROK 2: Mazání souborů (DRY_MODE={DRY_MODE}) ---")
+
+    try:
+        conn = get_connection()
+        files_to_process = []
+
+        with conn.cursor() as cursor:
+            print("Stahuji seznam souborů...")
+
+            if DRY_MODE:
+                # V DRY_MODE nemůžeme hledat podle 'to_delete=1' (protože jsme nic neoznačili),
+                # takže musíme použít JOIN dotaz přímo pro simulaci výpisu.
+                sql = f"""
+                SELECT t1.id, t1.full_path 
+                FROM {TABULKA} t1
+                JOIN {TABULKA} t2 ON t1.blake3 = t2.blake3
+                WHERE t1.host_name = 'TOWER' 
+                  AND t2.host_name = 'SYNOLOGY'
+                  AND (t1.to_delete IS NULL OR t1.to_delete = 0)
+                """
+            else:
+                # V OSTRÉM režimu bereme to, co jsme v kroku 1 označili
+                sql = f"SELECT id, full_path FROM {TABULKA} WHERE host_name = 'TOWER' AND to_delete = 1"
+
+            cursor.execute(sql)
+            files_to_process = cursor.fetchall()
+
+        count = len(files_to_process)
+        print(f"Nalezeno {count} souborů.")
+
+        if count == 0:
+            print("Žádné soubory k zpracování. Konec.")
+            return
+
+        # V ostrém režimu se zeptáme na potvrzení
+        if not DRY_MODE:
+            confirm = input(f"-> [POZOR] Opravdu chcete SMAZAT {count} souborů? (napište 'ano'): ")
+            if confirm.lower() != 'ano':
+                print("Operace zrušena.")
+                return
+        else:
+            print("-" * 40)
+            print("VÝPIS SOUBORŮ, KTERÉ BY BYLY SMAZÁNY:")
+            print("-" * 40)
+
+        deleted_counter = 0
+        errors = 0
+
+        for row in files_to_process:
+            db_id = row['id']
+            server_path = row['full_path']
+            local_path = convert_path(server_path)
+
+            if not local_path:
+                print(f"[SKIP PATH] Nesedí prefix: {server_path}")
+                continue
+
+            # --- LOGIKA DRY RUN vs REAL ---
+            if DRY_MODE:
+                # Pouze výpis
+                print(f"[DRY-RUN] Bylo by smazáno: {local_path}")
+                deleted_counter += 1
+            else:
+                # Ostré mazání
+                try:
+                    if os.path.exists(local_path):
+                        os.remove(local_path)
+                        print(f"[OK SMAZÁNO] {local_path}")
+
+                        # Smazání z DB
+                        with conn.cursor() as del_cursor:
+                            del_sql = f"DELETE FROM {TABULKA} WHERE id = %s"
+                            del_cursor.execute(del_sql, (db_id,))
+                        conn.commit()
+                        deleted_counter += 1
+                    else:
+                        print(f"[NENÍ NA DISKU] Mažu jen z DB: {local_path}")
+                        with conn.cursor() as del_cursor:
+                            del_sql = f"DELETE FROM {TABULKA} WHERE id = %s"
+                            del_cursor.execute(del_sql, (db_id,))
+                        conn.commit()
+                        deleted_counter += 1
+
+                except OSError as e:
+                    print(f"[CHYBA OS] {local_path}: {e}")
+                    errors += 1
+                except pymysql.MySQLError as e:
+                    print(f"[CHYBA DB] ID {db_id}: {e}")
+
+        conn.close()
+        print("-" * 30)
+        if DRY_MODE:
+            print(f"DRY RUN DOKONČEN. Zobrazena simulace pro {deleted_counter} souborů.")
+        else:
+            print(f"HOTOVO. Úspěšně smazáno: {deleted_counter}, Chyby: {errors}")
+
+    except pymysql.MySQLError as e:
+        print(f"Kritická chyba DB: {e}")
+
+
+# Script entry point: flag the duplicates first, then process the files.
+if __name__ == "__main__":
+    step_1_mark_duplicates()
+    step_2_delete_files()
--- a/MazáníPrádnýchAdresářů.py
+++ b/MazáníPrádnýchAdresářů.py
@@ -0,0 +1,38 @@
+import os
+
+
+def cleanup_empty_folders(target_path, dry_run=True):
+    # Kontrola, zda cesta existuje
+    if not os.path.exists(target_path):
+        print(f"Chyba: Cesta {target_path} neexistuje.")
+        return
+
+    print(f"Prohledávám: {target_path}")
+    if dry_run:
+        print("POZOR: Spuštěno v režimu DRY RUN (nic se nemaže)\n")
+
+    # topdown=False je klíčové - začínáme od nejhlubších složek
+    for root, dirs, files in os.walk(target_path, topdown=False):
+        for name in dirs:
+            folder_path = os.path.join(root, name)
+
+            # Kontrola, zda je složka prázdná
+            # Listdir vypíše vše v adresáři (včetně skrytých souborů)
+            if not os.listdir(folder_path):
+                if dry_run:
+                    print(f"[DRY RUN] Složka by byla smazána: {folder_path}")
+                else:
+                    try:
+                        os.rmdir(folder_path)
+                        print(f"Smazáno: {folder_path}")
+                    except OSError as e:
+                        print(f"Chyba při mazání {folder_path}: {e}")
+
+
+if __name__ == "__main__":
+    # Path to the network share.
+    # On Windows use a raw string (r"") because of the backslashes.
+    path_to_clean = r"\\tower1\#library"
+
+    # Run with dry_run=True first to see what would happen.
+    cleanup_empty_folders(path_to_clean, dry_run=True)
--- a/ReadKulhavaPST.py
+++ b/ReadKulhavaPST.py
@@ -0,0 +1,92 @@
+import win32com.client
+import os
+
+# Location of the PST file that main() mounts in Outlook and walks.
+pst_path = r'd:\Dropbox\!!!Days\Downloads Z230\PST\tkulhava.pst'
+
+
+def main():
+    if not os.path.exists(pst_path):
+        print(f"Error: File not found at {pst_path}")
+        return
+
+    try:
+        # Connect to Outlook
+        outlook = win32com.client.Dispatch("Outlook.Application").GetNamespace("MAPI")
+
+        # 1. Add the PST to Outlook (This makes it visible in the sidebar)
+        print(f"Mounting PST: {pst_path}...")
+        outlook.AddStore(pst_path)
+
+        # 2. Find the folder object for this PST
+        # We search specifically for the folder that matches the filename 'tkulhava'
+        # or grab the last added store if the name doesn't match exactly.
+        pst_name = "tkulhava"  # derived from filename usually
+        root_folder = None
+
+        # Loop through all stores to find the new one
+        for folder in outlook.Folders:
+            if pst_name.lower() in folder.Name.lower():
+                root_folder = folder
+                break
+
+        # Fallback: Just grab the last folder in the list if name didn't match
+        if not root_folder:
+            root_folder = outlook.Folders.GetLast()
+
+        print(f"Successfully opened root folder: {root_folder.Name}")
+        print("=" * 50)
+
+        # 3. Start the recursive walk
+        print_subjects_recursively(root_folder)
+
+        # 4. Cleanup: Remove the PST from Outlook
+        # (Comment this out if you want to keep it open in Outlook to inspect manually)
+        outlook.RemoveStore(root_folder)
+        print("\nDone. PST detached.")
+
+    except Exception as e:
+        print(f"An error occurred: {e}")
+
+
+def print_subjects_recursively(folder):
+    """
+    Recursively prints subjects of emails in a folder and its subfolders.
+    """
+    try:
+        # Print current folder name for context
+        # Check if folder has items
+        if folder.Items.Count > 0:
+            print(f"\n--- Folder: {folder.Name} ---")
+
+        # Iterate through items
+        for item in folder.Items:
+            try:
+                # Class 43 is a standard MailItem. 
+                # Other items (meeting requests, reports) might not have a Subject or behave differently.
+                if item.Class == 43:
+                    print(f"Subject: {item.Subject}")
+                else:
+                    # Attempt to print subject anyway (e.g., for Meeting Items)
+                    print(f"[{type_name(item.Class)}] Subject: {item.Subject}")
+            except Exception:
+                # Skip items that are corrupted or unreadable
+                pass
+
+        # Recursion: Go deeper into subfolders
+        for subfolder in folder.Folders:
+            print_subjects_recursively(subfolder)
+
+    except Exception as e:
+        print(f"Skipping restricted folder '{folder.Name}': {e}")
+
+
+def type_name(class_id):
+    # Helper to identify non-email items
+    if class_id == 53: return "Meeting"
+    if class_id == 46: return "Report"
+    return f"Type {class_id}"
+
+
+# Run the PST walk only when executed as a script.
+if __name__ == "__main__":
+    main()
--- a/ReadKulhavaSavePhotos.py
+++ b/ReadKulhavaSavePhotos.py
@@ -0,0 +1,142 @@
+import win32com.client
+import os
+import pathlib
+
+# --- CONFIGURATION ---
+# PST file to mount and the folder that receives the extracted pictures.
+pst_path = r'd:\Dropbox\!!!Days\Downloads Z230\PST\tkulhava.pst'
+output_dir = r'd:\Dropbox\!!!Days\Downloads Z230\PST\pictures'
+
+# Attachment extensions treated as pictures (compared against the
+# lower-cased extension of the attachment file name).
+IMAGE_EXTENSIONS = {'.jpg', '.jpeg', '.png', '.gif', '.bmp', '.tif', '.tiff'}
+
+
+def fix_encoding(text):
+    """Repairs text wrongly decoded as cp1252 instead of cp1250."""
+    if not text: return ""
+    try:
+        return text.encode('cp1252').decode('cp1250')
+    except Exception:
+        return text
+
+
+def get_unique_filepath(directory, filename):
+    """
+    Checks if a file exists. If so, adds a counter (_1, _2) to the filename
+    until a unique name is found.
+    """
+    # Clean filename of illegal characters just in case
+    filename = "".join(x for x in filename if x.isalnum() or x in "._- ")
+
+    path = pathlib.Path(directory) / filename
+    if not path.exists():
+        return path
+
+    # Split name and extension
+    stem = path.stem
+    suffix = path.suffix
+    counter = 1
+
+    while True:
+        new_filename = f"{stem}_{counter}{suffix}"
+        new_path = pathlib.Path(directory) / new_filename
+        if not new_path.exists():
+            return new_path
+        counter += 1
+
+
+def process_item_attachments(item, save_folder):
+    """Checks an item for attachments and saves pictures."""
+    try:
+        # Check if item has attachments
+        if item.Attachments.Count > 0:
+            for attachment in item.Attachments:
+                try:
+                    # Get filename and extension
+                    fname = getattr(attachment, 'FileName', '')
+                    if not fname: continue
+
+                    # Fix encoding on filename if needed (sometimes attachments inherit bad encoding)
+                    fname = fix_encoding(fname)
+
+                    ext = os.path.splitext(fname)[1].lower()
+
+                    if ext in IMAGE_EXTENSIONS:
+                        # Determine unique path
+                        save_path = get_unique_filepath(save_folder, fname)
+
+                        # Save the file
+                        attachment.SaveAsFile(str(save_path))
+                        print(f"   [SAVED] {save_path.name}")
+                except Exception as e:
+                    print(f"   [ERROR saving attachment]: {e}")
+    except Exception:
+        # Some items (like corrupted notes) fail when accessing .Attachments
+        pass
+
+
+def scan_folder_recursively(folder, save_folder):
+    """Recursively walks folders and processes items."""
+    try:
+        folder_name = fix_encoding(folder.Name)
+
+        # Optional: Print folder progress
+        if folder.Items.Count > 0:
+            print(f"Scanning Folder: {folder_name}...")
+
+        # Process items in this folder
+        for item in folder.Items:
+            process_item_attachments(item, save_folder)
+
+        # Recursion
+        for subfolder in folder.Folders:
+            scan_folder_recursively(subfolder, save_folder)
+
+    except Exception as e:
+        print(f"Skipping folder '{fix_encoding(folder.Name)}': {e}")
+
+
+def main():
+    # 1. Ensure output directory exists
+    if not os.path.exists(output_dir):
+        os.makedirs(output_dir)
+        print(f"Created directory: {output_dir}")
+
+    if not os.path.exists(pst_path):
+        print(f"Error: PST file not found at {pst_path}")
+        return
+
+    try:
+        # 2. Connect to Outlook
+        outlook = win32com.client.Dispatch("Outlook.Application").GetNamespace("MAPI")
+
+        print(f"Mounting PST: {pst_path}...")
+        outlook.AddStore(pst_path)
+
+        # 3. Find the PST folder
+        pst_name = "tkulhava"  # Usually derived from filename
+        root_folder = None
+        for folder in outlook.Folders:
+            if pst_name.lower() in folder.Name.lower():
+                root_folder = folder
+                break
+
+        if not root_folder:
+            root_folder = outlook.Folders.GetLast()
+
+        print(f"Opened: {fix_encoding(root_folder.Name)}")
+        print(f"Saving pictures to: {output_dir}")
+        print("=" * 50)
+
+        # 4. Start processing
+        scan_folder_recursively(root_folder, output_dir)
+
+        # 5. Cleanup
+        outlook.RemoveStore(root_folder)
+        print("\nDone. PST detached.")
+
+    except Exception as e:
+        print(f"Critical Error: {e}")
+
+
+# Run the picture extraction only when executed as a script.
+if __name__ == "__main__":
+    main()
--- a/DuplicateTest.py
+++ b/DuplicateTest.py
@@ -0,0 +1,67 @@
+import pandas as pd
+from sqlalchemy import create_engine
+import time
+
+# --- CONFIGURATION ---
+# NOTE(review): credentials are hard-coded; consider loading them from the
+# environment instead.
+db_user = 'root'
+db_pass = 'Vlado9674+'
+db_host = '192.168.1.76'
+db_port = '3307'
+db_name = 'torrents'  # <--- FILL IN THE DATABASE NAME HERE
+
+# --- CONNECTION ---
+# NOTE(review): db_pass contains '+' and is put into the URL unescaped;
+# SQLAlchemy expects special characters in URL passwords to be URL-encoded -
+# confirm the password is parsed as intended.
+connection_string = f'mysql+mysqlconnector://{db_user}:{db_pass}@{db_host}:{db_port}/{db_name}'
+engine = create_engine(connection_string)
+
+# SQL query - full_path is selected too, so Pandas can show an example path.
+# WARNING: loading 5.8M text strings (full_path) takes a lot of RAM (estimated 2-4 GB).
+query = """
+SELECT id, blake3, file_size, full_path 
+FROM file_md5_index FORCE INDEX (idx_full_path_prefix)
+WHERE host_name='Tower1' AND full_path LIKE '/mnt/user/#Library%'
+"""
+
+print("1. Začínám stahovat data z MySQL do RAM...")
+start_load = time.time()
+
+try:
+    # Download the data
+    df = pd.read_sql(query, engine)
+    end_load = time.time()
+    print(f"-> Data stažena za: {end_load - start_load:.2f} sekund")
+    print(f"-> Počet řádků v paměti: {len(df)}")
+
+    print("\n2. Začínám hledat duplicity (Pandas GroupBy)...")
+    start_process = time.time()
+
+    # Duplicate detection:
+    # keep only the rows whose hash occurs more than once
+    duplicity = df[df.duplicated(subset=['blake3'], keep=False)]
+
+    if not duplicity.empty:
+        # Group by hash: one result row per duplicated file content
+        vysledek = duplicity.groupby('blake3').agg({
+            'file_size': 'first',  # File size (assumed equal for equal hashes)
+            'id': 'count',  # Number of occurrences
+            'full_path': lambda x: x.iloc[0]  # Example: the first path of the group
+        }).rename(columns={'id': 'pocet_kopii'})
+
+        # Wasted space = size of one file * number of redundant copies;
+        # sort by it so the biggest waste comes first.
+        vysledek['celkove_plytvani'] = vysledek['file_size'] * (vysledek['pocet_kopii'] - 1)
+        vysledek = vysledek.sort_values('celkove_plytvani', ascending=False)
+
+        end_process = time.time()
+        print(f"-> Zpracováno za: {end_process - start_process:.4f} sekund")
+
+        print("\n--- TOP 20 NEJVĚTŠÍCH DUPLICIT ---")
+        # Show the hash (index), number of copies, size of one file and an example path
+        print(vysledek[['pocet_kopii', 'file_size', 'full_path']].head(20))
+
+        print(f"\nCelkem nalezeno {len(vysledek)} unikátních souborů, které mají duplicity.")
+    else:
+        print("Nebyly nalezeny žádné duplicity.")
+
+except Exception as e:
+    # Top-level boundary of the script: report the error and give a hint.
+    print(f"\nCHYBA: {e}")
+    print("Zkontrolujte prosím název databáze a jestli máte dost paměti RAM.")
--- a/WalkFilesOnBackupHDD/10
+++ b/WalkFilesOnBackupHDD/10
@@ -0,0 +1,295 @@
+#!/usr/bin/python3
+# -*- coding: utf-8 -*-
+
+"""
+FAST FILE HASH INDEXER – WINDOWS CLIENT (EXTERNAL DISKS)
+- Mode: PHYSICAL BACKUP
+- Hostname in DB = Disk Label (e.g., #HD015)
+- Path in DB     = Relative path (e.g., /Movies/Film.mkv)
+"""
+
+import os, time
+import pymysql
+import socket
+import platform
+import sys
+from blake3 import blake3
+
+# ==============================
+# CONFIG
+# ==============================
+CHUNK_SIZE = 5 * 1024 * 1024   # 5 MB
+PROGRESS_MIN_SIZE = 500 * 1024 * 1024  # 500 MB
+PROGRESS_INTERVAL = 1.0  # seconds
+
+EXCLUDED_DIRS = {"$RECYCLE.BIN", "System Volume Information", "RECYCLER", "msdownld.tmp"}
+
+# --- Limity velikosti ---
+FILE_MIN_SIZE = 0
+FILE_MAX_SIZE = 1024 * 1024 * 1024* 1024  # 1TB
+
+# --- Nastavení Databáze ---
+DB_CONFIG = {
+    "host": "192.168.1.76",
+    "port": 3307,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+    "autocommit": True,
+}
+
+CHUNK_SIZE = 4 * 1024 * 1024  # 4 MB
+PRINT_SKIPPED = False  # True = vypisovat i přeskočené
+
+# ==============================
+# SYSTEM INFO
+# ==============================
+
+# Physical name of this PC (console output only; the disk label goes into the DB)
+REAL_PC_HOSTNAME = socket.gethostname()
+# Operating system name, stored in the os_name column of every indexed file.
+OS_NAME = platform.system()
+
+
+# ==============================
+# FUNCTIONS
+# ==============================
+
+def compute_blake3(path: str) -> bytes:
+    h = blake3()
+    total_size = os.path.getsize(path)
+    show_progress = total_size >= PROGRESS_MIN_SIZE
+
+    processed = 0
+    start_time = time.time()
+    last_report = start_time
+
+    try:
+        with open(path, "rb") as f:
+            while True:
+                chunk = f.read(CHUNK_SIZE)
+                if not chunk:
+                    break
+
+                h.update(chunk)
+                processed += len(chunk)
+
+                if show_progress:
+                    now = time.time()
+                    if now - last_report >= PROGRESS_INTERVAL:
+                        elapsed = now - start_time
+                        speed = processed / elapsed if elapsed > 0 else 0
+                        percent = processed / total_size * 100
+                        remaining = total_size - processed
+                        eta = remaining / speed if speed > 0 else 0
+
+                        print(
+                            f"   ⏳ {percent:6.2f}% | "
+                            f"{processed/1024/1024:8.1f} / {total_size/1024/1024:.1f} MB | "
+                            f"{speed/1024/1024:6.1f} MB/s | "
+                            f"ETA {time.strftime('%H:%M:%S', time.gmtime(eta))}",
+                            flush=True
+                        )
+                        last_report = now
+
+        if show_progress:
+            total_time = time.time() - start_time
+            avg_speed = total_size / total_time if total_time > 0 else 0
+            print(
+                f"   ✅ DONE | "
+                f"{total_size/1024/1024:.1f} MB | "
+                f"avg {avg_speed/1024/1024:.1f} MB/s | "
+                f"time {time.strftime('%H:%M:%S', time.gmtime(total_time))}",
+                flush=True
+            )
+
+        return h.digest()
+
+    except Exception as e:
+        print(f"⚠️ HASH ERROR: {path} - {e}")
+        raise
+
+
+
+def get_drive_info():
+    """Získá písmeno disku a jeho ID (které se použije jako host_name)."""
+    print("\n💿 --- NASTAVENÍ SKENOVÁNÍ (EXTERNÍ DISK) ---")
+
+    # 1. Písmeno disku
+    while True:
+        drive_input = input("📂 Zadejte písmeno disku ve Windows (např. 'E'): ").strip().upper()
+        drive_letter = drive_input.replace(":", "").replace("\\", "").replace("/", "")
+
+        if len(drive_letter) == 1 and drive_letter.isalpha():
+            drive_root = f"{drive_letter}:\\"
+            if os.path.isdir(drive_root):
+                break
+            else:
+                print(f"❌ Disk {drive_root} není dostupný.")
+        else:
+            print("❌ Neplatný formát.")
+
+    # 2. Název disku -> HOST_NAME
+    while True:
+        disk_label = input("🏷️  Zadejte ID disku (bude uloženo jako 'host_name', např. '#HD015'): ").strip()
+        if len(disk_label) >= 2:
+            break
+        print("❌ Název je příliš krátký.")
+
+    return drive_root, disk_label
+
+
+def size_allowed(size: int) -> bool:
+    if FILE_MIN_SIZE is not None and size < FILE_MIN_SIZE: return False
+    if FILE_MAX_SIZE is not None and size > FILE_MAX_SIZE: return False
+    return True
+
+
+# ==============================
+# MAIN
+# ==============================
+
+def main():
+    print("🚀 BLAKE3 External Disk Indexer", flush=True)
+    print(f"🖥 Running on PC: {REAL_PC_HOSTNAME}", flush=True)
+
+    # Získání vstupů
+    scan_root, disk_hostname = get_drive_info()
+
+    print(f"✅ Konfigurace:")
+    print(f"   Zdroj (Windows) : {scan_root}")
+    print(f"   DB Hostname     : {disk_hostname}")
+    print(f"   DB Cesty        : /Složka/Soubor...")
+
+    try:
+        db = pymysql.connect(**DB_CONFIG)
+        cur = db.cursor()
+    except Exception as e:
+        print(f"❌ DB Connection failed: {e}")
+        input("Enter pro konec...")
+        return
+
+    print(f"📥 Načítám index pro disk: '{disk_hostname}'...", flush=True)
+
+    # === OPTIMALIZACE: Hledáme přesně podle host_name ===
+    cur.execute("""
+        SELECT full_path, file_size, UNIX_TIMESTAMP(mtime)
+        FROM file_md5_index
+        WHERE host_name = %s
+    """, (disk_hostname,))
+
+    # Mapa: { "/Slozka/Soubor.ext": (size, mtime) }
+    indexed_map = {row[0]: (row[1], row[2]) for row in cur.fetchall()}
+
+    print(f"✅ Nalezeno {len(indexed_map):,} souborů v DB pro tento disk.", flush=True)
+    print("======================================", flush=True)
+
+    new_files = 0
+    skipped = 0
+    filtered = 0
+    errors = 0
+    seen_paths = set()
+
+    # --- SCAN ---
+    for root, dirs, files in os.walk(scan_root):
+        # Ignorace systémových složek
+        dirs[:] = [d for d in dirs if d not in EXCLUDED_DIRS]
+
+        for fname in files:
+            disk_path = os.path.join(root, fname)
+
+            # 1. Stat (velikost, čas)
+            try:
+                stat = os.stat(disk_path)
+            except OSError:
+                errors += 1
+                continue
+
+            size = stat.st_size
+            if not size_allowed(size):
+                filtered += 1
+                continue
+
+            # 2. Vytvoření čisté cesty pro DB
+            # E:\Filmy\Avatar.mkv -> Filmy\Avatar.mkv
+            try:
+                rel_path = os.path.relpath(disk_path, scan_root)
+            except ValueError:
+                errors += 1
+                continue
+
+            # Normalizace na Linux style: Filmy/Avatar.mkv
+            clean_path = rel_path.replace("\\", "/")
+
+            # Přidání lomítka na začátek: /Filmy/Avatar.mkv
+            if not clean_path.startswith("/"):
+                clean_path = "/" + clean_path
+
+            if clean_path in seen_paths:
+                continue
+            seen_paths.add(clean_path)
+
+            mtime = int(stat.st_mtime)
+
+            # === STRICT CHECK ===
+            is_match = False
+            if clean_path in indexed_map:
+                db_size, db_mtime = indexed_map[clean_path]
+                if size == db_size and mtime == db_mtime:
+                    is_match = True
+
+            if is_match:
+                skipped += 1
+                if PRINT_SKIPPED:
+                    print(f"⏭ SKIP {clean_path}", flush=True)
+                continue
+
+            # === INSERT / UPDATE ===
+            print("➕ NEW / UPDATED", flush=True)
+            print(f"   File: {clean_path}", flush=True)
+            print(f"   Size: {size:,} B", flush=True)
+
+            try:
+                b3 = compute_blake3(disk_path)
+            except Exception:
+                errors += 1
+                continue
+
+            cur.execute("""
+                INSERT INTO file_md5_index
+                    (os_name, host_name, full_path, file_name, directory,
+                     file_size, mtime, blake3)
+                VALUES (%s, %s, %s, %s, %s, %s, FROM_UNIXTIME(%s), %s)
+                ON DUPLICATE KEY UPDATE
+                    file_size  = VALUES(file_size),
+                    mtime      = VALUES(mtime),
+                    blake3     = VALUES(blake3),
+                    updated_at = CURRENT_TIMESTAMP
+            """, (
+                OS_NAME,  # Např. 'Windows' (kde se to skenovalo)
+                disk_hostname,  # ZDE SE UKLÁDÁ '#HD015'
+                clean_path,  # ZDE SE UKLÁDÁ '/Filmy/Avatar.mkv'
+                fname,
+                os.path.dirname(clean_path),
+                size,
+                mtime,
+                b3,
+            ))
+
+            new_files += 1
+            print(f"   Hash: {b3.hex()}", flush=True)
+            print("--------------------------------------", flush=True)
+
+    print("======================================", flush=True)
+    print(f"✅ Hotovo : {new_files}")
+    print(f"⏭ Shoda  : {skipped}")
+    print(f"⚠️ Chyby  : {errors}")
+    print("🏁 Konec.")
+
+    cur.close()
+    db.close()
+    # input("\nStiskněte Enter pro ukončení...")
+
+
+# Run the indexer only when executed as a script.
+if __name__ == "__main__":
+    main()
--- a/WalkFilesOnBackupHDD/20
+++ b/WalkFilesOnBackupHDD/20
@@ -0,0 +1,355 @@
+#!/usr/bin/python3
+# -*- coding: utf-8 -*-
+
+r"""
+FAST FILE HASH INDEXER – WINDOWS CLIENT (HARDCODED CONFIG)
+- Mode: PHYSICAL BACKUP
+- Hostname in DB = Disk Label (e.g., #HD015)
+- Path in DB     = Relative path (e.g., /Movies/Film.mkv)
+"""
+
+import os, time
+import pymysql
+import socket
+import platform
+import sys
+from blake3 import blake3
+
+def get_path_hash(path_str: str) -> bytes:
+    """Return the raw 16-byte MD5 digest of ``path_str`` (UTF-8 encoded).
+
+    The digest length matches a BINARY(16) column.  ``hashlib`` is imported
+    inside the function because this script's import block does not provide
+    it; without the import the call failed with ``NameError``.
+    """
+    import hashlib
+
+    return hashlib.md5(path_str.encode("utf-8")).digest()
+
+# ==============================
+# ⚙️ USER CONFIGURATION
+# ==============================
+# Drive letter of the disk to index; main() builds the scan root as "<letter>:\".
+DISK_DRIVE_LETTER = "z"  # (e.g., "E", "F", "P")
+# Value written to, and filtered on, the host_name column for this disk.
+DISK_HOSTNAME = "TW22"  # (e.g., "#HD015")
+
+# 🔒 SAFETY SWITCH
+# True  = LIST ONLY (No DB changes). "Simulates" the run.
+# False = EXECUTE (Deletes and Inserts into DB).
+DRY_RUN = False
+
+# ==============================
+# TECHNICAL CONFIG
+# ==============================
+# Read size used by compute_blake3() while streaming a file.
+CHUNK_SIZE = 5 * 1024 * 1024  # 5 MB
+# Files at least this large get progress lines while being hashed.
+PROGRESS_MIN_SIZE = 500 * 1024 * 1024  # 500 MB
+# Minimum spacing between two progress lines.
+PROGRESS_INTERVAL = 1.0  # seconds
+
+# Directory names pruned from os.walk() (exact string match).
+EXCLUDED_DIRS = {"$RECYCLE.BIN", "System Volume Information", "RECYCLER", "msdownld.tmp"}
+
+# --- File Size Limits ---
+# Inclusive bounds checked by size_allowed(); None disables a bound.
+FILE_MIN_SIZE = 0
+FILE_MAX_SIZE = 1024 * 1024*1024*1024  # 1TB
+
+# --- DB Config ---
+# Keyword arguments passed verbatim to pymysql.connect().
+# NOTE(review): root credentials are hard-coded and committed; consider loading
+# them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.76",
+    "port": 3307,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+    "autocommit": True,
+}
+
+PRINT_SKIPPED = False  # Set True to see files that were already in DB
+
+# ==============================
+# SYSTEM INFO
+# ==============================
+# Name of the machine running the scan; main() only prints it.
+REAL_PC_HOSTNAME = socket.gethostname()
+# platform.system() value stored in the os_name column.
+OS_NAME = platform.system()
+
+
+# ==============================
+# FUNCTIONS
+# ==============================
+
+def compute_blake3(path: str) -> bytes:
+    """Hash the file at ``path`` with BLAKE3 and return the raw digest bytes.
+
+    The file is streamed in ``CHUNK_SIZE`` reads.  For files of at least
+    ``PROGRESS_MIN_SIZE`` bytes a progress line is printed no more often than
+    every ``PROGRESS_INTERVAL`` seconds, plus one summary line at the end.
+
+    Exceptions raised while opening or reading are printed and re-raised.
+    """
+    hasher = blake3()
+    file_bytes = os.path.getsize(path)
+    verbose = file_bytes >= PROGRESS_MIN_SIZE
+    mib = 1024 * 1024
+
+    done = 0
+    began = time.time()
+    reported_at = began
+
+    def clock(seconds):
+        # Render a duration in seconds as HH:MM:SS.
+        return time.strftime('%H:%M:%S', time.gmtime(seconds))
+
+    try:
+        with open(path, "rb") as stream:
+            # iter() with a sentinel stops on the empty read that marks EOF.
+            for piece in iter(lambda: stream.read(CHUNK_SIZE), b""):
+                hasher.update(piece)
+                done += len(piece)
+
+                if not verbose:
+                    continue
+
+                tick = time.time()
+                if tick - reported_at < PROGRESS_INTERVAL:
+                    continue
+
+                spent = tick - began
+                rate = done / spent if spent > 0 else 0
+                pct = done / file_bytes * 100
+                left = file_bytes - done
+                eta = left / rate if rate > 0 else 0
+
+                print(
+                    f"   ⏳ {pct:6.2f}% | "
+                    f"{done / mib:8.1f} / {file_bytes / mib:.1f} MB | "
+                    f"{rate / mib:6.1f} MB/s | "
+                    f"ETA {clock(eta)}",
+                    flush=True
+                )
+                reported_at = tick
+
+        if verbose:
+            duration = time.time() - began
+            mean_rate = file_bytes / duration if duration > 0 else 0
+            print(
+                f"   ✅ DONE | "
+                f"{file_bytes / mib:.1f} MB | "
+                f"avg {mean_rate / mib:.1f} MB/s | "
+                f"time {clock(duration)}",
+                flush=True
+            )
+
+        return hasher.digest()
+
+    except Exception as err:
+        print(f"⚠️ HASH ERROR: {path} - {err}")
+        raise
+
+
+def size_allowed(size: int) -> bool:
+    """Return True when ``size`` lies within FILE_MIN_SIZE..FILE_MAX_SIZE (inclusive).
+
+    A bound set to ``None`` is not enforced.
+    """
+    below_min = FILE_MIN_SIZE is not None and size < FILE_MIN_SIZE
+    above_max = FILE_MAX_SIZE is not None and size > FILE_MAX_SIZE
+    return not (below_min or above_max)
+
+
+def normalize_db_path(scan_root, disk_path):
+    r"""Convert a physical path under ``scan_root`` to the DB path format.
+
+    Example: ``E:\Movies\File.mkv`` scanned from ``E:\`` becomes
+    ``/Movies/File.mkv``.
+
+    This docstring is a raw string so the Windows backslashes above are not
+    parsed as (invalid) escape sequences.
+
+    Returns the path relative to ``scan_root`` with forward slashes and a
+    leading slash, or ``None`` when ``os.path.relpath`` raises ``ValueError``.
+    """
+    try:
+        rel_path = os.path.relpath(disk_path, scan_root)
+    except ValueError:
+        return None
+
+    # Windows backslash to slash
+    clean_path = rel_path.replace("\\", "/")
+
+    # Ensure leading slash
+    if not clean_path.startswith("/"):
+        clean_path = "/" + clean_path
+
+    return clean_path
+
+
+# ==============================
+# MAIN
+# ==============================
+
+def _walk_files(scan_root):
+    """Yield ``(disk_path, fname)`` for each file under ``scan_root``, skipping EXCLUDED_DIRS."""
+    for root, dirs, files in os.walk(scan_root):
+        # Slice-assign so os.walk itself stops descending into excluded directories.
+        dirs[:] = [d for d in dirs if d not in EXCLUDED_DIRS]
+        for fname in files:
+            yield os.path.join(root, fname), fname
+
+
+def _load_index(cur):
+    """Return ``{full_path: (file_size, mtime_epoch)}`` for the rows of DISK_HOSTNAME."""
+    cur.execute("""
+        SELECT full_path, file_size, UNIX_TIMESTAMP(mtime)
+        FROM file_md5_index
+        WHERE host_name = %s
+    """, (DISK_HOSTNAME,))
+    return {row[0]: (row[1], row[2]) for row in cur.fetchall()}
+
+
+def _delete_missing(cur, paths_to_delete):
+    """Delete the rows for ``paths_to_delete`` in batches; return the number of rows removed."""
+    batch_size = 1000
+    to_delete_list = list(paths_to_delete)
+    deleted = 0
+
+    for i in range(0, len(to_delete_list), batch_size):
+        batch = to_delete_list[i: i + batch_size]
+        format_strings = ','.join(['%s'] * len(batch))
+
+        query = f"DELETE FROM file_md5_index WHERE host_name = %s AND full_path IN ({format_strings})"
+
+        try:
+            cur.execute(query, [DISK_HOSTNAME] + batch)
+            # rowcount is what the server actually removed; a failed batch adds nothing.
+            deleted += cur.rowcount
+            print(f"   ... deleted batch {i}-{i + len(batch)}")
+        except Exception as e:
+            # Best effort: report the batch and carry on with the next one.
+            print(f"❌ Error deleting batch: {e}")
+
+    return deleted
+
+
+def _scan_and_update(cur, scan_root, indexed_map):
+    """Hash new or changed files and upsert them; return ``(new_files, skipped, filtered, errors)``."""
+    new_files = 0
+    skipped = 0
+    filtered = 0
+    errors = 0
+    seen_paths = set()
+
+    for disk_path, fname in _walk_files(scan_root):
+        try:
+            stat = os.stat(disk_path)
+        except OSError as e:
+            # Report instead of silently counting, so unreadable files are traceable.
+            print(f"⚠️ STAT ERROR: {disk_path} - {e}", flush=True)
+            errors += 1
+            continue
+
+        size = stat.st_size
+        if not size_allowed(size):
+            filtered += 1
+            continue
+
+        clean_path = normalize_db_path(scan_root, disk_path)
+        if not clean_path:
+            errors += 1
+            continue
+
+        if clean_path in seen_paths:
+            continue
+        seen_paths.add(clean_path)
+
+        # Whole seconds, to compare against UNIX_TIMESTAMP(mtime) from the DB.
+        mtime = int(stat.st_mtime)
+
+        # === MATCH CHECK ===
+        if clean_path in indexed_map:
+            db_size, db_mtime = indexed_map[clean_path]
+            if size == db_size and mtime == db_mtime:
+                skipped += 1
+                if PRINT_SKIPPED:
+                    print(f"⏭ SKIP {clean_path}", flush=True)
+                continue
+
+        # === INSERT / UPDATE ===
+        print("➕ NEW / UPDATED", flush=True)
+        print(f"   File: {clean_path}", flush=True)
+        print(f"   Size: {size:,} B", flush=True)
+
+        try:
+            b3 = compute_blake3(disk_path)
+        except Exception:
+            # compute_blake3 already printed the failure.
+            errors += 1
+            continue
+
+        if DRY_RUN:
+            print(f"🛡️  [DRY RUN] Would INSERT/UPDATE: {clean_path}")
+            print(f"   Hash: {b3.hex()}")
+            new_files += 1
+        else:
+            cur.execute("""
+                INSERT INTO file_md5_index
+                    (os_name, host_name, full_path, file_name, directory,
+                    file_size, mtime, blake3)
+                VALUES (%s, %s, %s, %s, %s, %s, FROM_UNIXTIME(%s), %s)
+                ON DUPLICATE KEY UPDATE
+                    file_size  = VALUES(file_size),
+                    mtime      = VALUES(mtime),
+                    blake3     = VALUES(blake3),
+                    updated_at = CURRENT_TIMESTAMP
+            """, (
+                OS_NAME,
+                DISK_HOSTNAME,
+                clean_path,
+                fname,
+                os.path.dirname(clean_path),
+                size,
+                mtime,
+                b3,
+            ))
+            new_files += 1
+            print(f"   Hash: {b3.hex()}", flush=True)
+
+        print("--------------------------------------", flush=True)
+
+    return new_files, skipped, filtered, errors
+
+
+def main():
+    """Index one backup disk into ``file_md5_index``.
+
+    Phase 1 removes DB rows whose path no longer exists on the disk; phase 2
+    hashes files that are new or whose size/mtime differ from the DB row and
+    upserts them.  With DRY_RUN set, deletions and upserts are only listed.
+
+    The cursor and connection are closed even when a query or the directory
+    walk raises.
+    """
+    print("🚀 BLAKE3 External Disk Indexer", flush=True)
+    print(f"🖥 Running on PC: {REAL_PC_HOSTNAME}", flush=True)
+
+    if DRY_RUN:
+        print("🛡️  DRY RUN MODE ACTIVE: No changes will be made to DB.", flush=True)
+    else:
+        print("⚠️  LIVE MODE: Changes WILL be committed to DB.", flush=True)
+
+    # Build root path
+    scan_root = f"{DISK_DRIVE_LETTER}:\\"
+
+    if not os.path.isdir(scan_root):
+        print(f"❌ ERROR: Drive '{scan_root}' not found!")
+        print(f"   Please check DISK_DRIVE_LETTER in config.")
+        return
+
+    print(f"✅ Config:")
+    print(f"   Source (Win) : {scan_root}")
+    print(f"   DB Hostname  : {DISK_HOSTNAME}")
+
+    try:
+        db = pymysql.connect(**DB_CONFIG)
+    except Exception as e:
+        print(f"❌ DB Connection failed: {e}")
+        return
+
+    try:
+        with db.cursor() as cur:
+            print(f"📥 Loading DB index for: '{DISK_HOSTNAME}'...", flush=True)
+
+            # === LOAD EXISTING DB RECORDS ===
+            indexed_map = _load_index(cur)
+            print(f"✅ Found {len(indexed_map):,} files in DB for this disk.", flush=True)
+
+            # =========================================================
+            # PHASE 1: CLEANUP (DELETE MISSING FILES)
+            # =========================================================
+            print("======================================", flush=True)
+            print("🧹 PHASE 1: Checking for deleted files...", flush=True)
+
+            # Fast walk just to get paths
+            current_disk_paths = set()
+            for disk_path, _fname in _walk_files(scan_root):
+                clean_path = normalize_db_path(scan_root, disk_path)
+                if clean_path:
+                    current_disk_paths.add(clean_path)
+
+            paths_to_delete = set(indexed_map) - current_disk_paths
+            deleted = 0
+
+            if paths_to_delete:
+                print(f"🗑️  Found {len(paths_to_delete):,} files to delete from DB.")
+
+                if DRY_RUN:
+                    print("🛡️  [DRY RUN] Listing files to be deleted (No action taken):")
+                    for p in sorted(paths_to_delete)[:20]:  # Print first 20
+                        print(f"   - {p}")
+                    if len(paths_to_delete) > 20:
+                        print(f"   ... and {len(paths_to_delete) - 20} more.")
+                else:
+                    deleted = _delete_missing(cur, paths_to_delete)
+
+                    # Update local map
+                    for p in paths_to_delete:
+                        del indexed_map[p]
+                    print("✅ Cleanup complete.")
+            else:
+                print("✅ No deleted files detected.")
+
+            # =========================================================
+            # PHASE 2: SCAN & UPDATE (HASHING)
+            # =========================================================
+            print("======================================", flush=True)
+            print("🚀 PHASE 2: Scanning for changes & new files...", flush=True)
+
+            new_files, skipped, filtered, errors = _scan_and_update(cur, scan_root, indexed_map)
+    finally:
+        db.close()
+
+    # In a dry run nothing is deleted, so report the candidates instead.
+    deleted_label = f"{len(paths_to_delete)} (DRY RUN)" if DRY_RUN else str(deleted)
+
+    print("======================================", flush=True)
+    print(f"✅ Processed  : {new_files}")
+    print(f"⏭ Skipped    : {skipped}")
+    print(f"🔎 Filtered   : {filtered}")
+    print(f"🗑 Deleted    : {deleted_label}")
+    print(f"⚠️ Errors     : {errors}")
+    print("🏁 Done.")
+
+
+if __name__ == "__main__":
+    main()
--- a/WalkFilesOnBackupHDD/30
+++ b/WalkFilesOnBackupHDD/30
@@ -0,0 +1,313 @@
+#!/usr/bin/python3
+# -*- coding: utf-8 -*-
+
+r"""
+FAST FILE HASH INDEXER – WINDOWS CLIENT (HARDCODED CONFIG)
+- Mode: PHYSICAL BACKUP
+- Hostname in DB = Disk Label (e.g., #HD015)
+- Path in DB     = Relative path (e.g., /Movies/Film.mkv)
+"""
+
+import os
+import time
+import pymysql
+import socket
+import platform
+import sys
+import hashlib
+from blake3 import blake3
+
+# ==============================
+# ⚙️ USER CONFIGURATION
+# ==============================
+# Drive letter of the disk to index; main() builds the scan root as "<letter>:\".
+DISK_DRIVE_LETTER = "z"  # (e.g., "E", "F", "P")
+# Value written to, and filtered on, the host_name column for this disk.
+DISK_HOSTNAME = "TW22"  # (e.g., "#HD015")
+
+# 🔒 SAFETY SWITCH
+# True makes main() only list deletions and upserts; False executes them.
+DRY_RUN = False
+
+# ==============================
+# TECHNICAL CONFIG
+# ==============================
+# Read size used by compute_blake3() while streaming a file.
+CHUNK_SIZE = 5 * 1024 * 1024  # 5 MB
+# Files at least this large get progress lines while being hashed.
+PROGRESS_MIN_SIZE = 500 * 1024 * 1024  # 500 MB
+# Minimum spacing between two progress lines.
+PROGRESS_INTERVAL = 1.0  # seconds
+
+# Directory names pruned from os.walk() (exact string match).
+EXCLUDED_DIRS = {"$RECYCLE.BIN", "System Volume Information", "RECYCLER", "msdownld.tmp"}
+
+# --- File Size Limits ---
+# Inclusive bounds checked by size_allowed(); None disables a bound.
+FILE_MIN_SIZE = 0
+FILE_MAX_SIZE = 1024 * 1024 * 1024 * 1024  # 1TB
+
+# --- DB Config ---
+# Keyword arguments passed verbatim to pymysql.connect().
+# NOTE(review): root credentials are hard-coded and committed; consider loading
+# them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.50",
+    "port": 3306,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+    "autocommit": True,
+}
+
+# NOTE(review): main() in this script never reads PRINT_SKIPPED.
+PRINT_SKIPPED = False  # Set True to see files that were already in DB
+
+# ==============================
+# SYSTEM INFO
+# ==============================
+# Name of the machine running the scan; main() only prints it.
+REAL_PC_HOSTNAME = socket.gethostname()
+# platform.system() value stored in the os_name column.
+OS_NAME = platform.system()
+
+
+# ==============================
+# FUNCTIONS
+# ==============================
+
+def get_path_hash(path_str: str) -> bytes:
+    """Return the 16 raw MD5 digest bytes of the UTF-8 encoded path (fits BINARY(16))."""
+    encoded = path_str.encode('utf-8')
+    hasher = hashlib.md5(encoded)
+    return hasher.digest()
+
+
+def compute_blake3(path: str) -> bytes:
+    """Stream the file at ``path`` through BLAKE3 and return the raw digest.
+
+    Reads are ``CHUNK_SIZE`` bytes each.  Files of ``PROGRESS_MIN_SIZE`` bytes
+    or more print a progress line at most once per ``PROGRESS_INTERVAL``
+    seconds and a summary line when finished.
+
+    Exceptions raised while opening or reading are printed and re-raised.
+    """
+    hasher = blake3()
+    file_bytes = os.path.getsize(path)
+    verbose = file_bytes >= PROGRESS_MIN_SIZE
+    mib = 1024 * 1024
+
+    done = 0
+    began = time.time()
+    reported_at = began
+
+    def clock(seconds):
+        # Render a duration in seconds as HH:MM:SS.
+        return time.strftime('%H:%M:%S', time.gmtime(seconds))
+
+    try:
+        with open(path, "rb") as stream:
+            # iter() with a sentinel stops on the empty read that marks EOF.
+            for piece in iter(lambda: stream.read(CHUNK_SIZE), b""):
+                hasher.update(piece)
+                done += len(piece)
+
+                if not verbose:
+                    continue
+
+                tick = time.time()
+                if tick - reported_at < PROGRESS_INTERVAL:
+                    continue
+
+                spent = tick - began
+                rate = done / spent if spent > 0 else 0
+                pct = done / file_bytes * 100
+                left = file_bytes - done
+                eta = left / rate if rate > 0 else 0
+
+                print(
+                    f"   ⏳ {pct:6.2f}% | "
+                    f"{done / mib:8.1f} / {file_bytes / mib:.1f} MB | "
+                    f"{rate / mib:6.1f} MB/s | "
+                    f"ETA {clock(eta)}",
+                    flush=True
+                )
+                reported_at = tick
+
+        if verbose:
+            duration = time.time() - began
+            mean_rate = file_bytes / duration if duration > 0 else 0
+            print(
+                f"   ✅ DONE | "
+                f"{file_bytes / mib:.1f} MB | "
+                f"avg {mean_rate / mib:.1f} MB/s | "
+                f"time {clock(duration)}",
+                flush=True
+            )
+
+        return hasher.digest()
+
+    except Exception as err:
+        print(f"⚠️ HASH ERROR: {path} - {err}")
+        raise
+
+
+def size_allowed(size: int) -> bool:
+    """Tell whether ``size`` is inside the configured FILE_MIN_SIZE/FILE_MAX_SIZE window.
+
+    Both bounds are inclusive; a bound of ``None`` is ignored.
+    """
+    too_small = FILE_MIN_SIZE is not None and size < FILE_MIN_SIZE
+    too_large = FILE_MAX_SIZE is not None and size > FILE_MAX_SIZE
+    return not (too_small or too_large)
+
+
+def normalize_db_path(scan_root, disk_path):
+    r"""Convert a physical path under ``scan_root`` to the DB path format.
+
+    Example: ``E:\Movies\File.mkv`` scanned from ``E:\`` becomes
+    ``/Movies/File.mkv``.
+
+    This docstring is a raw string so the Windows backslashes above are not
+    parsed as (invalid) escape sequences.
+
+    Returns the path relative to ``scan_root`` with forward slashes and a
+    leading slash, or ``None`` when ``os.path.relpath`` raises ``ValueError``.
+    """
+    try:
+        rel_path = os.path.relpath(disk_path, scan_root)
+    except ValueError:
+        return None
+
+    clean_path = rel_path.replace("\\", "/")
+    if not clean_path.startswith("/"):
+        clean_path = "/" + clean_path
+
+    return clean_path
+
+
+# ==============================
+# MAIN
+# ==============================
+
+def _index_disk(cur, scan_root):
+    """Run cleanup and scan phases for ``scan_root`` on an open cursor, then print the summary."""
+    print(f"📥 Loading DB index for: '{DISK_HOSTNAME}'...", flush=True)
+
+    # === LOAD EXISTING DB RECORDS ===
+    # Only path, size and mtime are loaded; the path_hash used for deletion is
+    # recomputed from full_path with get_path_hash().
+    cur.execute("""
+        SELECT full_path, file_size, UNIX_TIMESTAMP(mtime)
+        FROM file_md5_index
+        WHERE host_name = %s
+    """, (DISK_HOSTNAME,))
+
+    indexed_map = {row[0]: (row[1], row[2]) for row in cur.fetchall()}
+    print(f"✅ Found {len(indexed_map):,} files in DB for this disk.", flush=True)
+
+    # =========================================================
+    # PHASE 1: CLEANUP (DELETE MISSING FILES)
+    # =========================================================
+    print("======================================", flush=True)
+    print("🧹 PHASE 1: Checking for deleted files...", flush=True)
+
+    current_disk_paths = set()
+    for root, dirs, files in os.walk(scan_root):
+        # Slice-assign so os.walk itself stops descending into excluded directories.
+        dirs[:] = [d for d in dirs if d not in EXCLUDED_DIRS]
+        for fname in files:
+            disk_path = os.path.join(root, fname)
+            clean_path = normalize_db_path(scan_root, disk_path)
+            if clean_path:
+                current_disk_paths.add(clean_path)
+
+    paths_to_delete = set(indexed_map) - current_disk_paths
+    deleted = 0
+
+    if paths_to_delete:
+        print(f"🗑️  Found {len(paths_to_delete):,} files to delete from DB.")
+        if DRY_RUN:
+            for p in sorted(paths_to_delete)[:20]:
+                print(f"   - {p}")
+        else:
+            # Delete using path_hash for index efficiency
+            batch_size = 500
+            to_delete_list = list(paths_to_delete)
+            for i in range(0, len(to_delete_list), batch_size):
+                batch_paths = to_delete_list[i: i + batch_size]
+                # Map paths to their MD5 hashes
+                batch_hashes = [get_path_hash(p) for p in batch_paths]
+
+                format_strings = ','.join(['%s'] * len(batch_hashes))
+                query = f"DELETE FROM file_md5_index WHERE host_name = %s AND path_hash IN ({format_strings})"
+
+                try:
+                    cur.execute(query, [DISK_HOSTNAME] + batch_hashes)
+                    # rowcount is what the server actually removed; a failed batch adds nothing.
+                    deleted += cur.rowcount
+                except Exception as e:
+                    # Best effort: report the batch and carry on with the next one.
+                    print(f"❌ Error deleting batch: {e}")
+
+            for p in paths_to_delete:
+                del indexed_map[p]
+            print("✅ Cleanup complete.")
+    else:
+        print("✅ No deleted files detected.")
+
+    # =========================================================
+    # PHASE 2: SCAN & UPDATE (HASHING)
+    # =========================================================
+    print("======================================", flush=True)
+    print("🚀 PHASE 2: Scanning for changes & new files...", flush=True)
+
+    new_files = 0
+    skipped = 0
+    errors = 0
+    seen_paths = set()
+
+    for root, dirs, files in os.walk(scan_root):
+        dirs[:] = [d for d in dirs if d not in EXCLUDED_DIRS]
+        for fname in files:
+            disk_path = os.path.join(root, fname)
+            try:
+                stat = os.stat(disk_path)
+            except OSError:
+                errors += 1
+                continue
+
+            size = stat.st_size
+            if not size_allowed(size):
+                continue
+
+            clean_path = normalize_db_path(scan_root, disk_path)
+            if not clean_path or clean_path in seen_paths:
+                continue
+            seen_paths.add(clean_path)
+
+            # Whole seconds, to compare against UNIX_TIMESTAMP(mtime) from the DB.
+            mtime = int(stat.st_mtime)
+
+            # Match Check
+            if clean_path in indexed_map:
+                db_size, db_mtime = indexed_map[clean_path]
+                if size == db_size and mtime == db_mtime:
+                    skipped += 1
+                    continue
+
+            # Compute Hashes
+            try:
+                b3_hash = compute_blake3(disk_path)
+                p_hash = get_path_hash(clean_path)  # Essential for MySQL 9 Unique Index
+            except Exception:
+                # compute_blake3 already printed the failure.
+                errors += 1
+                continue
+
+            if DRY_RUN:
+                print(f"🛡️  [DRY RUN] NEW/UPDATE: {clean_path}")
+                new_files += 1
+            else:
+                cur.execute("""
+                    INSERT INTO file_md5_index
+                        (os_name, host_name, full_path, path_hash, file_name, directory,
+                        file_size, mtime, blake3)
+                    VALUES (%s, %s, %s, %s, %s, %s, %s, FROM_UNIXTIME(%s), %s)
+                    ON DUPLICATE KEY UPDATE
+                        file_size  = VALUES(file_size),
+                        mtime      = VALUES(mtime),
+                        blake3     = VALUES(blake3),
+                        updated_at = CURRENT_TIMESTAMP
+                """, (
+                    OS_NAME, DISK_HOSTNAME, clean_path, p_hash, fname,
+                    os.path.dirname(clean_path), size, mtime, b3_hash
+                ))
+                new_files += 1
+                print(f"➕ ADDED: {clean_path} | {b3_hash.hex()[:8]}...")
+
+    # In a dry run nothing is deleted, so report the candidates instead.
+    deleted_label = f"{len(paths_to_delete)} (DRY RUN)" if DRY_RUN else str(deleted)
+
+    print("======================================", flush=True)
+    print(f"✅ Processed  : {new_files}")
+    print(f"⏭ Skipped    : {skipped}")
+    print(f"🗑 Deleted    : {deleted_label}")
+    print(f"⚠️ Errors     : {errors}")
+    print("🏁 Done.")
+
+
+def main():
+    """Index one backup disk into ``file_md5_index`` (variant that also stores ``path_hash``).
+
+    Validates the drive, connects to MySQL and delegates to ``_index_disk``.
+    The cursor and connection are closed even when a query or the directory
+    walk raises.
+    """
+    print("🚀 BLAKE3 External Disk Indexer (MySQL 9 Compatible)", flush=True)
+    print(f"🖥 Running on PC: {REAL_PC_HOSTNAME}", flush=True)
+
+    if DRY_RUN:
+        print("🛡️  DRY RUN MODE ACTIVE: No changes will be made to DB.", flush=True)
+    else:
+        print("⚠️  LIVE MODE: Changes WILL be committed to DB.", flush=True)
+
+    scan_root = f"{DISK_DRIVE_LETTER}:\\"
+
+    if not os.path.isdir(scan_root):
+        print(f"❌ ERROR: Drive '{scan_root}' not found!")
+        return
+
+    try:
+        db = pymysql.connect(**DB_CONFIG)
+    except Exception as e:
+        print(f"❌ DB Connection failed: {e}")
+        return
+
+    try:
+        with db.cursor() as cur:
+            _index_disk(cur, scan_root)
+    finally:
+        db.close()
+
+
+if __name__ == "__main__":
+    main()
--- a/TestPathNormalizedinTable.py
+++ b/TestPathNormalizedinTable.py
@@ -0,0 +1,158 @@
+#!/opt/bin/python3
+# -*- coding: utf-8 -*-
+
+import pymysql
+import hashlib
+import posixpath
+import unicodedata
+from binascii import hexlify
+
+# ============================================================
+# CONFIG
+# ============================================================
+
+# Keyword arguments passed verbatim to pymysql.connect().
+# NOTE(review): root credentials are hard-coded and committed; consider loading
+# them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.50",
+    "port": 3306,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+}
+
+# When truthy, main() adds "WHERE host_name = %s" with this value.
+HOST_FILTER = "tower1"   # None = all hosts
+# When truthy, main() adds "LIMIT %s" with this value.
+LIMIT = None               # e.g. 50000 for testing
+# Maximum number of example rows kept per category for the final report.
+SHOW_EXAMPLES = 20
+
+# ============================================================
+# CANONICAL PATH
+# ============================================================
+
+def canonical_path(path_str: str) -> str:
+    """Return ``path_str`` with forward slashes, POSIX-normalized and NFC-normalized.
+
+    Falsy input (empty string or ``None``) is returned unchanged.
+    """
+    if path_str:
+        slashed = path_str.replace("\\", "/")
+        return unicodedata.normalize("NFC", posixpath.normpath(slashed))
+    return path_str
+
+def md5_bytes(path_str: str) -> bytes:
+    """Return the raw 16-byte MD5 digest of the UTF-8 encoding of ``path_str``."""
+    encoded = path_str.encode("utf-8")
+    return hashlib.md5(encoded).digest()
+
+# ============================================================
+# MAIN
+# ============================================================
+
+def main():
+    """Audit ``file_md5_index``: report rows whose path or ``path_hash`` is not canonical.
+
+    Read-only.  Rows are streamed with an unbuffered cursor, optionally
+    restricted by HOST_FILTER and LIMIT.  For each row the canonical path and
+    its MD5 are computed and compared with the stored values; counts and up to
+    SHOW_EXAMPLES examples per category are printed at the end.
+
+    A NULL ``path_hash`` is counted as a hash change and shown as ``NULL``
+    instead of crashing ``hexlify``.  The cursor and connection are closed even
+    when the query or the loop raises.
+    """
+    sql = """
+        SELECT id, full_path, path_hash
+        FROM file_md5_index
+    """
+
+    params = []
+
+    if HOST_FILTER:
+        sql += " WHERE host_name = %s"
+        params.append(HOST_FILTER)
+
+    if LIMIT:
+        sql += " LIMIT %s"
+        params.append(LIMIT)
+
+    total = 0
+    ok = 0
+    path_change = 0
+    hash_change = 0
+
+    examples_path = []
+    examples_hash = []
+
+    db = pymysql.connect(**DB_CONFIG)
+    try:
+        with db.cursor(pymysql.cursors.SSCursor) as cur:
+            cur.execute(sql, params)
+
+            for rec_id, full_path, stored_hash in cur:
+
+                total += 1
+
+                canonical = canonical_path(full_path)
+                canonical_hash = md5_bytes(canonical)
+
+                # ---------------------------------------------------
+                # CASE 1: fully OK
+                # ---------------------------------------------------
+                if full_path == canonical and stored_hash == canonical_hash:
+                    ok += 1
+
+                # ---------------------------------------------------
+                # CASE 2: path string would change
+                # ---------------------------------------------------
+                if full_path != canonical:
+                    path_change += 1
+
+                    if len(examples_path) < SHOW_EXAMPLES:
+                        examples_path.append((rec_id, full_path, canonical))
+
+                # ---------------------------------------------------
+                # CASE 3: hash would change (cases 2 and 3 can both apply)
+                # ---------------------------------------------------
+                if stored_hash != canonical_hash:
+                    hash_change += 1
+
+                    if len(examples_hash) < SHOW_EXAMPLES:
+                        # A NULL column arrives as None, which hexlify() rejects.
+                        if stored_hash is None:
+                            stored_hex = "NULL"
+                        else:
+                            stored_hex = hexlify(stored_hash).decode()
+                        examples_hash.append(
+                            (rec_id, full_path,
+                             stored_hex,
+                             hexlify(canonical_hash).decode())
+                        )
+
+                if total % 100000 == 0:
+                    print(f"Checked {total:,} rows...")
+    finally:
+        db.close()
+
+    # ============================================================
+    # REPORT
+    # ============================================================
+
+    print("\n" + "=" * 70)
+    print("AUDIT SUMMARY")
+    print("=" * 70)
+
+    print(f"Total rows checked : {total:,}")
+    print(f"OK (already canonical + hash OK) : {ok:,}")
+    print(f"Paths that would change         : {path_change:,}")
+    print(f"Hashes that would change        : {hash_change:,}")
+
+    print("=" * 70)
+
+    # ------------------------------------------------------------
+    # SHOW EXAMPLES
+    # ------------------------------------------------------------
+
+    if examples_path:
+        print("\n⚠ PATH CHANGE EXAMPLES:")
+        for rec_id, old, new in examples_path:
+            print(f"[id={rec_id}]")
+            print(" DB :", old)
+            print(" NEW:", new)
+            print()
+
+    if examples_hash:
+        print("\n❌ HASH CHANGE EXAMPLES:")
+        for rec_id, path, old_hash, new_hash in examples_hash:
+            print(f"[id={rec_id}] {path}")
+            print(" Stored :", old_hash)
+            print(" New    :", new_hash)
+            print()
+
+
+if __name__ == "__main__":
+    main()
--- a/Onetimepathnormalization.py
+++ b/Onetimepathnormalization.py
@@ -0,0 +1,188 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""
+ONE-TIME MIGRATION: Normalize full_path (NFC, forward slashes) + recompute path_hash
+- Targets ONLY one host_name (HOST_TO_FIX, "Tower" by default)
+- Safe with UNIQUE(host_name, path_hash)
+- Handles collisions by skipping conflicting rows and logging them
+- DRY_RUN supported
+"""
+
+import sys
+import time
+import hashlib
+import posixpath
+import unicodedata
+import pymysql
+from pymysql.err import IntegrityError
+
+# =========================
+# CONFIG
+# =========================
+HOST_TO_FIX = "Tower"     # <-- set your Unraid host_name exactly as stored in DB
+DRY_RUN = True             # <-- first run True; then switch to False to apply
+# Passed to fetchmany(): number of rows pulled from the streaming cursor per call.
+BATCH_SELECT_FETCH = 5000  # server-side cursor fetch size (streaming)
+COMMIT_EVERY = 2000        # commit after N successful updates (when DRY_RUN=False)
+# A progress line is printed whenever the checked-row count is a multiple of this.
+LOG_EVERY = 50000          # progress print
+
+# Keyword arguments passed verbatim to pymysql.connect().  autocommit is off
+# because main() commits explicitly and relies on savepoints.
+# NOTE(review): root credentials are hard-coded and committed; consider loading
+# them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.50",
+    "port": 3306,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+    "autocommit": False,
+}
+
+# =========================
+# CANONICALIZATION
+# =========================
+def canonical_path(path_str: str) -> str:
+    """Canonicalize a stored path: forward slashes, ``posixpath.normpath``, Unicode NFC.
+
+    Falsy input (empty string or ``None``) is handed back untouched.
+    """
+    if not path_str:
+        return path_str
+    normalized = posixpath.normpath(path_str.replace("\\", "/"))
+    return unicodedata.normalize("NFC", normalized)
+
+def md5_bytes(path_str: str) -> bytes:
+    """Return the 16 raw MD5 bytes (BINARY(16) sized) of ``path_str`` encoded as UTF-8."""
+    hasher = hashlib.md5(path_str.encode("utf-8"))
+    return hasher.digest()
+
+# =========================
+# MAIN
+# =========================
+def _apply_update(upd_cur, rec_id, new_path, new_hash):
+    """Run one savepoint-guarded UPDATE; return ``(status, exc)`` with status 'ok', 'collision' or 'error'."""
+    try:
+        # Use a savepoint so a duplicate-key error doesn't kill the whole transaction
+        upd_cur.execute("SAVEPOINT sp_one;")
+
+        upd_cur.execute(
+            """
+            UPDATE file_md5_index
+            SET full_path = %s,
+                path_hash = %s
+            WHERE id = %s
+            """,
+            (new_path, new_hash, rec_id),
+        )
+
+        upd_cur.execute("RELEASE SAVEPOINT sp_one;")
+        return "ok", None
+
+    except IntegrityError as e:
+        # Duplicate key = collision on (host_name, path_hash)
+        # This means some OTHER row in the same host already has this new_hash.
+        upd_cur.execute("ROLLBACK TO SAVEPOINT sp_one;")
+        upd_cur.execute("RELEASE SAVEPOINT sp_one;")
+        return "collision", e
+
+    except Exception as e:
+        upd_cur.execute("ROLLBACK TO SAVEPOINT sp_one;")
+        upd_cur.execute("RELEASE SAVEPOINT sp_one;")
+        return "error", e
+
+
+def main():
+    """Normalize ``full_path`` and recompute ``path_hash`` for every row of HOST_TO_FIX.
+
+    Rows are streamed with an unbuffered cursor on a dedicated read connection
+    while updates, savepoints and commits run on a second connection.  PyMySQL
+    discards the unread remainder of an unbuffered result as soon as another
+    command is sent on the same connection, so sharing one connection would
+    make a live run stop after the first fetched batch.
+
+    Rows that violate UNIQUE(host_name, path_hash) are rolled back
+    individually, counted and skipped.  With DRY_RUN set nothing is written.
+    Both connections are closed even when the run raises; updates not yet
+    committed at that point are not committed.
+    """
+    print(f"[{time.strftime('%Y-%m-%d %H:%M:%S')}] 🚀 Tower path_hash migration")
+    print(f"Host: {HOST_TO_FIX}")
+    print(f"DRY_RUN: {DRY_RUN}")
+    sys.stdout.flush()
+
+    total = 0
+    needs_change = 0
+    updated_ok = 0
+    collisions = 0
+    other_errors = 0
+
+    start = time.time()
+    pending_commits = 0
+
+    write_db = pymysql.connect(**DB_CONFIG)
+    try:
+        # NOTE(review): concurrent read + update on two connections assumes a
+        # transactional engine (the savepoints already presume one) — confirm.
+        read_db = pymysql.connect(**DB_CONFIG)
+        try:
+            # streaming cursor for reading (own connection)
+            read_cur = read_db.cursor(pymysql.cursors.SSCursor)
+            read_cur.execute(
+                """
+                SELECT id, full_path, path_hash
+                FROM file_md5_index
+                WHERE host_name = %s
+                """,
+                (HOST_TO_FIX,),
+            )
+
+            # normal cursor for updates (separate connection)
+            upd_cur = write_db.cursor()
+
+            while True:
+                rows = read_cur.fetchmany(BATCH_SELECT_FETCH)
+                if not rows:
+                    break
+
+                for rec_id, full_path, stored_hash in rows:
+                    total += 1
+
+                    new_path = canonical_path(full_path)
+                    new_hash = md5_bytes(new_path)
+
+                    if new_path != full_path or new_hash != stored_hash:
+                        needs_change += 1
+
+                        # in dry-run we just count; no DB writes
+                        if not DRY_RUN:
+                            status, err = _apply_update(upd_cur, rec_id, new_path, new_hash)
+
+                            if status == "ok":
+                                updated_ok += 1
+                                pending_commits += 1
+
+                                if pending_commits >= COMMIT_EVERY:
+                                    write_db.commit()
+                                    pending_commits = 0
+
+                            elif status == "collision":
+                                collisions += 1
+                                # Print a short line occasionally (avoid huge spam)
+                                if collisions <= 50 or collisions % 1000 == 0:
+                                    print(f"⚠ COLLISION id={rec_id} | {err}")
+                                    sys.stdout.flush()
+
+                            else:
+                                other_errors += 1
+                                if other_errors <= 50 or other_errors % 1000 == 0:
+                                    print(f"❌ ERROR id={rec_id} | {err}")
+                                    sys.stdout.flush()
+
+                    # One progress check per row, whatever branch was taken above.
+                    if total % LOG_EVERY == 0:
+                        elapsed = time.time() - start
+                        print(f"Checked {total:,} | needs_change {needs_change:,} | updated {updated_ok:,} | collisions {collisions:,} | {elapsed:.1f}s")
+                        sys.stdout.flush()
+
+            # finalize
+            if not DRY_RUN:
+                if pending_commits:
+                    write_db.commit()
+                print("✅ Migration finished (committed).")
+            else:
+                print("⚠ DRY_RUN finished (no changes written).")
+
+            read_cur.close()
+            upd_cur.close()
+        finally:
+            read_db.close()
+    finally:
+        write_db.close()
+
+    elapsed = time.time() - start
+    print("=" * 70)
+    print(f"Total rows checked   : {total:,}")
+    print(f"Rows needing change  : {needs_change:,}")
+    print(f"Rows updated         : {updated_ok:,}")
+    print(f"Collisions (skipped) : {collisions:,}")
+    print(f"Other errors         : {other_errors:,}")
+    print(f"Elapsed              : {elapsed:.1f}s")
+    print("=" * 70)
+
+if __name__ == "__main__":
+    main()
--- a/testthoseneedchangewhetherok.py
+++ b/testthoseneedchangewhetherok.py
@@ -0,0 +1,146 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+import os
+import hashlib
+import posixpath
+import unicodedata
+import pymysql
+import time
+
+# =========================
+# CONFIG
+# =========================
+
+# Value matched against file_md5_index.host_name to select the rows to verify.
+HOST_TO_CHECK = "Tower"
+# UNC root that linux_to_windows_unc() prepends to every mapped path.
+WINDOWS_UNC_BASE = r"\\tower"
+
+# Keyword arguments passed straight to pymysql.connect().
+# NOTE(review): root credentials are hard-coded in a tracked file — consider
+# loading them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.50",
+    "port": 3306,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+}
+
+# Maximum number of "CHANGE DETECTED" examples printed in full by main().
+PRINT_FIRST_CHANGES = 20
+# main() prints one progress line every LOG_EVERY scanned rows.
+LOG_EVERY = 5000
+
+# =========================
+# CANONICAL
+# =========================
+
+def canonical_path(path_str):
+    path_str = path_str.replace("\\", "/")
+    path_str = posixpath.normpath(path_str)
+    path_str = unicodedata.normalize("NFC", path_str)
+    return path_str
+
+def md5_bytes(path_str):
+    return hashlib.md5(path_str.encode("utf-8")).digest()
+
+# =========================
+# PATH MAP
+# =========================
+
+def linux_to_windows_unc(linux_path):
+    rel = linux_path[len("/mnt/user/"):]
+    return os.path.join(WINDOWS_UNC_BASE, *rel.split("/"))
+
+# =========================
+# MAIN
+# =========================
+
+def main():
+
+    print("=" * 70)
+    print("🔍 Tower Canonical Path SMB Verification")
+    print(f"Host: {HOST_TO_CHECK}")
+    print(f"UNC Base: {WINDOWS_UNC_BASE}")
+    print("=" * 70)
+
+    db = pymysql.connect(**DB_CONFIG)
+    cur = db.cursor(pymysql.cursors.SSCursor)
+
+    cur.execute("""
+        SELECT id, full_path, path_hash
+        FROM file_md5_index
+        WHERE host_name = %s
+    """, (HOST_TO_CHECK,))
+
+    total = 0
+    needs_change = 0
+    exists_ok = 0
+    missing = 0
+
+    printed_changes = 0
+
+    start = time.time()
+
+    for rec_id, full_path, stored_hash in cur:
+
+        total += 1
+
+        new_path = canonical_path(full_path)
+        new_hash = md5_bytes(new_path)
+
+        # Already canonical
+        if new_path == full_path and new_hash == stored_hash:
+            continue
+
+        needs_change += 1
+
+        win_path = linux_to_windows_unc(new_path)
+        exists = os.path.exists(win_path)
+
+        if exists:
+            exists_ok += 1
+        else:
+            missing += 1
+
+        # ---- Print first examples ----
+        if printed_changes < PRINT_FIRST_CHANGES:
+            print("\n🔧 CHANGE DETECTED")
+            print(f"ID       : {rec_id}")
+            print(f"DB PATH  : {full_path}")
+            print(f"NEW PATH : {new_path}")
+            print(f"WIN PATH : {win_path}")
+            print(f"Exists   : {exists}")
+            printed_changes += 1
+
+        # ---- Progress ----
+        if total % LOG_EVERY == 0:
+            elapsed = time.time() - start
+            rate = total / elapsed if elapsed else 0
+
+            print(
+                f"📊 Checked {total:,} rows | "
+                f"Needs change {needs_change:,} | "
+                f"Exists {exists_ok:,} | "
+                f"Missing {missing:,} | "
+                f"{rate:,.0f} rows/sec"
+            )
+
+    # =========================
+    # SUMMARY
+    # =========================
+
+    elapsed = time.time() - start
+
+    print("\n" + "=" * 70)
+    print("✅ FINAL SUMMARY")
+    print("=" * 70)
+    print(f"Total scanned     : {total:,}")
+    print(f"Needs change     : {needs_change:,}")
+    print(f"Exists on Tower  : {exists_ok:,}")
+    print(f"Missing on Tower : {missing:,}")
+    print(f"Runtime          : {elapsed:.1f}s")
+    print("=" * 70)
+
+    cur.close()
+    db.close()
+
+
+# Script entry point: run the verification only when executed directly.
+if __name__ == "__main__":
+    main()
--- a/WalkFilesOnBackupHDD/53
+++ b/WalkFilesOnBackupHDD/53
@@ -0,0 +1,139 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+"""
+TOWER PATH NORMALIZATION MIGRATION
+----------------------------------
+✔ Normalizes full_path → NFC canonical
+✔ Recalculates path_hash
+✔ Uses two DB connections (streaming safe)
+✔ Idempotent (safe to rerun)
+✔ Production safe
+"""
+
+import pymysql
+import hashlib
+import posixpath
+import unicodedata
+import time
+
+# =========================
+# CONFIG
+# =========================
+
+# Value matched against file_md5_index.host_name to select the rows to migrate.
+HOST_TO_FIX = "tower1"
+# Number of rows pulled per fetchmany() call on the read cursor.
+BATCH_FETCH = 5000
+# Number of updates accumulated on the write connection before each commit.
+COMMIT_EVERY = 2000
+
+# Keyword arguments passed to pymysql.connect() for both connections.
+# autocommit is disabled, so main() commits explicitly.
+# NOTE(review): root credentials are hard-coded in a tracked file — consider
+# loading them from the environment or an untracked config file.
+DB_CONFIG = {
+    "host": "192.168.1.50",
+    "port": 3306,
+    "user": "root",
+    "password": "Vlado9674+",
+    "database": "torrents",
+    "charset": "utf8mb4",
+    "autocommit": False,
+}
+
+# =========================
+# CANONICALIZATION
+# =========================
+
+def canonical_path(path_str: str) -> str:
+    path_str = path_str.replace("\\", "/")
+    path_str = posixpath.normpath(path_str)
+    path_str = unicodedata.normalize("NFC", path_str)
+    return path_str
+
+def md5_bytes(path_str: str) -> bytes:
+    return hashlib.md5(path_str.encode("utf-8")).digest()
+
+# =========================
+# MAIN
+# =========================
+
+def main():
+
+    print("=" * 70)
+    print("🚀 TOWER PATH NORMALIZATION MIGRATION")
+    print(f"Host: {HOST_TO_FIX}")
+    print("=" * 70)
+
+    start = time.time()
+
+    # --- TWO CONNECTIONS ---
+    db_read = pymysql.connect(**DB_CONFIG)
+    db_write = pymysql.connect(**DB_CONFIG)
+
+    read_cur = db_read.cursor(pymysql.cursors.SSCursor)
+    write_cur = db_write.cursor()
+
+    read_cur.execute("""
+        SELECT id, full_path, path_hash
+        FROM file_md5_index
+        WHERE host_name = %s
+    """, (HOST_TO_FIX,))
+
+    total = 0
+    updated = 0
+    skipped = 0
+    pending_commit = 0
+
+    while True:
+
+        rows = read_cur.fetchmany(BATCH_FETCH)
+
+        if not rows:
+            break
+
+        for rec_id, full_path, stored_hash in rows:
+
+            total += 1
+
+            new_path = canonical_path(full_path)
+            new_hash = md5_bytes(new_path)
+
+            if new_path == full_path and new_hash == stored_hash:
+                skipped += 1
+                continue
+
+            write_cur.execute("""
+                UPDATE file_md5_index
+                SET full_path = %s,
+                    path_hash = %s
+                WHERE id = %s
+            """, (new_path, new_hash, rec_id))
+
+            updated += 1
+            pending_commit += 1
+
+            if pending_commit >= COMMIT_EVERY:
+                db_write.commit()
+                pending_commit = 0
+
+        print(
+            f"Checked {total:,} | Updated {updated:,} | Skipped {skipped:,}"
+        )
+
+    if pending_commit:
+        db_write.commit()
+
+    elapsed = time.time() - start
+
+    print("\n" + "=" * 70)
+    print("✅ MIGRATION FINISHED")
+    print("=" * 70)
+    print(f"Total checked : {total:,}")
+    print(f"Rows updated  : {updated:,}")
+    print(f"Rows skipped  : {skipped:,}")
+    print(f"Runtime       : {elapsed:.1f}s")
+    print("=" * 70)
+
+    read_cur.close()
+    write_cur.close()
+    db_read.close()
+    db_write.close()
+
+
+# Script entry point: run the migration only when executed directly.
+if __name__ == "__main__":
+    main()
Author	SHA1	Message	Date
vladimir.buzalka	a19281c3a4	z230	2026-02-03 18:01:23 +01:00
vladimir.buzalka	0c94333abb	z230	2026-02-03 13:26:11 +01:00
vladimir.buzalka	51c77a8793	Merge remote-tracking branch 'origin/master'	2026-02-02 09:22:02 +01:00
vlado	f052362b31	tw22	2026-02-02 09:19:11 +01:00
Vladimir Buzalka	773e67c9b6	ntb	2026-02-01 13:49:23 +01:00
vlado	b0275928d2	tw22	2026-01-24 08:41:48 +01:00
vladimir.buzalka	4c420060ec	z230	2026-01-22 17:44:19 +01:00
vlado	c6334c2244	tw22	2026-01-22 15:03:54 +01:00
vlado	50ee068af9	tw22	2026-01-17 20:23:58 +01:00
vladimir.buzalka	c30a582323	Merge remote-tracking branch 'origin/master'	2026-01-13 16:43:13 +01:00
vladimir.buzalka	01aa1249b9	z230	2026-01-13 16:42:40 +01:00
vlado	b74e180022	tw22	2026-01-11 21:13:38 +01:00
vlado	2037d1b887	tw22	2026-01-11 20:14:52 +01:00
vlado	6cdabc64b4	tw22	2026-01-08 10:15:45 +01:00
vladimir.buzalka	2aee823e87	z230	2026-01-06 10:09:51 +01:00
vladimir.buzalka	b61a8a5473	z230	2026-01-06 10:09:25 +01:00
vladimir.buzalka	83f2d0dafc	z230	2026-01-06 10:05:35 +01:00