Fix typography and wording in README, build spec, main

2026-03-13 17:31:37 +02:00
parent 8ee67e9ef3
commit e86fab07d1
2 changed files with 158 additions and 96 deletions
@@ -8,6 +8,7 @@
 # NO heavy dependencies (torch, PySide6, etc.) are bundled.
 import os
 import sys
 import glob
 block_cipher = None
@@ -61,7 +62,7 @@ a = Analysis(
        'psutil', 'pynvml', 'pystray', 'PIL', 'Pillow',
        'darkdetect', 'huggingface_hub', 'requests',
        'tqdm', 'onnxruntime', 'av',
-        'tkinter', 'matplotlib', 'notebook', 'IPython',
+        'matplotlib', 'notebook', 'IPython',
    ],
    win_no_prefer_redirects=False,
    win_private_assemblies=False,
@@ -91,5 +92,5 @@ exe = EXE(
    target_arch=None,
    codesign_identity=None,
    entitlements_file=None,
-    icon='assets/icon.ico',
+    icon='assets/icon.ico' if sys.platform == 'win32' else None,
 )
@@ -9,6 +9,14 @@ app_dir = os.path.dirname(os.path.abspath(__file__))
 if app_dir not in sys.path:
    sys.path.insert(0, app_dir)
 # -----------------------------------------------------------------------------
 # LINUX: Force XWayland (X11) for reliable window positioning & overlay behavior.
 # Our input stack (evdev, UInput, wl-copy) is compositor-agnostic so this is safe.
 # Native Wayland lacks app-controlled window positioning which the overlay needs.
 # -----------------------------------------------------------------------------
 if sys.platform == 'linux' and os.environ.get('WAYLAND_DISPLAY'):
    os.environ.setdefault('QT_QPA_PLATFORM', 'xcb')
 # -----------------------------------------------------------------------------
 # WINDOWS DLL FIX (CRITICAL for Portable CUDA)
 # Python 3.8+ on Windows requires explicit DLL directory addition.
@@ -16,20 +24,32 @@ if app_dir not in sys.path:
 if os.name == 'nt' and hasattr(os, 'add_dll_directory'):
    try:
        from pathlib import Path
-        # Scan sys.path for site-packages
+        _candidate_dirs = set()
        # 1. From sys.path (scan ALL site-packages, not just the first)
        for p in sys.path:
            path_obj = Path(p)
            if path_obj.name == 'site-packages' and path_obj.exists():
-                nvidia_path = path_obj / "nvidia"
+                _candidate_dirs.add(str(path_obj.resolve()))
-                if nvidia_path.exists():
+
-                    for subdir in nvidia_path.iterdir():
+        # 2. Relative to the Python executable (critical for embedded Python)
-                        # Add 'bin' folder from each nvidia stub (cublas, cudnn, etc.)
+        _exe_dir = Path(sys.executable).parent
-                        bin_path = subdir / "bin"
+        for _sp in [_exe_dir / "Lib" / "site-packages", _exe_dir / "lib" / "site-packages"]:
-                        if bin_path.exists():
+            if _sp.exists():
-                            os.add_dll_directory(str(bin_path))
+                _candidate_dirs.add(str(_sp.resolve()))
-                # Also try adding site-packages itself just in case
+
-                # os.add_dll_directory(str(path_obj))
+        # 3. Scan all candidates for nvidia DLL directories
-                break
+        for _sp_str in _candidate_dirs:
            nvidia_path = Path(_sp_str) / "nvidia"
            if nvidia_path.exists():
                for subdir in nvidia_path.iterdir():
                    bin_path = subdir / "bin"
                    if bin_path.exists():
                        os.add_dll_directory(str(bin_path))
                        # Also add to PATH as fallback - some libraries
                        # (e.g. CTranslate2) load DLLs lazily via LoadLibrary
                        # which may not respect os.add_dll_directory()
                        os.environ['PATH'] = str(bin_path) + os.pathsep + os.environ.get('PATH', '')
    except Exception:
        pass
 # -----------------------------------------------------------------------------
@@ -49,7 +69,8 @@ from src.core.hotkey_manager import HotkeyManager
 from src.core.config import ConfigManager
 from src.utils.injector import InputInjector
 from src.core.paths import get_models_path, get_bundle_path
-from src.utils.window_hook import WindowHook
+if os.name == 'nt':
    from src.utils.window_hook import WindowHook
 from PySide6.QtGui import QSurfaceFormat
@@ -63,37 +84,52 @@ os.environ["QT_ENABLE_HIGHDPI_SCALING"] = "1"
 os.environ["QT_AUTOSCREENSCALEFACTOR"] = "1"
 # Detect resolution without creating QApplication (Fixes crash)
-try:
+if os.name == 'nt':
-    import ctypes
+    try:
-    user32 = ctypes.windll.user32
+        import ctypes
-    # Get physical screen width (unscaled)
+        user32 = ctypes.windll.user32
-    # SetProcessDPIAware is needed to get the true resolution
+        # Get physical screen width (unscaled)
-    user32.SetProcessDPIAware()
+        # SetProcessDPIAware is needed to get the true resolution
-    width = user32.GetSystemMetrics(0)
+        user32.SetProcessDPIAware()
-    # Base scale centers around 1920 width.
+        width = user32.GetSystemMetrics(0)
-    # At 3840 (4k), res_scale is 2.0. If we want it ~40% smaller, we multiply by 0.6 = 1.2
+        # Base scale centers around 1920 width.
-    res_scale = (width / 1920)
+        # At 3840 (4k), res_scale is 2.0. If we want it ~40% smaller, we multiply by 0.6 = 1.2
-    if width >= 3840:
+        res_scale = (width / 1920)
-        res_scale *= 0.6 # Make it significantly smaller at 4k as requested
+        if width >= 3840:
            res_scale *= 0.6 # Make it significantly smaller at 4k as requested
-    os.environ["QT_SCALE_FACTOR"] = str(max(1.0, res_scale))
+        os.environ["QT_SCALE_FACTOR"] = str(max(1.0, res_scale))
-except:
+    except:
-    pass
+        pass
 # On Linux, Qt handles DPI automatically via QT_ENABLE_HIGHDPI_SCALING
-# Detect Windows "Reduce Motion" preference
+# Detect "Reduce Motion" preference
-try:
+if os.name == 'nt':
-    import ctypes
+    try:
-    SPI_GETCLIENTAREAANIMATION = 0x1042
+        import ctypes
-    animation_enabled = ctypes.c_bool(True)
+        SPI_GETCLIENTAREAANIMATION = 0x1042
-    ctypes.windll.user32.SystemParametersInfoW(
+        animation_enabled = ctypes.c_bool(True)
-        SPI_GETCLIENTAREAANIMATION, 0,
+        ctypes.windll.user32.SystemParametersInfoW(
-        ctypes.byref(animation_enabled), 0
+            SPI_GETCLIENTAREAANIMATION, 0,
-    )
+            ctypes.byref(animation_enabled), 0
-    if not animation_enabled.value:
+        )
-        ConfigManager().data["reduce_motion"] = True
+        if not animation_enabled.value:
-        ConfigManager().save()
+            ConfigManager().data["reduce_motion"] = True
-except Exception:
+            ConfigManager().save()
-    pass
+    except Exception:
        pass
 elif sys.platform == 'linux':
    try:
        import subprocess as _sp
        result = _sp.run(
            ['gsettings', 'get', 'org.gnome.desktop.interface', 'enable-animations'],
            capture_output=True, text=True, timeout=2
        )
        if result.stdout.strip() == 'false':
            ConfigManager().data["reduce_motion"] = True
            ConfigManager().save()
    except Exception:
        pass
 # Configure Logging
 class QmlLoggingHandler(logging.Handler, QObject):
@@ -140,15 +176,25 @@ class DownloadWorker(QThread):
    def run(self):
        try:
            import requests
-            from tqdm import tqdm
+            import shutil
            model_path = get_models_path()
            # Determine what to download
            dest_dir = model_path / f"faster-whisper-{self.model_name}"
            repo_id = f"Systran/faster-whisper-{self.model_name}"
-            files = ["config.json", "model.bin", "tokenizer.json", "vocabulary.json"]
+            required_files = ["config.json", "model.bin", "tokenizer.json", "vocabulary.json"]
            base_url = f"https://huggingface.co/{repo_id}/resolve/main"
-            dest_dir.mkdir(parents=True, exist_ok=True)
+            # Skip if already complete
            if dest_dir.exists() and all((dest_dir / f).exists() for f in required_files):
                logging.info(f"Model {self.model_name} already downloaded.")
                self.finished.emit()
                return
            # Download to a temp dir first, move on success
            tmp_dir = model_path / f".tmp-faster-whisper-{self.model_name}"
            if tmp_dir.exists():
                shutil.rmtree(tmp_dir)
            tmp_dir.mkdir(parents=True, exist_ok=True)
            logging.info(f"Downloading {self.model_name} to {dest_dir}...")
            # 1. Calculate Total Size
@@ -156,7 +202,7 @@ class DownloadWorker(QThread):
            file_sizes = {}
            with requests.Session() as s:
-                for fname in files:
+                for fname in required_files:
                    url = f"{base_url}/{fname}"
                    head = s.head(url, allow_redirects=True)
                    if head.status_code == 200:
@@ -164,25 +210,21 @@ class DownloadWorker(QThread):
                        file_sizes[fname] = size
                        total_size += size
                    else:
-                        # Fallback for vocabulary.json vs vocabulary.txt
+                        logging.warning(f"HEAD failed for {fname}: HTTP {head.status_code}")
-                        if fname == "vocabulary.json":
+
-                             # Try .txt? Or just skip if not found? 
+            # Abort if any required file is unavailable
-                             # Faster-whisper usually has vocabulary.json
+            missing = [f for f in required_files if f not in file_sizes]
-                             pass
+            if missing:
                shutil.rmtree(tmp_dir, ignore_errors=True)
                raise RuntimeError(f"Required model files unavailable: {missing}")
            # 2. Download loop
            downloaded_bytes = 0
            with requests.Session() as s:
-                for fname in files:
+                for fname in required_files:
                    if fname not in file_sizes: continue
                    url = f"{base_url}/{fname}"
-                    dest_file = dest_dir / fname
+                    dest_file = tmp_dir / fname
                    # Resume check? 
                    # Simpler to just overwrite for reliability unless we want complex resume logic.
                    # We'll overwrite.
                    resp = s.get(url, stream=True)
                    resp.raise_for_status()
@@ -192,12 +234,22 @@ class DownloadWorker(QThread):
                            if chunk:
                                f.write(chunk)
                                downloaded_bytes += len(chunk)
                                # Emit Progress
                                if total_size > 0:
                                    pct = int((downloaded_bytes / total_size) * 100)
                                    self.progress.emit(pct)
            # 3. Validate all files present and non-empty
            for fname in required_files:
                fpath = tmp_dir / fname
                if not fpath.exists() or fpath.stat().st_size == 0:
                    shutil.rmtree(tmp_dir, ignore_errors=True)
                    raise RuntimeError(f"Download incomplete: {fname} missing or empty")
            # 4. Atomic move: replace dest with completed download
            if dest_dir.exists():
                shutil.rmtree(dest_dir)
            tmp_dir.rename(dest_dir)
            self.finished.emit()
        except Exception as e:
@@ -311,6 +363,7 @@ class WhisperApp(QObject):
        self.bridge.llmDownloadRequested.connect(self.on_llm_download_requested)
        self.engine.rootContext().setContextProperty("ui", self.bridge)
        self.engine.rootContext().setContextProperty("isLinux", sys.platform == 'linux')
        # 2. Tray setup
        self.tray = SystemTray()
@@ -382,23 +435,27 @@ class WhisperApp(QObject):
            self.settings_root.setVisible(False)
        # Install Low-Level Window Hook for Transparent Hit Test
-        try:
+        if os.name == 'nt':
-            from src.utils.window_hook import WindowHook
+            try:
-            hwnd = self.overlay_root.winId()
+                from src.utils.window_hook import WindowHook
-            # Initial scale from config
+                hwnd = self.overlay_root.winId()
-            scale = float(self.config.get("ui_scale"))
+                # Initial scale from config
                scale = float(self.config.get("ui_scale"))
-            # Current Overlay Dimensions
+                # Current Overlay Dimensions
-            win_w = int(460 * scale)
+                win_w = int(460 * scale)
-            win_h = int(180 * scale)
+                win_h = int(180 * scale)
-            self.window_hook = WindowHook(hwnd, win_w, win_h, initial_scale=scale)
+                self.window_hook = WindowHook(hwnd, win_w, win_h, initial_scale=scale)
-            self.window_hook.install()
+                self.window_hook.install()
-            # Initial state: Disabled because we start inactive
+                # Initial state: Disabled because we start inactive
-            self.window_hook.set_enabled(False)
+                self.window_hook.set_enabled(False)
-        except Exception as e:
+            except Exception as e:
-            logging.error(f"Failed to install WindowHook: {e}")
+                logging.error(f"Failed to install WindowHook: {e}")
        else:
            # On Linux, use Qt flag for click-through overlay
            self.overlay_root.setFlag(Qt.WindowTransparentForInput, True)
    def center_overlay(self):
        """Calculates and sets the Overlay position above the taskbar."""
@@ -812,19 +869,23 @@ class WhisperApp(QObject):
        self.bridge.update_status("Error")
        logging.error(f"Download Error: {err}")
    def _update_overlay_state(self, is_active):
        """Update overlay visibility and input handling based on active state."""
        if hasattr(self, 'window_hook'):
            self.window_hook.set_enabled(is_active)
        elif sys.platform == 'linux' and self.overlay_root:
            self.overlay_root.setFlag(Qt.WindowTransparentForInput, not is_active)
    @Slot(bool)
    def on_ui_toggle_request(self, is_recording):
        """Called when recording state changes."""
        # Update Window Hook to allow clicking if active
        is_active = is_recording or self.bridge.isProcessing
-        if hasattr(self, 'window_hook'):
+        self._update_overlay_state(is_active)
            self.window_hook.set_enabled(is_active)
    @Slot(bool)
    def on_processing_changed(self, is_processing):
        is_active = self.bridge.isRecording or is_processing
-        if hasattr(self, 'window_hook'):
+        self._update_overlay_state(is_active)
            self.window_hook.set_enabled(is_active)
 if __name__ == "__main__":
    import sys