feat: use ollama to cleanup context window

author: Pinapelz <yukais@pinapelz.com> 2026-04-26 20:55:53 -0700
committer: Pinapelz <yukais@pinapelz.com> 2026-04-26 21:02:29 -0700
commit: 58c5449a35c51d9edea0fedacec964a9e5196e8f (patch)
tree: d549f9004ccddd9e1829380144fee52ecbba4d73 /gui.py
parent: 1ff76ea759b966bc7683fcaff17314788687c950 (diff)
1 files changed, 81 insertions, 33 deletions
diff --git a/gui.py b/gui.py
index aece888..7425567 100644
--- a/gui.py
+++ b/gui.py
@@ -20,16 +20,21 @@ def select_settings(
         return settings.get(key, default_settings.get(key, fallback))
 
     root = tk.Tk()
-    root.title("Audio & Whisper Settings")
+    root.title("Settings")
     root.resizable(False, False)
 
-    frame = ttk.Frame(root, padding=10)
-    frame.pack(fill="both", expand=True)
-    frame.columnconfigure(1, weight=1)
+    notebook = ttk.Notebook(root)
+    notebook.pack(fill="both", expand=True, padx=10, pady=(10, 0))
 
-    def add_row(row: int, label_text: str, widget: tk.Widget) -> None:
-        label = ttk.Label(frame, text=label_text)
-        label.grid(row=row, column=0, sticky="w", pady=4)
+    # ------------------------------------------------------------------ #
+    # Tab 1 – Whisper                                                      #
+    # ------------------------------------------------------------------ #
+    whisper_tab = ttk.Frame(notebook, padding=10)
+    whisper_tab.columnconfigure(1, weight=1)
+    notebook.add(whisper_tab, text="Whisper")
+
+    def add_row(parent: ttk.Frame, row: int, label_text: str, widget: tk.Widget) -> None:
+        ttk.Label(parent, text=label_text).grid(row=row, column=0, sticky="w", pady=4, padx=(0, 12))
         widget.grid(row=row, column=1, sticky="ew", pady=4)
 
     device_options = [
@@ -37,70 +42,92 @@ def select_settings(
         for idx, dev in input_devices
     ]
     device_names = [dev["name"] for _idx, dev in input_devices]
-    device_combo = ttk.Combobox(frame, values=device_options, state="readonly", width=60)
-
+    device_combo = ttk.Combobox(whisper_tab, values=device_options, state="readonly", width=60)
     default_device_name = get_value("audio_device_name", "")
     if default_device_name in device_names:
         device_combo.current(device_names.index(default_device_name))
     else:
         device_combo.current(0)
-    add_row(0, "Audio input device:", device_combo)
+    add_row(whisper_tab, 0, "Audio input device:", device_combo)
 
     model_var = tk.StringVar(value=get_value("model_name", "medium"))
-    model_combo = ttk.Combobox(frame, values=list(model_choices), textvariable=model_var)
+    model_combo = ttk.Combobox(whisper_tab, values=list(model_choices), textvariable=model_var)
     model_combo.set(model_var.get())
-    add_row(1, "Model:", model_combo)
+    add_row(whisper_tab, 1, "Model:", model_combo)
 
     device_type_var = tk.StringVar(value=get_value("device", "cpu"))
     device_type_combo = ttk.Combobox(
-        frame, values=list(device_choices), textvariable=device_type_var, state="readonly"
+        whisper_tab, values=list(device_choices), textvariable=device_type_var, state="readonly"
     )
     device_type_combo.set(device_type_var.get())
-    add_row(2, "Compute device:", device_type_combo)
+    add_row(whisper_tab, 2, "Compute device:", device_type_combo)
 
     compute_type_var = tk.StringVar(value=get_value("compute_type", "int8"))
-    compute_type_combo = ttk.Combobox(
-        frame, values=list(compute_choices), textvariable=compute_type_var
-    )
+    compute_type_combo = ttk.Combobox(whisper_tab, values=list(compute_choices), textvariable=compute_type_var)
     compute_type_combo.set(compute_type_var.get())
-    add_row(3, "Compute type:", compute_type_combo)
+    add_row(whisper_tab, 3, "Compute type:", compute_type_combo)
 
     task_var = tk.StringVar(value=get_value("task", "translate"))
-    task_combo = ttk.Combobox(frame, values=list(task_choices), textvariable=task_var, state="readonly")
+    task_combo = ttk.Combobox(whisper_tab, values=list(task_choices), textvariable=task_var, state="readonly")
     task_combo.set(task_var.get())
-    add_row(4, "Task:", task_combo)
+    add_row(whisper_tab, 4, "Task:", task_combo)
 
     beam_size_var = tk.StringVar(value=str(get_value("beam_size", 3)))
-    beam_entry = ttk.Entry(frame, textvariable=beam_size_var, width=10)
-    add_row(5, "Beam size:", beam_entry)
+    add_row(whisper_tab, 5, "Beam size:", ttk.Entry(whisper_tab, textvariable=beam_size_var, width=10))
 
     language_var = tk.StringVar(value=get_value("language", ""))
-    language_entry = ttk.Entry(frame, textvariable=language_var)
-    add_row(6, "Language (optional):", language_entry)
+    add_row(whisper_tab, 6, "Language (optional):", ttk.Entry(whisper_tab, textvariable=language_var))
 
     context_seconds_var = tk.StringVar(value=str(get_value("context_seconds", 10)))
-    context_entry = ttk.Entry(frame, textvariable=context_seconds_var, width=10)
-    add_row(7, "Context seconds:", context_entry)
+    add_row(whisper_tab, 7, "Context seconds:", ttk.Entry(whisper_tab, textvariable=context_seconds_var, width=10))
 
     update_interval_var = tk.StringVar(value=str(get_value("update_interval_seconds", 2)))
-    update_interval_entry = ttk.Entry(frame, textvariable=update_interval_var, width=10)
-    add_row(8, "Update interval (s):", update_interval_entry)
+    add_row(whisper_tab, 8, "Update interval (s):", ttk.Entry(whisper_tab, textvariable=update_interval_var, width=10))
+
+    # ------------------------------------------------------------------ #
+    # Tab 2 – Ollama                                                       #
+    # ------------------------------------------------------------------ #
+    ollama_tab = ttk.Frame(notebook, padding=10)
+    ollama_tab.columnconfigure(1, weight=1)
+    notebook.add(ollama_tab, text="Ollama")
+
+    use_ollama_cleanup_var = tk.BooleanVar(value=get_value("use_ollama_cleanup", True))
+    add_row(ollama_tab, 0, "LLM subtitle cleanup:", ttk.Checkbutton(ollama_tab, variable=use_ollama_cleanup_var))
+
+    ollama_device_var = tk.StringVar(value=get_value("ollama_device", "CPU"))
+    ollama_device_combo = ttk.Combobox(
+        ollama_tab, values=["CPU", "GPU"], textvariable=ollama_device_var, state="readonly", width=10
+    )
+    ollama_device_combo.set(ollama_device_var.get())
+    add_row(ollama_tab, 1, "Ollama compute:", ollama_device_combo)
 
-    button_frame = ttk.Frame(root, padding=(10, 0, 10, 10))
+    ollama_context_var = tk.StringVar(value=str(get_value("ollama_context_window", 6)))
+    add_row(ollama_tab, 2, "Context window (segments):", ttk.Entry(ollama_tab, textvariable=ollama_context_var, width=10))
+
+    ollama_batch_var = tk.StringVar(value=str(get_value("ollama_raw_batch_size", 3)))
+    add_row(ollama_tab, 3, "Batch size (lines per LLM call):", ttk.Entry(ollama_tab, textvariable=ollama_batch_var, width=10))
+
+    # ------------------------------------------------------------------ #
+    # Buttons                                                              #
+    # ------------------------------------------------------------------ #
+    button_frame = ttk.Frame(root, padding=(10, 6, 10, 10))
     button_frame.pack(fill="x")
 
     selected_settings: Dict[str, Any] = {}
 
     def on_ok() -> None:
         nonlocal selected_settings
+
         selection = device_combo.current()
         if selection < 0:
             messagebox.showwarning("Select a device", "Please select an audio input device.")
             return
+
         model_name = model_var.get().strip()
         if not model_name:
             messagebox.showwarning("Model required", "Please select or enter a model name.")
             return
+
         try:
             beam_size = int(beam_size_var.get().strip())
             if beam_size <= 0:
@@ -108,6 +135,7 @@ def select_settings(
         except ValueError:
             messagebox.showwarning("Invalid beam size", "Beam size must be a positive integer.")
             return
+
         try:
             context_seconds = float(context_seconds_var.get().strip())
             if context_seconds <= 0:
@@ -115,15 +143,31 @@ def select_settings(
         except ValueError:
             messagebox.showwarning("Invalid context seconds", "Context seconds must be a positive number.")
             return
+
         try:
             update_interval_seconds = float(update_interval_var.get().strip())
             if update_interval_seconds <= 0:
                 raise ValueError
         except ValueError:
-            messagebox.showwarning(
-                "Invalid update interval", "Update interval must be a positive number."
-            )
+            messagebox.showwarning("Invalid update interval", "Update interval must be a positive number.")
+            return
+
+        try:
+            ollama_context_window = int(ollama_context_var.get().strip())
+            if ollama_context_window <= 0:
+                raise ValueError
+        except ValueError:
+            messagebox.showwarning("Invalid context window", "Context window must be a positive integer.")
             return
+
+        try:
+            ollama_raw_batch_size = int(ollama_batch_var.get().strip())
+            if ollama_raw_batch_size <= 0:
+                raise ValueError
+        except ValueError:
+            messagebox.showwarning("Invalid batch size", "Batch size must be a positive integer.")
+            return
+
         selected_settings = {
             "audio_device_name": device_names[selection],
             "model_name": model_name,
@@ -134,6 +178,10 @@ def select_settings(
             "language": language_var.get().strip(),
             "context_seconds": context_seconds,
             "update_interval_seconds": update_interval_seconds,
+            "use_ollama_cleanup": use_ollama_cleanup_var.get(),
+            "ollama_device": ollama_device_var.get(),
+            "ollama_context_window": ollama_context_window,
+            "ollama_raw_batch_size": ollama_raw_batch_size,
         }
         root.quit()
 
@@ -185,4 +233,4 @@ def prompt_input_sample_rate(device_index: int, common_rates: Iterable[int] | No
                     parent=root,
                 )
     finally:
-        root.destroy()
-\ No newline at end of file
+        root.destroy()
author	Pinapelz <yukais@pinapelz.com>	2026-04-26 20:55:53 -0700
committer	Pinapelz <yukais@pinapelz.com>	2026-04-26 21:02:29 -0700
commit	58c5449a35c51d9edea0fedacec964a9e5196e8f (patch)
tree	d549f9004ccddd9e1829380144fee52ecbba4d73 /gui.py
parent	1ff76ea759b966bc7683fcaff17314788687c950 (diff)