aboutsummaryrefslogtreecommitdiffstats
path: root/config.py
diff options
context:
space:
mode:
authorPinapelz <yukais@pinapelz.com>2026-04-26 21:31:26 -0700
committerPinapelz <yukais@pinapelz.com>2026-04-26 21:31:26 -0700
commitc545916ac1bba20112a98c3a75b3280b3042186e (patch)
treedffa3e18c5bdf67e00f996b13ee121dbc2edc691 /config.py
parentf31cfc228319199ae808cb3cfbffd94d2003a31c (diff)
add filtering for common whisper hallucination words
Diffstat (limited to 'config.py')
-rw-r--r--config.py34
1 files changed, 34 insertions, 0 deletions
diff --git a/config.py b/config.py
index 1101085..676e8e1 100644
--- a/config.py
+++ b/config.py
@@ -22,3 +22,37 @@ _SYSTEM_PROMPT: str = (
" output an empty string and nothing else.\n"
" 7. Output ONLY the final subtitle text. No labels, no explanations."
)
+
+_LLM_EMPTY_SENTINELS: frozenset = frozenset({
+ "empty string", "empty", "(empty)", "[empty]",
+ "(empty string)", "[empty string]", "(none)", "none", "n/a",
+})
+
+_HALLUCINATION_PHRASES: frozenset = frozenset({
+ "empty string",
+ "thank you for watching",
+ "thanks for watching",
+ "thank you for watching this video",
+ "thanks for watching this video",
+ "thank you for watching and ill see you next time",
+ "thank you for watching ill see you in the next video",
+ "thanks for watching ill see you next time",
+ "thank you so much for watching",
+ "thanks for watching and ill see you in the next one",
+ "see you next time",
+ "see you in the next video",
+ "ill see you in the next video",
+ "ill see you next time",
+ "see you later",
+ "bye bye",
+ "please subscribe",
+ "like and subscribe",
+ "dont forget to like and subscribe",
+ "please like and subscribe",
+ "subscribe to my channel",
+ "if you enjoyed this video please like and subscribe",
+ "you",
+ "uh",
+ "um",
+ "hmm",
+})
send patches to the email below
yukais@pinapelz.com
include the subject [PATCH repo_name]
pinapelz.com
homepage