diff options
| author | Pinapelz <yukais@pinapelz.com> | 2026-04-26 21:31:26 -0700 |
|---|---|---|
| committer | Pinapelz <yukais@pinapelz.com> | 2026-04-26 21:31:26 -0700 |
| commit | c545916ac1bba20112a98c3a75b3280b3042186e (patch) | |
| tree | dffa3e18c5bdf67e00f996b13ee121dbc2edc691 /config.py | |
| parent | f31cfc228319199ae808cb3cfbffd94d2003a31c (diff) | |
add filtering for common whisper hallucination words
Diffstat (limited to 'config.py')
| -rw-r--r-- | config.py | 34 |
1 files changed, 34 insertions, 0 deletions
@@ -22,3 +22,37 @@ _SYSTEM_PROMPT: str = ( " output an empty string and nothing else.\n" " 7. Output ONLY the final subtitle text. No labels, no explanations." ) + +_LLM_EMPTY_SENTINELS: frozenset = frozenset({ + "empty string", "empty", "(empty)", "[empty]", + "(empty string)", "[empty string]", "(none)", "none", "n/a", +}) + +_HALLUCINATION_PHRASES: frozenset = frozenset({ + "empty string", + "thank you for watching", + "thanks for watching", + "thank you for watching this video", + "thanks for watching this video", + "thank you for watching and ill see you next time", + "thank you for watching ill see you in the next video", + "thanks for watching ill see you next time", + "thank you so much for watching", + "thanks for watching and ill see you in the next one", + "see you next time", + "see you in the next video", + "ill see you in the next video", + "ill see you next time", + "see you later", + "bye bye", + "please subscribe", + "like and subscribe", + "dont forget to like and subscribe", + "please like and subscribe", + "subscribe to my channel", + "if you enjoyed this video please like and subscribe", + "you", + "uh", + "um", + "hmm", +}) |
